Add new python scripts.

AlbertaBeef · AlbertaBeef · commit 09e8e26be0a6 · 2023-01-27T11:37:03.000-05:00
diff --git a/app/asl_classify_files.py b/app/asl_classify_files.py
@@ -0,0 +1,215 @@
+'''
+Copyright 2023 Avnet Inc.
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+    http://www.apache.org/licenses/LICENSE-2.0
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+'''
+
+from ctypes import *
+from typing import List
+import cv2
+import numpy as np
+import vart
+import os
+import pathlib
+import xir
+import threading
+import time
+import sys
+import argparse
+
+divider = '------------------------------------'
+
+def preprocess_fn(image_path, fix_scale):
+    '''
+    Image pre-processing: load the file, rearrange from BGR to RGB, multiply
+    by the input quantization scaling factor and cast to int8.
+    (The pixel values are NOT divided by 255 before the scaling.)
+    input args: path of image file, input scaling factor
+    return: int8 numpy array; ValueError is raised if the file is unreadable
+    '''
+    image = cv2.imread(image_path)
+    if image is None:  # cv2.imread returns None instead of raising
+        raise ValueError('Cannot read image file: %s' % image_path)
+    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+    return (image * fix_scale).astype(np.int8)
+
+
+def get_child_subgraph_dpu(graph: "Graph") -> List["Subgraph"]:
+    '''Return the child subgraphs whose "device" attribute is DPU (any case).'''
+    assert graph is not None, "'graph' should not be None."
+    root = graph.get_root_subgraph()
+    assert (root is not None), "Failed to get root subgraph of input Graph object."
+    if root.is_leaf:
+        return []
+    # children keep the order returned by toposort_child_subgraph()
+    children = root.toposort_child_subgraph()
+    assert children is not None and len(children) > 0
+    def on_dpu(subgraph):
+        return subgraph.has_attr("device") and subgraph.get_attr("device").upper() == "DPU"
+    return list(filter(on_dpu, children))
+
+
+def runDPU(id,start,dpu,img):
+    '''
+    Classify a list of pre-processed images on one DPU runner.
+    Batches are submitted with execute_async(); once 49 jobs are queued, or
+    all images are submitted, every queued job is waited on and the argmax
+    of each output vector is written to the global list out_q.
+    input args: id    - thread number (not used)
+                start - index in out_q of the result for img[0]
+                dpu   - runner object (get_input_tensors, get_output_tensors,
+                        execute_async and wait are called on it)
+                img   - list of image arrays, one per input sample
+    return: None
+    '''
+
+    in_shape = tuple(dpu.get_input_tensors()[0].dims)
+    out_shape = tuple(dpu.get_output_tensors()[0].dims)
+    batch_size = in_shape[0]      # first dimension is taken as the batch size
+    total = len(img)
+    max_jobs = 50
+
+    # one output buffer per job slot; output scaling is not needed because
+    # argmax is used instead of softmax
+    out_bufs = [[np.empty(out_shape, dtype=np.int8, order="C")]
+                for _ in range(max_jobs)]
+
+    pending = []                  # (job id, images in job, first out_q index)
+    done = 0                      # number of images submitted so far
+    while done < total:
+        # the last batch may be only partly filled
+        n_run = min(batch_size, total - done)
+
+        # new input buffer for each job; rows past n_run stay uninitialised
+        batch = np.empty(in_shape, dtype=np.int8, order="C")
+        for row in range(n_run):
+            batch[row, ...] = img[done + row].reshape(in_shape[1:])
+
+        job_id = dpu.execute_async([batch], out_bufs[len(pending)])
+        pending.append((job_id, n_run, start + done))
+        done += n_run
+
+        # keep submitting while images remain and job slots are free
+        if done < total and len(pending) < max_jobs - 1:
+            continue
+
+        # wait for the queued jobs in submission order and store the results
+        for slot, (queued_id, n_images, first) in enumerate(pending):
+            dpu.wait(queued_id)
+            for row in range(n_images):
+                # predicted class = index of the largest output value
+                out_q[first + row] = np.argmax(out_bufs[slot][0][row])
+        pending = []
+
+
+def app(image_dir,threads,model):
+    '''
+    Classify all images of a folder on the DPU; print throughput/accuracy.
+    input args: image_dir - folder of test images; the class index is the
+                            second-to-last '_' field (test0174_2_C.png -> 2)
+                threads   - number of threads, one DPU runner each (>= 1)
+                model     - path of the xmodel file
+    return: None; ValueError is raised if threads is smaller than 1
+    '''
+    global out_q              # runDPU() stores its predictions in this list
+    if threads < 1:
+        raise ValueError('threads must be at least 1')
+    listimage=os.listdir(image_dir)
+    runTotal = len(listimage)
+    if runTotal == 0:
+        # an empty folder would end in a division by zero in the accuracy
+        print('[ERROR] No images found in',image_dir)
+        return
+    out_q = [None] * runTotal
+    g = xir.Graph.deserialize(model)
+    subgraphs = get_child_subgraph_dpu(g)
+    # one runner per thread, all created from the first DPU subgraph
+    all_dpu_runners = [vart.Runner.create_runner(subgraphs[0], "run")
+                       for _ in range(threads)]
+
+    # input scaling
+    input_fixpos = all_dpu_runners[0].get_input_tensors()[0].get_attr("fix_point")
+    input_scale = 2**input_fixpos
+    print('[INFO] fix_point = ',input_fixpos)
+    print('[INFO] input_scale = ',input_scale)
+
+    # preprocess images
+    print (divider)
+    print('Pre-processing',runTotal,'images...')
+    img = [preprocess_fn(os.path.join(image_dir,name), input_scale)
+           for name in listimage]
+
+    # run threads
+    print('Starting',threads,'threads...')
+    threadAll = []
+    start=0
+    for i in range(threads):
+        # equal shares; the last thread also takes the remainder
+        if (i==threads-1):
+            end = len(img)
+        else:
+            end = start+(len(img)//threads)
+        in_q = img[start:end]
+        t1 = threading.Thread(target=runDPU, args=(i,start,all_dpu_runners[i], in_q))
+        threadAll.append(t1)
+        start=end
+
+    # only the time between starting and joining the threads is measured
+    time1 = time.time()
+    for x in threadAll:
+        x.start()
+    for x in threadAll:
+        x.join()
+    timetotal = time.time() - time1
+
+    fps = float(runTotal / timetotal)
+    print (divider)
+    print("Throughput=%.2f fps, total frames = %.0f, time=%.4f seconds" %(fps, runTotal, timetotal))
+
+    # post-processing
+    classes = ['A','B','C','D','E','F','G','H','I','J','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z','del','nothing','space']
+    correct = 0
+    wrong = 0
+    print('Post-processing',len(out_q),'test images..')
+    for name, prediction in zip(listimage, out_q):
+        # 'test0174_2_C.png' -> ['test0174', '2', 'C.png'] -> 2
+        ground_truth = int(name.split('_')[-2])
+        if (ground_truth==prediction):
+            correct += 1
+        else:
+            wrong += 1
+            print(name,classes[ground_truth],'=>',classes[prediction])
+    accuracy = correct/len(out_q)
+    print('Correct:%d, Wrong:%d, Accuracy:%.4f' %(correct,wrong,accuracy))
+    print (divider)
+
+
+
+# only used if script is run as 'main' from command line
+def main():
+    '''Parse the command line options, print them and run app().'''
+    parser = argparse.ArgumentParser()
+    parser.add_argument('-d', '--image_dir', type=str, default='test-images',
+                        help='Path to folder of test images. Default is test-images')
+    parser.add_argument('-t', '--threads', type=int, default=1,
+                        help='Number of threads. Default is 1')
+    parser.add_argument('-m', '--model', type=str, default='asl_classifier.xmodel',
+                        help='Path of xmodel. Default is asl_classifier.xmodel')
+    options = parser.parse_args()
+
+    print ('Command line options:')
+    print (' --image_dir : ', options.image_dir)
+    print (' --threads   : ', options.threads)
+    print (' --model     : ', options.model)
+    app(options.image_dir, options.threads, options.model)
+
+if __name__ == '__main__':
+  main()
+
diff --git a/app/asl_classify_live.py b/app/asl_classify_live.py
@@ -1,3 +1,15 @@
+'''
+Copyright 2023 Avnet Inc.
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+    http://www.apache.org/licenses/LICENSE-2.0
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+'''
 #
 # ASL Classification (live with USB camera)
 #
@@ -47,16 +59,16 @@ def get_video_dev_by_name(src):
             if src in line:
                 return dev
 
-def detect_dpu_architecture():
-    proc = subprocess.run(['xdputil','query'], capture_output=True, encoding='utf8')
-    for line in proc.stdout.splitlines():
-        if 'DPU Arch' in line:
-            #                 "DPU Arch":"DPUCZDX8G_ISA0_B128_01000020E2012208",
-            #dpu_arch = re.search('DPUCZDX8G_ISA0_(.+?)_', line).group(1)  
-            #                 "DPU Arch":"DPUCZDX8G_ISA1_B2304",
-            #dpu_arch = re.search('DPUCZDX8G_ISA1_(.+?)', line).group(1)
-            dpu_arch = "B2304"
-            return dpu_arch
+# ...work in progress ...
+#def detect_dpu_architecture():
+#    proc = subprocess.run(['xdputil','query'], capture_output=True, encoding='utf8')
+#    for line in proc.stdout.splitlines():
+#        if 'DPU Arch' in line:
+#            #                 "DPU Arch":"DPUCZDX8G_ISA0_B128_01000020E2012208",
+#            #dpu_arch = re.search('DPUCZDX8G_ISA0_(.+?)_', line).group(1)  
+#            #                 "DPU Arch":"DPUCZDX8G_ISA1_B2304",
+#            #dpu_arch = re.search('DPUCZDX8G_ISA1_(.+?)', line).group(1)
+#            return dpu_arch
 
 # Parameters (tweaked for video)
 scale = 1.0
@@ -76,7 +88,10 @@ def detect_dpu_architecture():
 input_video = dev_video  
 print("[INFO] Input Video : ",input_video)
 
-displayReference = True
+# Folder in which the captured images are written
+output_dir = './captured-images'
+# Create the output directory if it doesn't already exist (no check-then-create race)
+os.makedirs(output_dir, exist_ok=True)
 
 cv2.namedWindow('ASL Classification')
 
@@ -158,11 +173,22 @@ def TopK(datain, size, filePath):
                 print("Top[%d] %d %s" % (i, idx, (line.strip)("\n")))
             idx = idx + 1
 
-dpu_arch = detect_dpu_architecture()
-print('[INFO] Detected DPU architecture : ',dpu_arch)
+# construct the argument parser and parse the arguments
+ap = argparse.ArgumentParser()  
+ap.add_argument('-m', '--model',     type=str, default='asl_classifier.xmodel', help='Path of xmodel. Default is asl_classifier.xmodel')
+
+args = ap.parse_args()  
+  
+print ('Command line options:')
+print (' --model     : ', args.model)
+
+#dpu_arch = detect_dpu_architecture()
+#print('[INFO] Detected DPU architecture : ',dpu_arch)
+#
+#model_path = './model_1/'+dpu_arch+'/asl_classifier_1.xmodel'
+#print('[INFO] ASL model : ',model_path)
+model_path = args.model
 
-model_path = './model_1/'+dpu_arch+'/asl_classifier_1.xmodel'
-print('[INFO] ASL model : ',model_path)
 
 # Create DPU runner
 g = xir.Graph.deserialize(model_path)
@@ -255,11 +281,26 @@ def TopK(datain, size, filePath):
             output = image.copy()
             
             asl_id = -1
-            #try:
-            if True:
+            try:
+                # 448x448 ROI for classification
+                #y1 = (16)
+                #y2 = (16+448)
+                #x1 = (96)
+                #x2 = (96+448)
+                #roi_img = output[ y1:y2, x1:x2, : ]
+                #roi_img = cv2.resize(asl_img,(224,224),interpolation=cv2.INTER_CUBIC)
+            
+                # 224x224 ROI for classification
+                y1 = (128)
+                y2 = (128+224)
+                x1 = (208)
+                x2 = (208+224)
+                roi_img = output[ y1:y2, x1:x2, : ]
+                
+                cv2.rectangle(output, (x1,y1), (x2,y2), (0, 255, 0), 2)
+
                 # ASL pre-processing
-                asl_img = cv2.resize(image,(224,224),interpolation=cv2.INTER_CUBIC)
-                asl_img = cv2.cvtColor(asl_img, cv2.COLOR_BGR2RGB)
+                asl_img = cv2.cvtColor(roi_img, cv2.COLOR_BGR2RGB)
                 asl_img = asl_img*input_scale
                 asl_img = asl_img.astype(np.int8)
                 #cv2.imshow('asl_img',asl_img)
@@ -298,8 +339,8 @@ def TopK(datain, size, filePath):
                 asl_text = '['+str(asl_id)+']='+asl_sign
                 cv2.putText(output,asl_text,(10,30),text_fontType,text_fontSize,text_color,text_lineSize,text_lineType)
                         
-            #except:
-            #    print("ERROR : Exception occured during ASL classification ...")
+            except Exception as e:  # not a bare except: Ctrl-C / SystemExit still propagate
+                print("ERROR : Exception occured during ASL classification ...", e)
 
                          
             matching_text = ("[%04d] [%02d]=%s"%(frame_count,asl_id,asl_sign))
@@ -325,7 +366,7 @@ def TopK(datain, size, filePath):
         filename = ("frame%04d_asl%02d.tif"%(frame_count,asl_id))
             
         print("Capturing ",filename," ...")
-        cv2.imwrite(os.path.join(output_dir,filename),asl_img)
+        cv2.imwrite(os.path.join(output_dir,filename),roi_img)
        
     if key == 115: # 's'
         step = True    
@@ -337,7 +378,7 @@ def TopK(datain, size, filePath):
         step = False
         pause = False
 
-    if key == 27:
+    if key == 27 or key == 113: # ESC or 'q':
         break
 
     # Update the real-time FPS counter
diff --git a/asl-classifier-transferlearning-tf2-deployment-dpu.ipynb b/asl-classifier-transferlearning-tf2-deployment-dpu.ipynb