VisionProcessing/image_processor.py at master · team3238/VisionProcessing · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
#!/usr/bin/python
#Team3238 Cyborg Ferrets 2014 Object Detection Code
#Start with
#python image_processor.py 'path/to/image.jpg'
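#The class reads from the VideoCapture(0) stream when img_path is None, but the __main__ block at the bottom currently prints a hint and exits when no image argument is given.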
# Video capture mode updates the frame to process every video_pause milliseconds, so adjust that.
#set enable_dashboard = True to send range and bearing over smart dashboard network_tables interface.
#set show_windows     = False for on-robot, no monitor processing on pandaboard.

#This code is a merge of vision_lib.py, bearing_formula.py, distance_formula.py and team341 java vision detection code from (2012?) competition.

#java -jar SmartDashboard ip 127.0.0.1, for example, will start the dashboard if running on this same host.
#Now tuned for green leds.
#expected camera settings (sorry no numbers on camera interface.)
# exposure -> far right
# gain -> far left
# brightness ~ 20% from left
# contrast ~ 20% from left
# color intensity ~ 18% from left


#yavta -l /dev/video0
#control 0x00980900 `Brightness' min 0 max 255 step 1 default 128 current 128.
#control 0x00980901 `Contrast' min 0 max 255 step 1 default 32 current 32.
#control 0x00980902 `Saturation' min 0 max 255 step 1 default 32 current 32.
#control 0x0098090c `White Balance Temperature, Auto' min 0 max 1 step 1 default 1 current 1.
#control 0x00980913 `Gain' min 0 max 255 step 1 default 0 current 0.
#control 0x00980918 `Power Line Frequency' min 0 max 2 step 1 default 2 current 2.
#  0: Disabled
#  1: 50 Hz
#  2: 60 Hz (*)
#control 0x0098091a `White Balance Temperature' min 0 max 10000 step 10 default 4000 current 10000.
#control 0x0098091b `Sharpness' min 0 max 255 step 1 default 53 current 53.
#control 0x0098091c `Backlight Compensation' min 0 max 1 step 1 default 0 current 0.
#control 0x009a0901 `Exposure, Auto' min 0 max 3 step 1 default 3 current 1.
#  1: Manual Mode (*)
#  3: Aperture Priority Mode
#control 0x009a0902 `Exposure (Absolute)' min 1 max 10000 step 1 default 166 current 10.
#control 0x009a0903 `Exposure, Auto Priority' min 0 max 1 step 1 default 0 current 1.
#12 controls found.


#Runtime switches:
#  enable_dashboard - publish values over the SmartDashboard / network tables interface.
#  show_windows     - open the OpenCV preview windows (leave False when no monitor is attached).
enable_dashboard = True
show_windows     = False

#Preview windows show a 640x480 frame shrunk by window_scale.
window_scale = 0.5
window_size = tuple(int(side*window_scale) for side in (640, 480))

from cv2 import *
import numpy as np
import sys
import math
import commands

#Connect to the network tables server as a client and start the SmartDashboard
#interface; skipped entirely when the dashboard is disabled.
if enable_dashboard:
  from pynetworktables import *

  ip = '10.32.38.2'
  NetworkTable.SetIPAddress(ip)
  NetworkTable.SetClientMode()
  NetworkTable.Initialize()
  SmartDashboard.init()

#SmartDashboard keys that ImageProcessor.process() writes and reads back, so a
#dashboard user can change the exposure/gain or request a saved frame.
camera_exposure_title = 'Camera Exposure:'
camera_gain_title     = 'Camera Gain:'
save_frame_title      = 'SaveFrame:'

class ImageProcessor:
  """Finds lit targets in a camera frame or still image and reports range and bearing.

  The values below are class-level defaults. Several of them (thresholds,
  exposure, gain, save_frame) are overwritten on the instance at run time by
  trackbar callbacks or by values read back from the SmartDashboard.
  """
  #all these values could be put into the SmartDashboard for live tuning as conditions change.

  #counts process() passes; the dashboard defaults are re-sent while this is below 20.
  process_loop_count = 0
  #blank rows x cols x channels placeholders used until a real frame has been read.
  default_shape   = (480,640,3)
  h               = np.zeros(default_shape, dtype=np.uint8)
  s               = np.zeros(default_shape, dtype=np.uint8)
  v               = np.zeros(default_shape, dtype=np.uint8)
  combined        = np.zeros(default_shape, dtype=np.uint8)
  img             = np.zeros(default_shape, dtype=np.uint8)
  #window titles for the preview windows.
  h_title         = "hue"
  s_title         = "sat"
  v_title         = "val"
  combined_title  = "Combined + Morphed"
  targets_title   = "Targets"

  #for video capture mode, what approx frame rate do we want? frame rate = approx video_pause + processing time
  video_pause     =  1 #0 milliseconds means wait for key press, waitKey takes an integer so 1 millisecond is minimal with this approach.

  #tuned for the camera settings above and the green leds. (Red didn't work as well and requires changing the threshold function to use OR of inverse and normal threshold, because red is on the top and bottom of the hue scale (wraps around.).)
  #each low/high pair below is center -/+ delta.
  hue_delta                   = 15
  sat_delta                   = 25
  val_delta                   = 100
  hue_thresh      = 80
  sat_thresh      = 233
  val_thresh      = 212
  hue_low_thresh  = hue_thresh - hue_delta #center on 80, delta as previous
  hue_high_thresh = hue_thresh + hue_delta
  sat_low_thresh  = sat_thresh - sat_delta #center on 233, delta as previous
  sat_high_thresh = sat_thresh + sat_delta
  val_low_thresh  = val_thresh - val_delta # center on 212, delta as previous
  val_high_thresh = val_thresh + val_delta #evaluates to 312, which is above max_thresh.
  max_thresh      = 255 #value written into the binary masks and upper limit of the trackbars.

  #used for the morphologyEx method that fills in the pixels in the combined image prior to identifying polygons and contours.
  kernel     = getStructuringElement(MORPH_RECT, (2,2), anchor=(1,1))
  morph_close_iterations = 9

  #colors in BGR format for drawing the targets over the image.
  selected_target_color    = (0,0,255)
  passed_up_target_color   = (255,0,0)
  possible_target_color    = (0,255,0)

  #used to judge whether a polygon side is near vertical or near horizontal, for filtering out shapes that don't match expected target characteristics
  #both are slope magnitudes: within 20 degrees of vertical / within 20 degrees of horizontal.
  vert_threshold           = math.tan(math.radians(90-20))
  horiz_threshold          = math.tan(math.radians(20))

  #used to look for only horizontal or vertical rectangles of an aspect ratio that matches the targets.
  #currently open wide to find both horizontal and vertical targets
  #NOTE: aspect_ratio_and_size_correct() uses hard-coded limits; these two are only referenced in a commented-out line there.
  max_target_aspect_ratio  = 10 # 1.0 # top target is expected to be 24.5 in x 4 in.
  min_target_aspect_ratio  = 0.1 #0.01# 3# 0.5

  camera_exposure             = 20 #sent to the camera's 'Exposure (Absolute)' control by set_camera_settings().
  save_frame		      = False
  camera_gain                 = 0 #only published to the dashboard; the yavta gain command is commented out.
  robot_heading               = 0.0 #input from SmartDashboard if enabled, else hard coded here.
  x_resolution                = 640 #needs to match the camera.
  y_resolution                = 480
  #theta                      = math.radians(49.165) #half of field of view of the camera
#  field_of_view_degrees      = 53.0 horizontal field of view
  field_of_view_degrees       = 35 #26.4382 # vertical field of view
  theta                       = math.radians(field_of_view_degrees/2.0) #half of field of view of the camera, in radians to work with math.tan function.
# real_target_width           = 24.5 #inches #24 * 0.0254 #1 inch / 0.254 meters target is 24 inches wide
  real_target_height          = 28.5 #used by distance(); may not be correct for the current robot configuration. Presumably inches, like real_target_width above - TODO confirm.
  angle_to_shooter            = 0 #subtracted from the computed bearing in get_bearing().

  #not currently using these constants and may not be correct for current robot configuration.
  # target_min_width       = 20
  # target_max_width       = 200
  # degrees_horiz_field_of_view = 47.0
  # degrees_vert_field_of_view  = 480.0/640*degrees_horiz_field_of_view
  # inches_camera_height        = 54.0
  # inches_top_target_height    = 98 + 2 + 98
  # degrees_camera_pitch        = 21.0
  # degrees_sighting_offset     = -1.55

  def __init__(self, img_path):
    """Remember the image source, lay out the preview windows and open camera 0.

    img_path -- path of a still image to process repeatedly, or None to read
                frames from the camera instead.
    """
    self.img_path = img_path

    #Seed the preview windows with the blank class-level planes.
    hue_plane, sat_plane, val_plane = self.h, self.s, self.v
    self.layout_result_windows(hue_plane, sat_plane, val_plane)

    self.vc = VideoCapture(0)
    #Initial dashboard values are not pushed from here: the network_tables server
    #is usually not connected yet at this point. process() sends them instead.

  def video_feed(self):
    """Loop forever: process the current frame, then fetch the next one.

    The next frame comes from the camera when img_path is None, otherwise the
    image file is read again. A frame of None is skipped rather than processed.
    """
    while True:
      have_frame = self.img is not None
      if have_frame:
        self.process()

      if self.img_path is not None:
        self.img            = imread(self.img_path)
        continue

      #read() returns (success flag, frame); the frame might be None.
      grabbed, self.img     = self.vc.read()

  def set_camera_settings(self):
    """Push the exposure setting to /dev/video0 with yavta (camera mode only).

    Does nothing when a still image path is in use.
    """
    if self.img_path is not None:
      return

    #Control ids are from the `yavta -l` listing at the top of this file:
    #0x009a0901 is 'Exposure, Auto' (1 = manual mode), 0x009a0902 is 'Exposure (Absolute)'.
    manual_mode_cmd = " yavta --set-control '0x009a0901 1' /dev/video0"
    exposure_cmd    = "yavta --set-control '0x009a0902 %s' /dev/video0" % self.camera_exposure
    for shell_cmd in (manual_mode_cmd, exposure_cmd):
      commands.getoutput(shell_cmd)
    #The gain control (0x00980913) is deliberately not set here.


  def process(self):
    """Run one detection pass over the current frame in self.img.

    Refreshes the tunable settings from the SmartDashboard (when enabled),
    pushes changed camera settings to the camera, converts the frame to HSV,
    thresholds each plane into a mask and calls find_targets(). Exits the
    program with status 1 if waitKey reports that 'q' was pressed.
    """
    if enable_dashboard:
      self._sync_dashboard_settings()

    #The original statement was `self.set_camera_settings` without parentheses, which
    #only looked the method up and never ran it. It is called here, but only when the
    #requested values change, so the yavta commands are not re-run on every frame.
    requested_settings = (self.camera_exposure, self.camera_gain)
    if getattr(self, '_applied_camera_settings', None) != requested_settings:
      self.set_camera_settings()
      self._applied_camera_settings = requested_settings

    self.hsv               = cvtColor(self.img, cv.CV_BGR2HSV)
    self.h, self.s, self.v = split(self.hsv)
    self.h_clipped         = self.threshold_in_range(self.h, self.hue_low_thresh, self.hue_high_thresh)
    self.s_clipped         = self.threshold_in_range(self.s, self.sat_low_thresh, self.sat_high_thresh)
    self.v_clipped         = self.threshold_in_range(self.v, self.val_low_thresh, self.val_high_thresh)
    if show_windows:
      imshow(self.h_title, resize(self.h_clipped, window_size))
      imshow(self.s_title, resize(self.s_clipped, window_size))
      imshow(self.v_title, resize(self.v_clipped, window_size))

    self.find_targets()

    #waitKey also provides the pause between passes (video_pause milliseconds).
    if waitKey(self.video_pause) == ord('q'):
      sys.exit(1)

  def _sync_dashboard_settings(self):
    """Exchange save_frame, camera_exposure and camera_gain with the SmartDashboard."""
    #force initial values until smart dashboard server connects.
    if self.process_loop_count < 20:
      SmartDashboard.PutNumber(camera_exposure_title, self.camera_exposure)
      SmartDashboard.PutNumber(camera_gain_title, self.camera_gain)
      SmartDashboard.PutBoolean(save_frame_title, self.save_frame)
      self.process_loop_count +=1
    self.save_frame      = SmartDashboard.GetBoolean(save_frame_title)
    self.camera_exposure = int(SmartDashboard.GetNumber(camera_exposure_title))
    self.camera_gain     = int(SmartDashboard.GetNumber(camera_gain_title))

  def layout_result_windows(self, h, s, v):
    """Create the preview windows and the threshold trackbars.

    h, s, v -- images to show initially in the hue, sat and val windows.
    Does nothing unless show_windows is set.
    """
    if not show_windows:
      return

    #(window title, image) pairs, in the order the windows are first shown.
    panes = (
      (self.h_title,        h),
      (self.s_title,        s),
      (self.v_title,        v),
      (self.combined_title, self.combined),
      (self.targets_title,  self.img),
    )
    scaled_panes = [(title, resize(image, window_size)) for title, image in panes]
    for title, scaled_image in scaled_panes:
      imshow(title, scaled_image)

    #Window positions are left to the window manager (no moveWindow calls).

    #these seem to be placed alphabetically....
    sliders = (
      ("Hue High Threshold:", self.hue_high_thresh, self.update_hue_high_threshold),
      ("Hue Low Threshold:",  self.hue_low_thresh,  self.update_hue_low_threshold),
      ("Sat High Threshold:", self.sat_high_thresh, self.update_sat_high_threshold),
      ("Sat Low Threshold:",  self.sat_low_thresh,  self.update_sat_low_threshold),
      ("Val High Threshold:", self.val_high_thresh, self.update_val_high_threshold),
      ("Val Low Threshold:",  self.val_low_thresh,  self.update_val_low_threshold),
    )
    for label, start_value, on_change in sliders:
      createTrackbar(label, self.targets_title, start_value, self.max_thresh, on_change)

  def update_hue_high_threshold(self, thresh):
    """Trackbar callback: store thresh as the upper hue bound read by process()."""
    self.hue_high_thresh = thresh

  def update_hue_low_threshold(self, thresh):
    """Trackbar callback: store thresh as the lower hue bound read by process()."""
    self.hue_low_thresh = thresh

  def update_sat_high_threshold(self, thresh):
    """Trackbar callback: store thresh as the upper saturation bound read by process()."""
    self.sat_high_thresh = thresh

  def update_sat_low_threshold(self, thresh):
    """Trackbar callback: store thresh as the lower saturation bound read by process()."""
    self.sat_low_thresh = thresh

  def update_val_high_threshold(self, thresh):
    """Trackbar callback: store thresh as the upper value bound read by process()."""
    self.val_high_thresh = thresh

  def update_val_low_threshold(self, thresh):
    """Trackbar callback: store thresh as the lower value bound read by process()."""
    self.val_low_thresh = thresh

  def update_hue_threshold(self, thresh):
    """Re-threshold the hue plane around thresh, show it and re-run find_targets().

    The band is thresh -/+ hue_delta. The class-level hue_delta (15) replaces a
    duplicated literal so the two cannot drift apart.
    NOTE(review): no trackbar in this file is wired to this callback.
    """
    self.h_clipped = self.threshold_in_range(self.h, thresh-self.hue_delta, thresh+self.hue_delta)
    imshow(self.h_title, self.h_clipped)
    self.find_targets()

  def update_sat_threshold(self, thresh):
    """Re-threshold the saturation plane around thresh, show it and re-run find_targets().

    The band is thresh -/+ sat_delta. The class-level sat_delta (25) replaces a
    duplicated literal so the two cannot drift apart.
    NOTE(review): no trackbar in this file is wired to this callback.
    """
    self.s_clipped = self.threshold_in_range(self.s, thresh-self.sat_delta, thresh+self.sat_delta)
    imshow(self.s_title, self.s_clipped)
    self.find_targets()

  def update_val_threshold(self, thresh):
    """Re-threshold the value plane around thresh, show it and re-run find_targets().

    The band is thresh -/+ val_delta. The class-level val_delta (100) replaces a
    duplicated literal so the two cannot drift apart.
    NOTE(review): no trackbar in this file is wired to this callback.
    """
    self.v_clipped = self.threshold_in_range(self.v, thresh-self.val_delta, thresh+self.val_delta)
    imshow(self.v_title, self.v_clipped)
    self.find_targets()

  def threshold_in_range(self, img, low, high):
    """Return a binary mask of the pixels of img that fall between low and high.

    Two threshold() passes are ANDed together: THRESH_BINARY against low and
    THRESH_BINARY_INV against high. Pixels that pass both are set to max_thresh.
    """
    #threshold() returns (threshold used, mask); only the mask is needed.
    above_low  = threshold(img, low, self.max_thresh, THRESH_BINARY)[1]
    under_high = threshold(img, high, self.max_thresh, THRESH_BINARY_INV)[1]
    return bitwise_and(above_low, under_high)

  def find_targets(self):
    """Locate candidate targets in the current masks and publish the best one.

    ANDs the hue/sat/val masks, closes gaps with morphologyEx, extracts
    contours, keeps those whose bounding box passes the aspect-ratio filter,
    marks each candidate on self.drawing and aims at the selected one. When
    the dashboard is enabled it also reports the candidate count and saves
    the annotated frame on request.
    """
    self.reset_targeting()

    #combine all the masks together to get their overlapping regions.
    #(to ignore the hue channel while sorting out red hue matching around zero, AND only s_clipped and v_clipped.)
    self.combined = bitwise_and(self.h_clipped, bitwise_and(self.s_clipped, self.v_clipped))
    self.combined = morphologyEx(src=self.combined, op=MORPH_CLOSE, kernel=self.kernel, iterations=self.morph_close_iterations)
    if show_windows:
      imshow(self.combined_title, resize(self.combined, window_size))

    #Contours are extracted from a copy, presumably because older OpenCV releases
    #modify the image passed to findContours.
    self.contoured = self.combined.copy()
    #[-2] selects the contour list whether findContours returns two values or
    #three (OpenCV 3.x puts the image first).
    contours       = findContours(self.contoured, RETR_LIST, CHAIN_APPROX_TC89_KCOS)[-2]
    polygon_tuples = self.contours_to_polygon_tuples(contours)

    for polygon_tuple in polygon_tuples:
      self.mark_correct_shape_and_orientation(polygon_tuple)

    if self.selected_target is not None:
      self.draw_target(self.lowest_found_so_far_x, self.lowest_found_so_far, self.selected_target_color)
      selected_outline = self.unpack_polygon(self.selected_target).astype(np.int32)
      drawContours(self.drawing, [selected_outline], -1, self.selected_target_color, thickness=10)
      self.aim()

    if show_windows:
      imshow(self.targets_title, self.drawing)

    if enable_dashboard:
      SmartDashboard.PutNumber("Potential Targets:", len(polygon_tuples))
      if self.save_frame:
        #Clear the request first so one request saves exactly one frame.
        SmartDashboard.PutBoolean(save_frame_title, False)
        self.save_frame = False
        #The original wrote `drawing_scaled`, which is never assigned (its assignment
        #is commented out) and raised NameError; save the annotated frame instead.
        imwrite("pictures/CapturedFrame.jpg", self.drawing)

  def aim(self):
    """Compute bearing and range for self.selected_target and publish them.

    target_elevation is published as-is; nothing in this method computes it.
    """
    _, left, top, width, height = self.selected_target
    self.target_bearing   = self.get_bearing(left + width/2.0)
    self.target_range     = self.get_range(left, top, width, height)

    if not enable_dashboard:
      return

    readings = (
      ("Target Range:",    self.target_range),
      ("Target Bearing:",  self.target_bearing),
      ("Target Elevation:",self.target_elevation),
    )
    for title, reading in readings:
      SmartDashboard.PutNumber(title, reading)
    SmartDashboard.PutString("Target: ","Acquired!")


  def get_bearing(self, target_center_x):
    """Return the angle in degrees from the image center to target_center_x.

    target_center_x -- x pixel coordinate of the target's center.
    The pixel offset from the center column is scaled by degrees-per-pixel
    (field_of_view_degrees / x_resolution) and angle_to_shooter is subtracted.
    Negative results are left of center.

    NOTE(review): field_of_view_degrees is commented as the *vertical* field
    of view where it is defined, yet it is applied across the horizontal
    resolution here - confirm which value is intended.
    """
    #float() matters under Python 2: with the integer defaults 35/640 is 0,
    #which made every bearing equal to -angle_to_shooter.
    degrees_per_pixel  = float(self.field_of_view_degrees)/self.x_resolution
    offset_from_center = target_center_x - self.x_resolution/2.0
    return degrees_per_pixel*offset_from_center - self.angle_to_shooter

  def get_range(self, x, y, w, h):
    """Publish the target's bounding box (if the dashboard is on) and return its range.

    x, y, w, h -- bounding box of the target in pixels.
    The range comes from distance(), which uses only the height.
    """
    if enable_dashboard:
      box_readings = (("TargetWidth: ",w), ("TargetHeight",h), ("TargetX",x), ("TargetY",y))
      for title, pixels in box_readings:
        SmartDashboard.PutNumber(title, pixels)

    return self.distance(h)

  def distance(self, pix_height):
    """Estimate the distance to the target from its height in pixels.

    pix_height -- height of the target's bounding box in pixels (non-zero).
    Returns real_target_height*y_resolution / (2*pix_height*tan(theta)), in the
    same unit as real_target_height. theta is half the field of view.
    Raises ZeroDivisionError when pix_height is 0.
    """
    #The unused `fovr` intermediate from the original was dropped; it never
    #affected the result.
    return self.real_target_height*self.y_resolution/(2*pix_height*math.tan(self.theta))

  def reset_targeting(self):
    """Clear the previous pass's target state and start a fresh annotated frame."""
    if enable_dashboard:
      SmartDashboard.PutString("Target: ","lost...")

    #Annotations are drawn on a copy so self.img itself stays untouched.
    self.drawing                = self.img.copy()

    #No target selected yet.
    self.selected_target = self.lowest_found_so_far_x = None
    self.lowest_found_so_far = self.target_range = self.target_elevation = 0
    self.target_bearing         = -1

  def mark_correct_shape_and_orientation(self, polygon_tuple):
    """Mark a candidate on the drawing and select it if it is the lowest so far.

    polygon_tuple -- (polygon, x, y, w, h) as built by contours_to_polygon_tuples().
    Every candidate gets a cross in possible_target_color. The candidate whose
    center has the largest y (lowest in the image) becomes self.selected_target.
    """
    #The shape filter is disabled, so every candidate is accepted:
    #  isContourConvex(p) and 4==len(p) and self.slope_angles_correct(p)
    #The original wrapped this body in `if True:` with an unreachable else branch
    #that outlined rejected polygons in passed_up_target_color; that dead branch
    #is removed here.
    _, x, y, w, h = polygon_tuple
    center_x = int(x + w/2.0)
    center_y = int(y + h/2.0)
    self.draw_target(center_x, center_y, self.possible_target_color)

    if center_y > self.lowest_found_so_far:
      self.selected_target       = polygon_tuple
      self.lowest_found_so_far   = center_y
      self.lowest_found_so_far_x = center_x

  def draw_target(self, center_x, center_y, a_color):
    """Draw a cross centered on (center_x, center_y) on self.drawing in a_color."""
    arm_length = 10
    stroke     = 5
    horizontal_arm = ((center_x - arm_length, center_y), (center_x + arm_length, center_y))
    vertical_arm   = ((center_x, center_y - arm_length), (center_x, center_y + arm_length))
    for start_point, end_point in (horizontal_arm, vertical_arm):
      line(self.drawing, start_point, end_point, color=a_color, thickness=stroke)

  def slope_angles_correct(self, polygon):
    """Return True when a 4-sided polygon has upright-rectangle-like sides.

    Requires at least one side whose slope is below horiz_threshold and
    exactly two sides whose slope is above vert_threshold.
    """
    side_slopes = [self.get_slope(polygon, start_index) for start_index in range(4)]
    near_horiz_count = sum(1 for slope in side_slopes if slope < self.horiz_threshold)
    near_vert_count  = sum(1 for slope in side_slopes if slope > self.vert_threshold)
    return near_horiz_count >= 1 and near_vert_count == 2

  def get_slope(self, p, line_starting_point_index):
    """Return the absolute slope of one side of a 4-point polygon.

    p -- polygon indexed as p[point, 0, axis] with axis 0 = x and 1 = y.
    line_starting_point_index -- index of the side's first point; the side
    ends at the next point, wrapping from 3 back to 0.
    A vertical side (no change in x) yields sys.float_info.max.
    """
    end_index = (line_starting_point_index + 1) % 4
    rise = p[line_starting_point_index, 0, 1] - p[end_index, 0, 1]
    run  = p[line_starting_point_index, 0, 0] - p[end_index, 0, 0]
    if run == 0:
      return sys.float_info.max
    return abs(float(rise)/run)

  def unpack_polygon(self,t):
    """Return the polygon from a (polygon, x, y, w, h) tuple."""
    polygon, _x, _y, _w, _h = t
    return polygon

  def contours_to_polygon_tuples(self, contours):
    """Turn contours into (polygon, x, y, w, h) tuples for the plausible targets.

    A contour is kept only when its bounding box passes
    aspect_ratio_and_size_correct(). The polygon is the approxPolyDP
    simplification of the contour, with tolerance 20 and treated as an open curve.
    """
    kept = []
    for contour in contours:
      left, top, width, height = boundingRect(contour)
      if not self.aspect_ratio_and_size_correct(width, height):
        continue
      outline = approxPolyDP(contour, 20, False)
      kept.append((outline, left, top, width, height))

    return kept

  def aspect_ratio_and_size_correct(self, width, height):
    """Return True for elongated boxes: width/height below 0.25 or above 4.

    Despite the name, no size check is made. Pixel width and height are not
    used to reject candidates because range changes how many pixels a real
    target covers. The class-level min/max_target_aspect_ratio values are not
    consulted.
    """
    width_over_height = float(width)/height
    is_tall_bar = width_over_height < 0.25
    is_wide_bar = width_over_height > 4
    return is_tall_bar or is_wide_bar


if '__main__'==__name__:
  #An image path argument is required: without one the script prints a hint and exits with status 2.
  #NOTE(review): ImageProcessor treats img_path=None as "read from VideoCapture(0)", but this
  #entry point never passes None, so camera mode cannot be reached from the command line - confirm intent.
  try:
    img_path = sys.argv[1]
  except IndexError: #only a missing argument is expected here; a bare except would hide anything else.
    print('Please add an image path argument and try again.')
    sys.exit(2)

  ImageProcessor(img_path).video_feed()