Add files via upload

zhzgithub · Jun 18, 2018 · 290ebcc · 290ebcc
1 parent 4f03efb
commit 290ebcc
Show file tree

Hide file tree

Showing 13 changed files with 786 additions and 0 deletions.
diff --git a/project/检测条形码位置/detecting-barcodes-in-images/detect_barcode.py b/project/检测条形码位置/detecting-barcodes-in-images/detect_barcode.py
@@ -0,0 +1,53 @@
+# USAGE
+# python detect_barcode.py --image images/barcode_01.jpg
+
+# import the necessary packages
+import numpy as np
+import argparse
+import cv2
+
+# Locate the most barcode-like region of an image and outline it.
+#
+# Pipeline: grayscale -> Scharr gradients -> blur/threshold -> morphological
+# clean-up -> largest external contour -> rotated bounding box.
+
+# construct the argument parser and parse the command-line arguments
+ap = argparse.ArgumentParser()
+ap.add_argument("-i", "--image", required=True, help="path to the image file")
+args = vars(ap.parse_args())
+
+# load the image and convert it to grayscale; cv2.imread returns None instead
+# of raising when the file is missing or unreadable, so stop here with a
+# clear message rather than failing inside cvtColor
+image = cv2.imread(args["image"])
+if image is None:
+    raise SystemExit("could not read image: {}".format(args["image"]))
+gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+
+# the legacy `cv2.cv` submodule only exists in OpenCV 2.x, so prefer the
+# top-level names and fall back to the legacy ones when they are absent
+ddepth = cv2.CV_32F if hasattr(cv2, "CV_32F") else cv2.cv.CV_32F
+box_points = cv2.boxPoints if hasattr(cv2, "boxPoints") else cv2.cv.BoxPoints
+
+# compute the Scharr gradient representation of the image in both the x and
+# y direction (ksize=-1 selects the Scharr kernel)
+gradX = cv2.Sobel(gray, ddepth=ddepth, dx=1, dy=0, ksize=-1)
+gradY = cv2.Sobel(gray, ddepth=ddepth, dx=0, dy=1, ksize=-1)
+
+# subtract the y-gradient from the x-gradient, then convert the result back
+# to an unsigned 8-bit image of absolute values
+gradient = cv2.subtract(gradX, gradY)
+gradient = cv2.convertScaleAbs(gradient)
+
+# blur and threshold the image
+blurred = cv2.blur(gradient, (9, 9))
+(_, thresh) = cv2.threshold(blurred, 225, 255, cv2.THRESH_BINARY)
+
+# construct a closing kernel (wider than tall) and apply it to the
+# thresholded image
+kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (21, 7))
+closed = cv2.morphologyEx(thresh, cv2.MORPH_CLOSE, kernel)
+
+# perform a series of erosions and dilations to remove small blobs
+closed = cv2.erode(closed, None, iterations=4)
+closed = cv2.dilate(closed, None, iterations=4)
+
+# find the external contours in the cleaned-up image; findContours returns
+# (contours, hierarchy) in OpenCV 2.x/4.x but (image, contours, hierarchy)
+# in OpenCV 3.x, so pick the contour list by the size of the result
+found = cv2.findContours(closed.copy(), cv2.RETR_EXTERNAL,
+                         cv2.CHAIN_APPROX_SIMPLE)
+cnts = found[0] if len(found) == 2 else found[1]
+if len(cnts) == 0:
+    raise SystemExit("no barcode-like region found in: {}".format(args["image"]))
+
+# keep only the contour with the largest area
+c = max(cnts, key=cv2.contourArea)
+
+# compute the rotated bounding box of the largest contour; np.int0 was an
+# alias of np.intp that NumPy 2.0 removed, so convert with np.intp directly
+rect = cv2.minAreaRect(c)
+box = np.asarray(box_points(rect)).astype(np.intp)
+
+# draw a bounding box around the detected barcode and display the image
+# until a key is pressed
+cv2.drawContours(image, [box], -1, (0, 255, 0), 3)
+cv2.imshow("Image", image)
+cv2.waitKey(0)
diff --git a/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_01.jpg b/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_01.jpg
diff --git a/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_02.jpg b/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_02.jpg
diff --git a/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_03.jpg b/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_03.jpg
diff --git a/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_04.jpg b/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_04.jpg
diff --git a/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_05.jpg b/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_05.jpg
diff --git a/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_06.jpg b/project/检测条形码位置/detecting-barcodes-in-images/images/barcode_06.jpg
diff --git a/project/检测条形码位置/用 Python 和 OpenCV 检测图片上的条形码 - 文章 - 伯乐在线.pdf b/project/检测条形码位置/用 Python 和 OpenCV 检测图片上的条形码 - 文章 - 伯乐在线.pdf
diff --git a/project/汉字识别/tinymind_chinese_font_recognition/README.md b/project/汉字识别/tinymind_chinese_font_recognition/README.md
@@ -0,0 +1,8 @@
+# tinymind_chinese_font_recognition
+汉字书法识别           
+
+split_dataset.py 分割数据集，分割为训练集和验证集           
+
+pipline_model.py 使用卷积的 pipeline 模型来进行训练
+
+训练集在百度网盘
diff --git a/project/汉字识别/tinymind_chinese_font_recognition/pipline_model.py b/project/汉字识别/tinymind_chinese_font_recognition/pipline_model.py
diff --git a/project/汉字识别/tinymind_chinese_font_recognition/split_dataset.py b/project/汉字识别/tinymind_chinese_font_recognition/split_dataset.py
@@ -0,0 +1,107 @@
+# -*- coding: utf-8 -*-
+"""
+从数据集中划分train和validation两个文件
+train_test_split_ratio=0.1 or 0.2
+Tree目录：
+    data：
+        train：
+            folder1
+            ......
+            folder529
+        validation:
+            folder1
+            ......
+            folder529
+"""
+import os
+import random
+import PIL.Image as Image		# PIL是Python Imaging Library 图片库
+
+
+# Remove every entry directly under `path` that is not a directory.
+def isfile(path):
+    """Delete all non-directory entries found directly inside ``path``.
+
+    Despite its name, this function tests nothing and returns nothing: it
+    removes entries so that only sub-directories remain under ``path``.
+
+    Args:
+        path: Directory to clean up. A trailing path separator is optional.
+
+    Raises:
+        OSError: If ``path`` cannot be listed or an entry cannot be removed.
+    """
+    for entry in os.listdir(path):
+        # os.path.join inserts the separator when `path` has no trailing
+        # slash; plain string concatenation would build a wrong path then.
+        entry_path = os.path.join(path, entry)
+        if not os.path.isdir(entry_path):
+            os.remove(entry_path)
+
+
+# Create a directory (including parents) unless the path already exists.
+def mkdir(path):
+    """Create ``path`` when nothing exists there yet and report the outcome.
+
+    The path and a short status message are printed in both cases.
+
+    Args:
+        path: Directory path to create; missing parents are created too.
+
+    Returns:
+        True if the directory was created by this call, False if the path
+        already existed.
+    """
+    created = not os.path.exists(path)
+    if created:
+        os.makedirs(path)
+    print(path)
+    print('success' if created else 'folder is exist')
+    return created
+
+
+# List the entries of a directory as full paths and as bare names.
+def eachFile(filepath):
+    """Return the entries directly under ``filepath``, skipping '.DS_Store'.
+
+    The listing is not recursive: only the immediate children are reported,
+    in the order os.listdir yields them.
+
+    Args:
+        filepath: Directory whose entries are listed.
+
+    Returns:
+        A pair ``(full_paths, names)`` of equally ordered lists, where each
+        full path is ``os.path.join(filepath, name)``.
+    """
+    # '.DS_Store' is the only name filtered out; every other entry is kept.
+    names = [entry for entry in os.listdir(filepath) if entry != '.DS_Store']
+    full_paths = [os.path.join(filepath, entry) for entry in names]
+    return full_paths, names
+
+
+# Copy each listed image to a destination derived from its own path.
+def move_ratio(data_list, original_str, replace_str):
+    """Re-save every image in ``data_list`` under a substituted path.
+
+    The destination of each image is its source path with ``original_str``
+    replaced by ``replace_str``. Source files are left in place, so this is
+    a copy rather than a move. The image is decoded and written again by
+    PIL, not copied byte for byte.
+
+    Args:
+        data_list: Iterable of image file paths to copy.
+        original_str: Substring of each source path to replace.
+        replace_str: Text substituted for ``original_str``.
+    """
+    for src_path in data_list:
+        # NOTE(review): str.replace substitutes every occurrence, so a file
+        # or folder name that also contains `original_str` changes the
+        # destination as well -- confirm the dataset has no such names.
+        dst_path = src_path.replace(original_str, replace_str)
+        # The context manager closes the image even when save() raises.
+        with Image.open(src_path) as fromImage:
+            fromImage.save(dst_path)
+
+if __name__ == '__main__':
+
+    # Dataset locations previously used on another machine:
+    # data_path = 'C:/Users/Jack/Documents/jupyter/font_recognition/chinese_font_recognition/train/'  # original data
+    # data_tra_path = 'C:/Users/Jack/Documents/jupyter/font_recognition/chinese_font_recognition/new_train_val_data/font_tra/'  # new training split
+    # data_val_path = 'C:/Users/Jack/Documents/jupyter/font_recognition/chinese_font_recognition/new_train_val_data/font_val/'
+
+    data_path = 'E:/BaiduNetdiskDownload/TMD/train/'  # where the original data lives
+    data_tra_path = 'E:/BaiduNetdiskDownload/TMD/new_train_val_data/font_tra/'  # output root of the training split
+    data_val_path = 'E:/BaiduNetdiskDownload/TMD/new_train_val_data/font_val/'  # output root of the validation split
+
+    # Full paths and bare names of the entries under data_path
+    # (presumably one folder per character class -- confirm against the data).
+    full_child_file, child_file = eachFile(data_path)
+
+    # Create one output folder per entry under both split roots, so the
+    # copies made further down have a directory to land in. The explicit '/'
+    # is redundant because both roots already end with one; it is kept so the
+    # path string handed to mkdir stays unchanged.
+    for class_name in child_file:
+        mkdir(data_tra_path + '/' + str(class_name))
+        mkdir(data_val_path + '/' + str(class_name))
+
+    # Fraction of each folder's files that goes to the training split; the
+    # remainder goes to the validation split.
+    test_train_split_ratio = 0.9
+
+    for class_dir in full_child_file:
+        # pic_dir holds the paths of the entries in this folder, not image data.
+        pic_dir, _ = eachFile(class_dir)
+        random.shuffle(pic_dir)
+
+        # Both lists are rebuilt for every folder; nothing accumulates
+        # across iterations because each folder is copied before moving on.
+        split_at = int(test_train_split_ratio * len(pic_dir))
+        train_list = pic_dir[:split_at]
+        val_list = pic_dir[split_at:]
+
+        print('proprecessing %s' % class_dir)
+
+        # Copy each file to the same relative location under the new roots
+        # by rewriting the 'train' part of its path.
+        move_ratio(train_list, 'train', 'new_train_val_data/font_tra')
+        move_ratio(val_list, 'train', 'new_train_val_data/font_val')
+
+
diff --git a/project/用 Python 和 OpenCV 检测和跟踪运动对象/motion_detector.py b/project/用 Python 和 OpenCV 检测和跟踪运动对象/motion_detector.py
@@ -0,0 +1,87 @@
+# 导入必要的软件包
+import argparse
+import datetime
+import imutils
+import time
+import cv2
+
+# Detect motion by comparing every frame of a video stream against the first
+# frame, outline the regions that changed and display the annotated feed.
+
+# build the argument parser and parse the command-line arguments
+ap = argparse.ArgumentParser()
+ap.add_argument("-v", "--video", help="path to the video file")
+ap.add_argument("-a", "--min-area", type=int, default=500, help="minimum area size")
+args = vars(ap.parse_args())
+
+# if no video path was given, read from the default camera
+if args.get("video", None) is None:
+    camera = cv2.VideoCapture(0)
+    time.sleep(0.25)
+
+# otherwise read from the given video file
+else:
+    camera = cv2.VideoCapture(args["video"])
+
+# the first frame of the stream serves as the reference the later frames
+# are compared against
+firstFrame = None
+
+# loop over the frames of the video
+while True:
+    # grab the current frame and initialise the occupied/unoccupied text
+    (grabbed, frame) = camera.read()
+    text = "Unoccupied"
+
+    # if no frame could be grabbed, the end of the video has been reached
+    if not grabbed:
+        break
+
+    # resize the frame, convert it to grayscale and apply a Gaussian blur
+    frame = imutils.resize(frame, width=500)
+    gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+    gray = cv2.GaussianBlur(gray, (21, 21), 0)
+
+    # if the reference frame is not set yet, use this frame and move on
+    if firstFrame is None:
+        firstFrame = gray
+        continue
+
+    # compute the absolute difference between the reference frame and the
+    # current frame, then threshold it into a binary image
+    frameDelta = cv2.absdiff(firstFrame, gray)
+    thresh = cv2.threshold(frameDelta, 25, 255, cv2.THRESH_BINARY)[1]
+
+    # dilate the thresholded image to fill in holes, then find the contours
+    # on it; findContours returns (contours, hierarchy) in OpenCV 2.x/4.x but
+    # (image, contours, hierarchy) in OpenCV 3.x, so pick the contour list by
+    # the size of the result instead of unpacking a fixed number of values
+    thresh = cv2.dilate(thresh, None, iterations=2)
+    found = cv2.findContours(thresh.copy(), cv2.RETR_EXTERNAL,
+        cv2.CHAIN_APPROX_SIMPLE)
+    cnts = found[0] if len(found) == 2 else found[1]
+
+    # loop over the contours
+    for c in cnts:
+        # if the contour is too small, ignore it
+        if cv2.contourArea(c) < args["min_area"]:
+            continue
+
+        # compute the bounding box for the contour, draw it on the frame,
+        # and update the text
+        (x, y, w, h) = cv2.boundingRect(c)
+        cv2.rectangle(frame, (x, y), (x + w, y + h), (0, 255, 0), 2)
+        text = "Occupied"
+
+    # draw the status text and the timestamp on the frame
+    cv2.putText(frame, "Room Status: {}".format(text), (10, 20),
+        cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 255), 2)
+    cv2.putText(frame, datetime.datetime.now().strftime("%A %d %B %Y %I:%M:%S%p"),
+        (10, frame.shape[0] - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.35, (0, 0, 255), 1)
+
+    # show the frames and record whether the user pressed a key
+    cv2.imshow("Security Feed", frame)
+    cv2.imshow("Thresh", thresh)
+    cv2.imshow("Frame Delta", frameDelta)
+    key = cv2.waitKey(1) & 0xFF
+
+    # if the `q` key was pressed, leave the loop
+    if key == ord("q"):
+        break
+
+# release the camera and close any open windows
+camera.release()
+cv2.destroyAllWindows()
diff --git a/project/用 Python 和 OpenCV 检测和跟踪运动对象/用 Python 和 OpenCV 检测和跟踪运动对象 - Python - 伯乐在线.pdf b/project/用 Python 和 OpenCV 检测和跟踪运动对象/用 Python 和 OpenCV 检测和跟踪运动对象 - Python - 伯乐在线.pdf