opensourceai
diff --git a/‎.gitignore
+114 b/‎.gitignore
+114
diff --git a/‎LICENSE
+21 b/‎LICENSE
+21
diff --git a/‎README.md
+30 b/‎README.md
+30
diff --git a/‎core/common.py
+37 b/‎core/common.py
+37
diff --git a/‎core/convert_tfrecord.py
+53 b/‎core/convert_tfrecord.py
+53
@@ -0,0 +1,114 @@
+# Created by .ignore support plugin (hsz.mobi)
+### Example user template template
+### Example user template
+
+# IntelliJ project files
+.idea
+*.iml
+out
+gen
+### Python template
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+.hypothesis/
+.pytest_cache/
+
+# Translations
+*.mo
+*.pot
+
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+
+# Flask stuff:
+instance/
+.webassets-cache
+
+# Scrapy stuff:
+.scrapy
+
+# Sphinx documentation
+docs/_build/
+
+# PyBuilder
+target/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# pyenv
+.python-version
+
+# celery beat schedule file
+celerybeat-schedule
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+/data
@@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2019 OpenSourceAI
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
@@ -0,0 +1,30 @@
+# 简介
+本项目是对[yolov3的tensorflow实现](https://github.com/YunYang1994/tensorflow-yolov3)项目的一次"整合",做了一些细微的修改,并添加了大量的中文注释,帮助快速阅读理解. 基础好的读者可以直接阅读原代码.
+
+[yolov3的tensorflow实现](https://github.com/YunYang1994/tensorflow-yolov3)这个项目,应该是作为菜鸟的我到目前为止接触过的在原理和代码实现上最复杂的深度学习项目了. 项目代码量大,又涉及shape变换和维度广播,看着看着一不小心就迷失了. 反反复复地看了好几遍,才感觉把整个项目代码的逻辑给拉通. 整个过程中反复调试,推算维度变换和运算的处理过程,总之收获巨大.
+
+欢迎交流,指出错误等.
+# 开箱即用
+
+下载[data]()
+
+```
+$ python video_dome.py # 默认使用0摄像头, 也可以通过局域网调用手机摄像头
+```
+![截图]()
+# 学习
+
+从快速训练[quick_train.py]()入手,阅读项目代码,学习yolov3的细节. 在此之前:
+- 下载[data](),使用浣熊数据集
+
+![]()|![]()
+- [pic_vis.py]() 可视化数据
+- 使用[core.convert_tfrecord.py](),转换为tfrecord文件
+- [show_image_from_tfrecord.py](),检查文件是否正常
+- [quick_train.py]()开始训练调试
+- [show_train_result.py]() 检测所训练的模型效果.
+
+# 使用其他数据集进行训练
+待更新....
+
+>https://github.com/YunYang1994/tensorflow-yolov3
@@ -0,0 +1,37 @@
+import tensorflow as tf
+
+# Basic building blocks used to construct the model.
+slim = tf.contrib.slim
+
+
+def _conv2d_fixed_padding(inputs, filters, kernel_size, strides=1):
+    if strides > 1: inputs = _fixed_padding(inputs, kernel_size)
+    inputs = slim.conv2d(inputs, filters, kernel_size, stride=strides,
+                         padding=('SAME' if strides == 1 else 'VALID'))
+    return inputs
+
+
+@tf.contrib.framework.add_arg_scope
+def _fixed_padding(inputs, kernel_size, *args, mode='CONSTANT', **kwargs):
+    """
+    演空间维度填充输入,与输入大小无关, 只有与所使用的卷积核有关,左右两边进行填充
+
+    Args:
+      inputs: A tensor of size [batch, channels, height_in, width_in] or
+        [batch, height_in, width_in, channels] depending on data_format.
+      kernel_size: The kernel to be used in the conv2d or max_pool2d operation.
+                   Should be a positive integer.
+      mode: The mode for tf.pad.
+
+    Returns:
+      A tensor with the same format as the input with the data either intact
+      (if kernel_size == 1) or padded (if kernel_size > 1).
+    """
+    # 使得kernel完整走过边缘
+    pad_total = kernel_size - 1
+    pad_beg = pad_total // 2
+    pad_end = pad_total - pad_beg
+
+    padded_inputs = tf.pad(inputs, [[0, 0], [pad_beg, pad_end],
+                                    [pad_beg, pad_end], [0, 0]], mode=mode)
+    return padded_inputs
@@ -0,0 +1,53 @@
+import sys
+import argparse
+import numpy as np
+import tensorflow as tf
+
+
+# Convert the training images into a tfrecord file
+
+def main(argv):
+    parser = argparse.ArgumentParser()
+    # 物体映射表 , 图片地址, boxe , class_id 文件
+    parser.add_argument("--dataset_txt", default='../data/train_dome_data/new_test.txt')
+    parser.add_argument("--tfrecord_path_prefix",
+                        default='../data/train_dome_data/images')
+    # default='./data/train_data/quick_train_data/tfrecords/quick_train_data')
+    flags = parser.parse_args()
+
+    dataset = {}
+    with open(flags.dataset_txt, 'r') as f:
+        for line in f.readlines():
+            example = line.split(' ')
+            image_path = example[0]
+            boxes_num = len(example[1:]) // 5  # boxs数量
+            boxes = np.zeros([boxes_num, 5], dtype=np.float32)
+            for i in range(boxes_num):
+                boxes[i] = example[1 + i * 5:6 + i * 5]
+                # print(boxes[i])
+            dataset[image_path] = boxes
+
+    image_paths = list(dataset.keys())
+    images_num = len(image_paths)
+    print(">> Processing %d images" % images_num)
+
+    tfrecord_file = flags.tfrecord_path_prefix + "_" + flags.dataset_txt.split("_")[-1].split(".")[0] + ".tfrecords"
+    with tf.python_io.TFRecordWriter(tfrecord_file) as record_writer:
+        for i in range(images_num):
+            image = tf.gfile.FastGFile(image_paths[i], 'rb').read()  # 读取除二进制文件
+            boxes = dataset[image_paths[i]]  # 得到图片的boxes
+            boxes = boxes.tostring()  # 转出string
+
+            example = tf.train.Example(features=tf.train.Features(
+                feature={
+                    'image': tf.train.Feature(bytes_list=tf.train.BytesList(value=[image])),
+                    'boxes': tf.train.Feature(bytes_list=tf.train.BytesList(value=[boxes])),
+                }
+            ))
+            sys.stdout.write("\r>> %d / %d" % (i + 1, images_num))
+            sys.stdout.flush()
+            record_writer.write(example.SerializeToString())
+        print(">> Saving %d images in %s" % (images_num, tfrecord_file))
+
+
+if __name__ == "__main__": main(sys.argv[1:])