├── .gitattributes
├── .gitignore
├── LaneDetectionLaneNet
│   ├── .idea
│   │   ├── inspectionProfiles
│   │   │   └── profiles_settings.xml
│   │   ├── lanenet-lane-detection-master.iml
│   │   ├── misc.xml
│   │   ├── modules.xml
│   │   └── workspace.xml
│   ├── LICENSE
│   ├── README.md
│   ├── _config.yml
│   ├── config
│   │   └── global_config.py
│   ├── data_provider
│   │   ├── lanenet_data_feed_pipline.py
│   │   └── tf_io_pipline_tools.py
│   ├── lanenet_model
│   │   ├── lanenet.py
│   │   ├── lanenet_back_end.py
│   │   ├── lanenet_discriminative_loss.py
│   │   ├── lanenet_front_end.py
│   │   └── lanenet_postprocess.py
│   ├── mnn_project
│   │   ├── __init__.py
│   │   ├── config.ini
│   │   ├── config_parser.cpp
│   │   ├── config_parser.h
│   │   ├── convert_lanenet_model_into_mnn_model.sh
│   │   ├── dbscan.hpp
│   │   ├── freeze_lanenet_model.py
│   │   ├── kdtree.cpp
│   │   ├── kdtree.h
│   │   ├── lanenet_model.cpp
│   │   └── lanenet_model.h
│   ├── requirements.txt
│   ├── semantic_segmentation_zoo
│   │   ├── __init__.py
│   │   ├── cnn_basenet.py
│   │   └── vgg16_based_fcn.py
│   └── tools
│       ├── evaluate_lanenet_on_tusimple.py
│       ├── evaluate_model_utils.py
│       ├── generate_tusimple_dataset.py
│       ├── lane_and_object_detection_on_video.py
│       ├── test_lanenet.py
│       └── train_lanenet.py
├── OUT
│   ├── output_video - Copy.avi
│   └── output_video.avi
├── ObstacleDetectionYOLO
│   ├── ObjectDetection_YOLO.py
│   └── images
│       ├── 0.jpg
│       └── 3.jpg
├── Project_report.pdf
├── Test_Detections_On_Video.py
└── readme.md
/.gitattributes:
--------------------------------------------------------------------------------
1 | # Auto detect text files and perform LF normalization
2 | * text=auto
3 |
--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
1 | # Byte-compiled / optimized / DLL files
2 | __pycache__/
3 | *.py[cod]
4 | *$py.class
5 |
6 | # C extensions
7 | *.so
8 |
9 | # Distribution / packaging
10 | .Python
11 | build/
12 | develop-eggs/
13 | dist/
14 | downloads/
15 | eggs/
16 | .eggs/
17 | lib/
18 | lib64/
19 | parts/
20 | sdist/
21 | var/
22 | wheels/
23 | pip-wheel-metadata/
24 | share/python-wheels/
25 | *.egg-info/
26 | .installed.cfg
27 | *.egg
28 | MANIFEST
29 |
30 | # PyInstaller
31 | # Usually these files are written by a python script from a template
32 | # before PyInstaller builds the exe, so as to inject date/other infos into it.
33 | *.manifest
34 | *.spec
35 |
36 | # Installer logs
37 | pip-log.txt
38 | pip-delete-this-directory.txt
39 |
40 | # Unit test / coverage reports
41 | htmlcov/
42 | .tox/
43 | .nox/
44 | .coverage
45 | .coverage.*
46 | .cache
47 | nosetests.xml
48 | coverage.xml
49 | *.cover
50 | *.py,cover
51 | .hypothesis/
52 | .pytest_cache/
53 |
54 | # Translations
55 | *.mo
56 | *.pot
57 |
58 | # Django stuff:
59 | *.log
60 | local_settings.py
61 | db.sqlite3
62 | db.sqlite3-journal
63 |
64 | # Flask stuff:
65 | instance/
66 | .webassets-cache
67 |
68 | # Scrapy stuff:
69 | .scrapy
70 |
71 | # Sphinx documentation
72 | docs/_build/
73 |
74 | # PyBuilder
75 | target/
76 |
77 | # Jupyter Notebook
78 | .ipynb_checkpoints
79 |
80 | # IPython
81 | profile_default/
82 | ipython_config.py
83 |
84 | # pyenv
85 | .python-version
86 |
87 | # pipenv
88 | # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
89 | # However, in case of collaboration, if having platform-specific dependencies or dependencies
90 | # having no cross-platform support, pipenv may install dependencies that don't work, or not
91 | # install all needed dependencies.
92 | #Pipfile.lock
93 |
94 | # celery beat schedule file
95 | celerybeat-schedule
96 |
97 | # SageMath parsed files
98 | *.sage.py
99 |
100 | # Environments
101 | .env
102 | .venv
103 | env/
104 | venv/
105 | ENV/
106 | env.bak/
107 | venv.bak/
108 |
109 | # Spyder project settings
110 | .spyderproject
111 | .spyproject
112 |
113 | # Rope project settings
114 | .ropeproject
115 |
116 | # mkdocs documentation
117 | /site
118 |
119 | # mypy
120 | .mypy_cache/
121 | .dmypy.json
122 | dmypy.json
123 |
124 | # Pyre type checker
125 | .pyre/
126 |
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/.idea/inspectionProfiles/profiles_settings.xml:
--------------------------------------------------------------------------------
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/.idea/lanenet-lane-detection-master.iml:
--------------------------------------------------------------------------------
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/.idea/misc.xml:
--------------------------------------------------------------------------------
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/.idea/modules.xml:
--------------------------------------------------------------------------------
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/.idea/workspace.xml:
--------------------------------------------------------------------------------
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/LICENSE:
--------------------------------------------------------------------------------
1 | Apache License
2 | Version 2.0, January 2004
3 | http://www.apache.org/licenses/
4 |
5 | TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
6 |
7 | 1. Definitions.
8 |
9 | "License" shall mean the terms and conditions for use, reproduction,
10 | and distribution as defined by Sections 1 through 9 of this document.
11 |
12 | "Licensor" shall mean the copyright owner or entity authorized by
13 | the copyright owner that is granting the License.
14 |
15 | "Legal Entity" shall mean the union of the acting entity and all
16 | other entities that control, are controlled by, or are under common
17 | control with that entity. For the purposes of this definition,
18 | "control" means (i) the power, direct or indirect, to cause the
19 | direction or management of such entity, whether by contract or
20 | otherwise, or (ii) ownership of fifty percent (50%) or more of the
21 | outstanding shares, or (iii) beneficial ownership of such entity.
22 |
23 | "You" (or "Your") shall mean an individual or Legal Entity
24 | exercising permissions granted by this License.
25 |
26 | "Source" form shall mean the preferred form for making modifications,
27 | including but not limited to software source code, documentation
28 | source, and configuration files.
29 |
30 | "Object" form shall mean any form resulting from mechanical
31 | transformation or translation of a Source form, including but
32 | not limited to compiled object code, generated documentation,
33 | and conversions to other media types.
34 |
35 | "Work" shall mean the work of authorship, whether in Source or
36 | Object form, made available under the License, as indicated by a
37 | copyright notice that is included in or attached to the work
38 | (an example is provided in the Appendix below).
39 |
40 | "Derivative Works" shall mean any work, whether in Source or Object
41 | form, that is based on (or derived from) the Work and for which the
42 | editorial revisions, annotations, elaborations, or other modifications
43 | represent, as a whole, an original work of authorship. For the purposes
44 | of this License, Derivative Works shall not include works that remain
45 | separable from, or merely link (or bind by name) to the interfaces of,
46 | the Work and Derivative Works thereof.
47 |
48 | "Contribution" shall mean any work of authorship, including
49 | the original version of the Work and any modifications or additions
50 | to that Work or Derivative Works thereof, that is intentionally
51 | submitted to Licensor for inclusion in the Work by the copyright owner
52 | or by an individual or Legal Entity authorized to submit on behalf of
53 | the copyright owner. For the purposes of this definition, "submitted"
54 | means any form of electronic, verbal, or written communication sent
55 | to the Licensor or its representatives, including but not limited to
56 | communication on electronic mailing lists, source code control systems,
57 | and issue tracking systems that are managed by, or on behalf of, the
58 | Licensor for the purpose of discussing and improving the Work, but
59 | excluding communication that is conspicuously marked or otherwise
60 | designated in writing by the copyright owner as "Not a Contribution."
61 |
62 | "Contributor" shall mean Licensor and any individual or Legal Entity
63 | on behalf of whom a Contribution has been received by Licensor and
64 | subsequently incorporated within the Work.
65 |
66 | 2. Grant of Copyright License. Subject to the terms and conditions of
67 | this License, each Contributor hereby grants to You a perpetual,
68 | worldwide, non-exclusive, no-charge, royalty-free, irrevocable
69 | copyright license to reproduce, prepare Derivative Works of,
70 | publicly display, publicly perform, sublicense, and distribute the
71 | Work and such Derivative Works in Source or Object form.
72 |
73 | 3. Grant of Patent License. Subject to the terms and conditions of
74 | this License, each Contributor hereby grants to You a perpetual,
75 | worldwide, non-exclusive, no-charge, royalty-free, irrevocable
76 | (except as stated in this section) patent license to make, have made,
77 | use, offer to sell, sell, import, and otherwise transfer the Work,
78 | where such license applies only to those patent claims licensable
79 | by such Contributor that are necessarily infringed by their
80 | Contribution(s) alone or by combination of their Contribution(s)
81 | with the Work to which such Contribution(s) was submitted. If You
82 | institute patent litigation against any entity (including a
83 | cross-claim or counterclaim in a lawsuit) alleging that the Work
84 | or a Contribution incorporated within the Work constitutes direct
85 | or contributory patent infringement, then any patent licenses
86 | granted to You under this License for that Work shall terminate
87 | as of the date such litigation is filed.
88 |
89 | 4. Redistribution. You may reproduce and distribute copies of the
90 | Work or Derivative Works thereof in any medium, with or without
91 | modifications, and in Source or Object form, provided that You
92 | meet the following conditions:
93 |
94 | (a) You must give any other recipients of the Work or
95 | Derivative Works a copy of this License; and
96 |
97 | (b) You must cause any modified files to carry prominent notices
98 | stating that You changed the files; and
99 |
100 | (c) You must retain, in the Source form of any Derivative Works
101 | that You distribute, all copyright, patent, trademark, and
102 | attribution notices from the Source form of the Work,
103 | excluding those notices that do not pertain to any part of
104 | the Derivative Works; and
105 |
106 | (d) If the Work includes a "NOTICE" text file as part of its
107 | distribution, then any Derivative Works that You distribute must
108 | include a readable copy of the attribution notices contained
109 | within such NOTICE file, excluding those notices that do not
110 | pertain to any part of the Derivative Works, in at least one
111 | of the following places: within a NOTICE text file distributed
112 | as part of the Derivative Works; within the Source form or
113 | documentation, if provided along with the Derivative Works; or,
114 | within a display generated by the Derivative Works, if and
115 | wherever such third-party notices normally appear. The contents
116 | of the NOTICE file are for informational purposes only and
117 | do not modify the License. You may add Your own attribution
118 | notices within Derivative Works that You distribute, alongside
119 | or as an addendum to the NOTICE text from the Work, provided
120 | that such additional attribution notices cannot be construed
121 | as modifying the License.
122 |
123 | You may add Your own copyright statement to Your modifications and
124 | may provide additional or different license terms and conditions
125 | for use, reproduction, or distribution of Your modifications, or
126 | for any such Derivative Works as a whole, provided Your use,
127 | reproduction, and distribution of the Work otherwise complies with
128 | the conditions stated in this License.
129 |
130 | 5. Submission of Contributions. Unless You explicitly state otherwise,
131 | any Contribution intentionally submitted for inclusion in the Work
132 | by You to the Licensor shall be under the terms and conditions of
133 | this License, without any additional terms or conditions.
134 | Notwithstanding the above, nothing herein shall supersede or modify
135 | the terms of any separate license agreement you may have executed
136 | with Licensor regarding such Contributions.
137 |
138 | 6. Trademarks. This License does not grant permission to use the trade
139 | names, trademarks, service marks, or product names of the Licensor,
140 | except as required for reasonable and customary use in describing the
141 | origin of the Work and reproducing the content of the NOTICE file.
142 |
143 | 7. Disclaimer of Warranty. Unless required by applicable law or
144 | agreed to in writing, Licensor provides the Work (and each
145 | Contributor provides its Contributions) on an "AS IS" BASIS,
146 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
147 | implied, including, without limitation, any warranties or conditions
148 | of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
149 | PARTICULAR PURPOSE. You are solely responsible for determining the
150 | appropriateness of using or redistributing the Work and assume any
151 | risks associated with Your exercise of permissions under this License.
152 |
153 | 8. Limitation of Liability. In no event and under no legal theory,
154 | whether in tort (including negligence), contract, or otherwise,
155 | unless required by applicable law (such as deliberate and grossly
156 | negligent acts) or agreed to in writing, shall any Contributor be
157 | liable to You for damages, including any direct, indirect, special,
158 | incidental, or consequential damages of any character arising as a
159 | result of this License or out of the use or inability to use the
160 | Work (including but not limited to damages for loss of goodwill,
161 | work stoppage, computer failure or malfunction, or any and all
162 | other commercial damages or losses), even if such Contributor
163 | has been advised of the possibility of such damages.
164 |
165 | 9. Accepting Warranty or Additional Liability. While redistributing
166 | the Work or Derivative Works thereof, You may choose to offer,
167 | and charge a fee for, acceptance of support, warranty, indemnity,
168 | or other liability obligations and/or rights consistent with this
169 | License. However, in accepting such obligations, You may act only
170 | on Your own behalf and on Your sole responsibility, not on behalf
171 | of any other Contributor, and only if You agree to indemnify,
172 | defend, and hold each Contributor harmless for any liability
173 | incurred by, or claims asserted against, such Contributor by reason
174 | of your accepting any such warranty or additional liability.
175 |
176 | END OF TERMS AND CONDITIONS
177 |
178 | APPENDIX: How to apply the Apache License to your work.
179 |
180 | To apply the Apache License to your work, attach the following
181 | boilerplate notice, with the fields enclosed by brackets "[]"
182 | replaced with your own identifying information. (Don't include
183 | the brackets!) The text should be enclosed in the appropriate
184 | comment syntax for the file format. We also recommend that a
185 | file or class name and description of purpose be included on the
186 | same "printed page" as the copyright notice for easier
187 | identification within third-party archives.
188 |
189 | Copyright 2018 Luo Yao
190 |
191 | Licensed under the Apache License, Version 2.0 (the "License");
192 | you may not use this file except in compliance with the License.
193 | You may obtain a copy of the License at
194 |
195 | http://www.apache.org/licenses/LICENSE-2.0
196 |
197 | Unless required by applicable law or agreed to in writing, software
198 | distributed under the License is distributed on an "AS IS" BASIS,
199 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
200 | See the License for the specific language governing permissions and
201 | limitations under the License.
202 |
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/README.md:
--------------------------------------------------------------------------------
1 | # LaneNet-Lane-Detection
2 | A TensorFlow implementation of a deep neural network for real-time lane detection, mainly based on the IEEE IV conference
3 | paper "Towards End-to-End Lane Detection: an Instance Segmentation Approach". You can refer to the paper for details:
4 | https://arxiv.org/abs/1802.05591. The model consists of an encoder-decoder stage, a binary semantic segmentation branch,
5 | and an instance semantic segmentation branch trained with a discriminative loss function for the real-time lane detection task.
6 |
7 | The main network architecture is as follows:
8 |
9 | `Network Architecture`
10 | 
11 |
12 | ## Installation
13 | This software has only been tested on Ubuntu 16.04 (x64), Python 3.5, CUDA 9.0 and cuDNN 7.0 with a GTX-1070 GPU.
14 | To install this software you need TensorFlow 1.10.0. Other TensorFlow versions have not been tested, but versions
15 | above 1.10 are expected to work. The remaining required packages can be installed with
16 |
17 | ```
18 | pip3 install -r requirements.txt
19 | ```
20 |
21 | ## Test model
22 | This repo includes a model trained on the TuSimple lane dataset [Tusimple_Lane_Detection](http://benchmark.tusimple.ai/#/).
23 | The deep neural network inference part can reach around 50 fps, which is similar to the figure reported in the paper, but
24 | the current input pipeline still needs to be improved to achieve a real-time lane detection system.
25 |
26 | The trained lanenet model weights files are stored in
27 | [new_lanenet_model_file](https://www.dropbox.com/sh/tnsf0lw6psszvy4/AAA81r53jpUI3wLsRW6TiPCya?dl=0). You can
28 | download the model and put the files in the folder model/tusimple_lanenet_vgg/
29 |
30 | You can test a single image on the trained model as follows
31 |
32 | ```
33 | python tools/test_lanenet.py --weights_path ./model/tusimple_lanenet_vgg/tusimple_lanenet_vgg.ckpt
34 | --image_path ./data/tusimple_test_image/0.jpg
35 | ```
36 | The results are as follows:
37 |
38 | `Test Input Image`
39 |
40 | 
41 |
42 | `Test Lane Mask Image`
43 |
44 | 
45 |
46 | `Test Lane Binary Segmentation Image`
47 |
48 | 
49 |
50 | `Test Lane Instance Segmentation Image`
51 |
52 | 
53 |
54 | If you want to evaluate the model on the whole TuSimple test dataset you may call
55 | ```
56 | python tools/evaluate_lanenet_on_tusimple.py
57 | --image_dir ROOT_DIR/TUSIMPLE_DATASET/test_set/clips
58 | --weights_path ./model/tusimple_lanenet_vgg/tusimple_lanenet_vgg.ckpt
59 | --save_dir ROOT_DIR/TUSIMPLE_DATASET/test_set/test_output
60 | ```
61 | If you set the save_dir argument the results will be saved in that folder;
62 | otherwise the results will not be saved but will be
63 | displayed during the inference process, holding for 3 seconds per image.
64 | I tested the model on the whole TuSimple lane
65 | detection dataset and made a video of it. You may catch a glimpse of it below.
66 |
67 | `Tusimple test dataset gif`
68 | 
69 |
70 | ## Train your own model
71 | #### Data Preparation
72 | First organize your training data following the data/training_data_example folder structure, and generate
73 | a train.txt and a val.txt to record the data used for training the model.
74 |
75 | Each training sample consists of three components: the original image, a binary segmentation label image and an
76 | instance segmentation label image. The binary segmentation label uses 255 for lane pixels and 0 for the rest. The
77 | instance segmentation label uses a different pixel value for each lane and 0 for the rest.
78 |
79 | All training images will be rescaled to the same size according to the config file.
80 |
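Each line of train.txt / val.txt lists the original image, the binary label image and the instance label image,
separated by single spaces. The paths below only illustrate the expected format:

```
data/training_data_example/gt_image/0000.png data/training_data_example/gt_binary_image/0000.png data/training_data_example/gt_instance_image/0000.png
```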
81 | Use the script here to generate the tensorflow records file
82 |
83 | ```
84 | python data_provider/lanenet_data_feed_pipline.py
85 | --dataset_dir ./data/training_data_example
86 | --tfrecords_dir ./data/training_data_example/tfrecords
87 | ```
88 |
89 | #### Train model
90 | In my experiment the number of training epochs is 80010, the batch size is 4, the initial learning rate is 0.001 and polynomial
91 | decay with power 0.9 is used (a short sketch of this schedule follows the training command below). For the training parameters you can check config/global_config.py for details.
92 | You can switch the --net argument to change the base encoder stage. If you choose --net vgg then VGG16 will be used as
93 | the base encoder stage and pretrained parameters will be loaded. You can also modify the training
94 | script to load your own pretrained parameters, or implement your own base encoder stage.
95 | You may call the following script to train your own model
96 |
97 | ```
98 | python tools/train_lanenet.py
99 | --net vgg
100 | --dataset_dir ./data/training_data_example
101 | -m 0
102 | ```
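As a point of reference, the polynomial learning-rate decay mentioned above can be set up in TensorFlow 1.x roughly as in the sketch below. The variable names, the decay step count and the end learning rate are assumptions for illustration; the actual schedule lives in tools/train_lanenet.py, which is not reproduced in this section.

```python
import tensorflow as tf

# Sketch of the decay schedule described above (initial lr 0.001, power 0.9).
global_step = tf.Variable(0, trainable=False, name='global_step')
learning_rate = tf.train.polynomial_decay(
    learning_rate=0.001,         # initial learning rate quoted above
    global_step=global_step,
    decay_steps=80010,           # assumed to match the number of training steps
    end_learning_rate=0.000001,  # assumed floor value
    power=0.9                    # polynomial power quoted above
)
# The 2018.11.10 update below notes that plain SGD (with momentum) replaced Adam.
optimizer = tf.train.MomentumOptimizer(learning_rate=learning_rate, momentum=0.9)
```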
103 | You can also continue the training process from the snapshot by
104 | ```
105 | python tools/train_lanenet.py
106 | --net vgg
107 | --dataset_dir data/training_data_example/
108 | --weights_path path/to/your/last/checkpoint
109 | -m 0
110 | ```
111 |
112 | You may monitor the training process using tensorboard tools
113 |
114 | During my experiment the `Total loss` drops as follows:
115 | 
116 |
117 | The `Binary Segmentation loss` drops as follows:
118 | 
119 |
120 | The `Instance Segmentation loss` drops as follows:
121 | 
122 |
123 | ## Experiment
124 | The accuracy during training process rises as follows:
125 | 
126 |
127 | Please cite my repo [lanenet-lane-detection](https://github.com/MaybeShewill-CV/lanenet-lane-detection) if you use it.
128 |
129 | ## Recent updates 2018.11.10
130 | Adjusted some basic cnn ops according to the new tensorflow api. The
131 | traditional SGD optimizer is now used to optimize the whole model instead of the
132 | original Adam optimizer used in the original paper. I have found that the
133 | SGD optimizer leads to a more stable training process and does not
134 | easily get stuck in nan loss, which often happened with the original
135 | code.
136 |
137 | I have uploaded a new lanenet model trained on tusimple dataset using the
138 | new code here [new_lanenet_model_file](https://www.dropbox.com/sh/tnsf0lw6psszvy4/AAA81r53jpUI3wLsRW6TiPCya?dl=0).
139 | You may download the new model weights and update to the new code. To update
140 | the code you just need to
141 |
142 | ```
143 | git pull origin master
144 | ```
145 | The rest is just the same as mentioned above. I will soon
146 | release a new model trained on the CULane dataset.
147 |
148 | ## Recent updates 2018.12.13
149 | Since a lot of users want an automatic tool to generate the training samples
150 | from the TuSimple dataset, I have uploaded the tool I use to generate the
151 | training samples. You need to first download the TuSimple dataset and unzip the
152 | file to your local disk. Then run the following command to generate the
153 | training samples and the train.txt file.
154 |
155 | ```angular2html
156 | python tools/generate_tusimple_dataset.py --src_dir path/to/your/unzipped/file
157 | ```
158 |
159 | The script will create the train folder and the test folder. The training
160 | samples (original rgb image, binary label image and instance label image) will
161 | be automatically generated in the training/gt_image, training/gt_binary_image and
162 | training/gt_instance_image folders. You may check them yourself before starting
163 | the training process.
164 |
165 | Note that the script only processes the training samples, and you
166 | need to select several lines from the train.txt to generate your own
167 | val.txt file. In order to obtain the test images you can modify the
168 | script on your own.
169 |
170 | ## Recent updates 2019.05.16
171 |
172 | New model weights can be found [here](https://www.dropbox.com/sh/tnsf0lw6psszvy4/AAA81r53jpUI3wLsRW6TiPCya?dl=0)
173 |
174 | ## MNN Project
175 |
176 | Tools are provided to convert the lanenet tensorflow ckpt model into an mnn model and deploy
177 | the model on mobile devices.
178 |
179 | #### Freeze your tensorflow ckpt model weights file
180 | ```
181 | cd LANENET_PROJECT_ROOT_DIR
182 | python mnn_project/freeze_lanenet_model.py -w lanenet.ckpt -s lanenet.pb
183 | ```
184 |
185 | #### Convert pb model into mnn model
186 | ```
187 | cd MNN_PROJECT_ROOT_DIR/tools/converter/build
188 | ./MNNConvert -f TF --modelFile lanenet.pb --MNNModel lanenet.mnn --bizCode MNN
189 | ```
190 |
191 | #### Add lanenet source code into MNN project
192 |
193 | Add the lanenet source code into the MNN project and modify CMakeLists.txt to
194 | compile the executable binary file.
195 |
196 | ## TODO
197 | - [x] Add an embedding visualization tool to visualize the embedding feature map
198 | - [x] Add a detailed explanation of training the components of lanenet separately.
199 | - [x] Train the model on different datasets
200 | - ~~[ ] Adjust the lanenet hnet model and merge the hnet model to the main lanenet model~~
201 | - ~~[ ] Change the normalization function from BN to GN~~
202 |
203 | ## Acknowledgement
204 |
205 | The lanenet project refers to the following projects:
206 |
207 | - [MNN](https://github.com/alibaba/MNN)
208 | - [SimpleDBSCAN](https://github.com/CallmeNezha/SimpleDBSCAN)
209 |
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/_config.yml:
--------------------------------------------------------------------------------
1 | theme: jekyll-theme-cayman
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/config/global_config.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # @Time : 18-1-31 上午11:21
4 | # @Author : MaybeShewill-CV
5 | # @Site : https://github.com/MaybeShewill-CV/lanenet-lane-detection
6 | # @File : global_config.py
7 | # @IDE: PyCharm Community Edition
8 | """
9 | Set global configuration
10 | """
11 | from easydict import EasyDict as edict
12 |
13 | __C = edict()
14 | # Consumers can get config by: from config import cfg
15 |
16 | cfg = __C
17 |
18 | # Train options
19 | __C.TRAIN = edict()
20 |
21 | # Set the shadownet training epochs
22 | __C.TRAIN.EPOCHS = 80010
23 | # Set the display step
24 | __C.TRAIN.DISPLAY_STEP = 1
25 | # Set the test display step during training process
26 | __C.TRAIN.VAL_DISPLAY_STEP = 1000
27 | # Set the momentum parameter of the optimizer
28 | __C.TRAIN.MOMENTUM = 0.9
29 | # Set the initial learning rate
30 | __C.TRAIN.LEARNING_RATE = 0.0005
31 | # Set the GPU resource used during training process
32 | __C.TRAIN.GPU_MEMORY_FRACTION = 0.95
33 | # Set the GPU allow growth parameter during tensorflow training process
34 | __C.TRAIN.TF_ALLOW_GROWTH = True
35 | # Set the shadownet training batch size
36 | __C.TRAIN.BATCH_SIZE = 4
37 | # Set the shadownet validation batch size
38 | __C.TRAIN.VAL_BATCH_SIZE = 4
39 | # Set the class numbers
40 | __C.TRAIN.CLASSES_NUMS = 2
41 | # Set the image height
42 | __C.TRAIN.IMG_HEIGHT = 256
43 | # Set the image width
44 | __C.TRAIN.IMG_WIDTH = 512
45 | # Set the embedding features dims
46 | __C.TRAIN.EMBEDDING_FEATS_DIMS = 4
47 | # Set the random crop pad size
48 | __C.TRAIN.CROP_PAD_SIZE = 32
49 | # Set cpu multi process thread nums
50 | __C.TRAIN.CPU_MULTI_PROCESS_NUMS = 6
51 | # Set the train moving average decay
52 | __C.TRAIN.MOVING_AVERAGE_DECAY = 0.9999
53 | # Set the GPU nums
54 | __C.TRAIN.GPU_NUM = 2
55 |
56 | # Test options
57 | __C.TEST = edict()
58 |
59 | # Set the GPU resource used during testing process
60 | __C.TEST.GPU_MEMORY_FRACTION = 0.8
61 | # Set the GPU allow growth parameter during tensorflow testing process
62 | __C.TEST.TF_ALLOW_GROWTH = True
63 | # Set the test batch size
64 | __C.TEST.BATCH_SIZE = 2
65 |
66 | # Post-process options
67 | __C.POSTPROCESS = edict()
68 |
69 | # Set the post process connect components analysis min area threshold
70 | __C.POSTPROCESS.MIN_AREA_THRESHOLD = 100
71 | # Set the post process dbscan search radius threshold
72 | __C.POSTPROCESS.DBSCAN_EPS = 0.35
73 | # Set the post process dbscan min samples threshold
74 | __C.POSTPROCESS.DBSCAN_MIN_SAMPLES = 1000
75 |
--------------------------------------------------------------------------------
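The post-processing options above (MIN_AREA_THRESHOLD, DBSCAN_EPS, DBSCAN_MIN_SAMPLES) are consumed by lanenet_model/lanenet_postprocess.py, which is not included in this section. As a rough sketch of how such parameters are typically used, the helper below clusters per-pixel lane embeddings with scikit-learn's DBSCAN; it is illustrative only and not the repo's actual implementation.

```python
import numpy as np
from sklearn.cluster import DBSCAN


def cluster_lane_embeddings(lane_embeddings, eps=0.35, min_samples=1000):
    """Cluster embedding vectors of lane pixels into lane instances.

    :param lane_embeddings: (N, embedding_dim) array of embeddings sampled at
        pixels where the binary segmentation mask is positive.
    """
    db = DBSCAN(eps=eps, min_samples=min_samples)
    labels = db.fit_predict(lane_embeddings)  # -1 marks noise points
    lane_ids = [lbl for lbl in np.unique(labels) if lbl != -1]
    return labels, lane_ids
```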
/LaneDetectionLaneNet/data_provider/lanenet_data_feed_pipline.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # @Time : 19-4-23 下午3:54
4 | # @Author : MaybeShewill-CV
5 | # @Site : https://github.com/MaybeShewill-CV/lanenet-lane-detection
6 | # @File : lanenet_data_feed_pipline.py
7 | # @IDE: PyCharm
8 | """
9 | Lanenet data feed pip line
10 | """
11 | import argparse
12 | import glob
13 | import os
14 | import os.path as ops
15 | import random
16 |
17 | import glog as log
18 | import tensorflow as tf
19 |
20 | from LaneDetectionLaneNet.config import global_config
21 | from LaneDetectionLaneNet.data_provider import tf_io_pipline_tools
22 |
23 | CFG = global_config.cfg
24 |
25 |
26 | def init_args():
27 | """
28 |
29 | :return:
30 | """
31 | parser = argparse.ArgumentParser()
32 | parser.add_argument('--dataset_dir', type=str, help='The source lanenet data dir path')
33 | parser.add_argument('--tfrecords_dir', type=str, help='The dir path to save converted tfrecords')
34 |
35 | return parser.parse_args()
36 |
37 |
38 | class LaneNetDataProducer(object):
39 | """
40 | Convert raw image file into tfrecords
41 | """
42 |
43 | def __init__(self, dataset_dir):
44 | """
45 |
46 | :param dataset_dir:
47 | """
48 | self._dataset_dir = dataset_dir
49 |
50 | self._gt_image_dir = ops.join(dataset_dir, 'gt_image')
51 | self._gt_binary_image_dir = ops.join(dataset_dir, 'gt_binary_image')
52 | self._gt_instance_image_dir = ops.join(dataset_dir, 'gt_instance_image')
53 |
54 | self._train_example_index_file_path = ops.join(self._dataset_dir, 'train.txt')
55 | self._test_example_index_file_path = ops.join(self._dataset_dir, 'test.txt')
56 | self._val_example_index_file_path = ops.join(self._dataset_dir, 'val.txt')
57 |
58 | if not self._is_source_data_complete():
59 | raise ValueError('Source image data is not complete, '
60 | 'please check if one of the image folder is not exist')
61 |
62 | if not self._is_training_sample_index_file_complete():
63 | self._generate_training_example_index_file()
64 |
65 | def generate_tfrecords(self, save_dir, step_size=10000):
66 | """
67 | Generate tensorflow records file
68 | :param save_dir:
69 | :param step_size: generate a tfrecord every step_size examples
70 | :return:
71 | """
72 |
73 | def _read_training_example_index_file(_index_file_path):
74 |
75 | assert ops.exists(_index_file_path)
76 |
77 | _example_gt_path_info = []
78 | _example_gt_binary_path_info = []
79 | _example_gt_instance_path_info = []
80 |
81 | with open(_index_file_path, 'r') as _file:
82 | for _line in _file:
83 | _example_info = _line.rstrip('\r').rstrip('\n').split(' ')
84 | _example_gt_path_info.append(_example_info[0])
85 | _example_gt_binary_path_info.append(_example_info[1])
86 | _example_gt_instance_path_info.append(_example_info[2])
87 |
88 | ret = {
89 | 'gt_path_info': _example_gt_path_info,
90 | 'gt_binary_path_info': _example_gt_binary_path_info,
91 | 'gt_instance_path_info': _example_gt_instance_path_info
92 | }
93 |
94 | return ret
95 |
96 | def _split_writing_tfrecords_task(
97 | _example_gt_paths, _example_gt_binary_paths, _example_gt_instance_paths, _flags='train'):
98 |
99 | _split_example_gt_paths = []
100 | _split_example_gt_binary_paths = []
101 | _split_example_gt_instance_paths = []
102 | _split_tfrecords_save_paths = []
103 |
104 | for i in range(0, len(_example_gt_paths), step_size):
105 | _split_example_gt_paths.append(_example_gt_paths[i:i + step_size])
106 | _split_example_gt_binary_paths.append(_example_gt_binary_paths[i:i + step_size])
107 | _split_example_gt_instance_paths.append(_example_gt_instance_paths[i:i + step_size])
108 |
109 | if i + step_size > len(_example_gt_paths):
110 | _split_tfrecords_save_paths.append(
111 | ops.join(save_dir, '{:s}_{:d}_{:d}.tfrecords'.format(_flags, i, len(_example_gt_paths))))
112 | else:
113 | _split_tfrecords_save_paths.append(
114 | ops.join(save_dir, '{:s}_{:d}_{:d}.tfrecords'.format(_flags, i, i + step_size)))
115 |
116 | ret = {
117 | 'gt_paths': _split_example_gt_paths,
118 | 'gt_binary_paths': _split_example_gt_binary_paths,
119 | 'gt_instance_paths': _split_example_gt_instance_paths,
120 | 'tfrecords_paths': _split_tfrecords_save_paths
121 | }
122 |
123 | return ret
124 |
125 | # make save dirs
126 | os.makedirs(save_dir, exist_ok=True)
127 |
128 | # start generating training example tfrecords
129 | log.info('Start generating training example tfrecords')
130 |
131 | # collecting train images paths info
132 | train_image_paths_info = _read_training_example_index_file(self._train_example_index_file_path)
133 | train_gt_images_paths = train_image_paths_info['gt_path_info']
134 | train_gt_binary_images_paths = train_image_paths_info['gt_binary_path_info']
135 | train_gt_instance_images_paths = train_image_paths_info['gt_instance_path_info']
136 |
137 | # split training images according step size
138 | train_split_result = _split_writing_tfrecords_task(
139 | train_gt_images_paths, train_gt_binary_images_paths, train_gt_instance_images_paths, _flags='train')
140 | train_example_gt_paths = train_split_result['gt_paths']
141 | train_example_gt_binary_paths = train_split_result['gt_binary_paths']
142 | train_example_gt_instance_paths = train_split_result['gt_instance_paths']
143 | train_example_tfrecords_paths = train_split_result['tfrecords_paths']
144 |
145 | for index, example_gt_paths in enumerate(train_example_gt_paths):
146 | tf_io_pipline_tools.write_example_tfrecords(
147 | example_gt_paths,
148 | train_example_gt_binary_paths[index],
149 | train_example_gt_instance_paths[index],
150 | train_example_tfrecords_paths[index]
151 | )
152 |
153 | log.info('Generating training example tfrecords complete')
154 |
155 | # start generating validation example tfrecords
156 | log.info('Start generating validation example tfrecords')
157 |
158 | # collecting validation images paths info
159 | val_image_paths_info = _read_training_example_index_file(self._val_example_index_file_path)
160 | val_gt_images_paths = val_image_paths_info['gt_path_info']
161 | val_gt_binary_images_paths = val_image_paths_info['gt_binary_path_info']
162 | val_gt_instance_images_paths = val_image_paths_info['gt_instance_path_info']
163 |
164 | # split validation images according step size
165 | val_split_result = _split_writing_tfrecords_task(
166 | val_gt_images_paths, val_gt_binary_images_paths, val_gt_instance_images_paths, _flags='val')
167 | val_example_gt_paths = val_split_result['gt_paths']
168 | val_example_gt_binary_paths = val_split_result['gt_binary_paths']
169 | val_example_gt_instance_paths = val_split_result['gt_instance_paths']
170 | val_example_tfrecords_paths = val_split_result['tfrecords_paths']
171 |
172 | for index, example_gt_paths in enumerate(val_example_gt_paths):
173 | tf_io_pipline_tools.write_example_tfrecords(
174 | example_gt_paths,
175 | val_example_gt_binary_paths[index],
176 | val_example_gt_instance_paths[index],
177 | val_example_tfrecords_paths[index]
178 | )
179 |
180 | log.info('Generating validation example tfrecords complete')
181 |
182 | # generate test example tfrecords
183 | log.info('Start generating testing example tfrecords')
184 |
185 | # collecting test images paths info
186 | test_image_paths_info = _read_training_example_index_file(self._test_example_index_file_path)
187 | test_gt_images_paths = test_image_paths_info['gt_path_info']
188 | test_gt_binary_images_paths = test_image_paths_info['gt_binary_path_info']
189 | test_gt_instance_images_paths = test_image_paths_info['gt_instance_path_info']
190 |
191 | # split validating images according step size
192 | test_split_result = _split_writing_tfrecords_task(
193 | test_gt_images_paths, test_gt_binary_images_paths, test_gt_instance_images_paths, _flags='test')
194 | test_example_gt_paths = test_split_result['gt_paths']
195 | test_example_gt_binary_paths = test_split_result['gt_binary_paths']
196 | test_example_gt_instance_paths = test_split_result['gt_instance_paths']
197 | test_example_tfrecords_paths = test_split_result['tfrecords_paths']
198 |
199 | for index, example_gt_paths in enumerate(test_example_gt_paths):
200 | tf_io_pipline_tools.write_example_tfrecords(
201 | example_gt_paths,
202 | test_example_gt_binary_paths[index],
203 | test_example_gt_instance_paths[index],
204 | test_example_tfrecords_paths[index]
205 | )
206 |
207 | log.info('Generating testing example tfrecords complete')
208 |
209 | return
210 |
211 | def _is_source_data_complete(self):
212 | """
213 | Check if source data complete
214 | :return:
215 | """
216 | return \
217 | ops.exists(self._gt_binary_image_dir) and \
218 | ops.exists(self._gt_instance_image_dir) and \
219 | ops.exists(self._gt_image_dir)
220 |
221 | def _is_training_sample_index_file_complete(self):
222 | """
223 | Check if the training sample index file is complete
224 | :return:
225 | """
226 | return \
227 | ops.exists(self._train_example_index_file_path) and \
228 | ops.exists(self._test_example_index_file_path) and \
229 | ops.exists(self._val_example_index_file_path)
230 |
231 | def _generate_training_example_index_file(self):
232 | """
233 | Generate training example index file, split source file into 0.85, 0.1, 0.05 for training,
234 | testing and validation. Each image folder is processed separately
235 | :return:
236 | """
237 |
238 | def _gather_example_info():
239 | """
240 |
241 | :return:
242 | """
243 | _info = []
244 |
245 | for _gt_image_path in glob.glob('{:s}/*.png'.format(self._gt_image_dir)):
246 | _gt_binary_image_name = ops.split(_gt_image_path)[1]
247 | _gt_binary_image_path = ops.join(self._gt_binary_image_dir, _gt_binary_image_name)
248 | _gt_instance_image_name = ops.split(_gt_image_path)[1]
249 | _gt_instance_image_path = ops.join(self._gt_instance_image_dir, _gt_instance_image_name)
250 |
251 | assert ops.exists(_gt_binary_image_path), '{:s} not exist'.format(_gt_binary_image_path)
252 | assert ops.exists(_gt_instance_image_path), '{:s} not exist'.format(_gt_instance_image_path)
253 |
254 | _info.append('{:s} {:s} {:s}\n'.format(
255 | _gt_image_path,
256 | _gt_binary_image_path,
257 | _gt_instance_image_path)
258 | )
259 |
260 | return _info
261 |
262 | def _split_training_examples(_example_info):
263 | random.shuffle(_example_info)
264 |
265 | _example_nums = len(_example_info)
266 |
267 | _train_example_info = _example_info[:int(_example_nums * 0.85)]
268 | _val_example_info = _example_info[int(_example_nums * 0.85):int(_example_nums * 0.9)]
269 | _test_example_info = _example_info[int(_example_nums * 0.9):]
270 |
271 | return _train_example_info, _test_example_info, _val_example_info
272 |
273 | train_example_info, test_example_info, val_example_info = _split_training_examples(_gather_example_info())
274 |
275 | random.shuffle(train_example_info)
276 | random.shuffle(test_example_info)
277 | random.shuffle(val_example_info)
278 |
279 | with open(ops.join(self._dataset_dir, 'train.txt'), 'w') as file:
280 | file.write(''.join(train_example_info))
281 |
282 | with open(ops.join(self._dataset_dir, 'test.txt'), 'w') as file:
283 | file.write(''.join(test_example_info))
284 |
285 | with open(ops.join(self._dataset_dir, 'val.txt'), 'w') as file:
286 | file.write(''.join(val_example_info))
287 |
288 | log.info('Generating training example index file complete')
289 |
290 | return
291 |
292 |
293 | class LaneNetDataFeeder(object):
294 | """
295 | Read training examples from tfrecords for the lanenet model
296 | """
297 |
298 | def __init__(self, dataset_dir, flags='train'):
299 | """
300 |
301 | :param dataset_dir:
302 | :param flags:
303 | """
304 | self._dataset_dir = dataset_dir
305 |
306 | self._tfrecords_dir = ops.join(dataset_dir, 'tfrecords')
307 | if not ops.exists(self._tfrecords_dir):
308 | raise ValueError('{:s} not exist, please check again'.format(self._tfrecords_dir))
309 |
310 | self._dataset_flags = flags.lower()
311 | if self._dataset_flags not in ['train', 'test', 'val']:
312 | raise ValueError('flags of the data feeder should be \'train\', \'test\', \'val\'')
313 |
314 | def inputs(self, batch_size, num_epochs):
315 | """
316 | dataset feed pipline input
317 | :param batch_size:
318 | :param num_epochs:
319 | :return: A tuple (gt_images, gt_binary_labels, gt_instance_labels), where:
320 | * gt_images is a float tensor with shape [batch_size, H, W, 3]
321 | in the range [-1.0, 1.0].
322 | * gt_binary_labels and gt_instance_labels are tensors with shape
323 | [batch_size, H, W, 1] holding the binary and instance segmentation labels.
324 | """
325 | if not num_epochs:
326 | num_epochs = None
327 |
328 | tfrecords_file_paths = glob.glob('{:s}/{:s}*.tfrecords'.format(
329 | self._tfrecords_dir, self._dataset_flags)
330 | )
331 | random.shuffle(tfrecords_file_paths)
332 |
333 | with tf.name_scope('input_tensor'):
334 |
335 | # TFRecordDataset opens a binary file and reads one record at a time.
336 | # `tfrecords_file_paths` could also be a list of filenames, which will be read in order.
337 | dataset = tf.data.TFRecordDataset(tfrecords_file_paths)
338 |
339 | # The map transformation takes a function and applies it to every element
340 | # of the dataset.
341 | dataset = dataset.map(map_func=tf_io_pipline_tools.decode,
342 | num_parallel_calls=CFG.TRAIN.CPU_MULTI_PROCESS_NUMS)
343 | if self._dataset_flags != 'test':
344 | dataset = dataset.map(map_func=tf_io_pipline_tools.augment_for_train,
345 | num_parallel_calls=CFG.TRAIN.CPU_MULTI_PROCESS_NUMS)
346 | else:
347 | dataset = dataset.map(map_func=tf_io_pipline_tools.augment_for_test,
348 | num_parallel_calls=CFG.TRAIN.CPU_MULTI_PROCESS_NUMS)
349 | dataset = dataset.map(map_func=tf_io_pipline_tools.normalize,
350 | num_parallel_calls=CFG.TRAIN.CPU_MULTI_PROCESS_NUMS)
351 |
352 | # The shuffle transformation uses a finite-sized buffer to shuffle elements
353 | # in memory. The parameter is the number of elements in the buffer. For
354 | # completely uniform shuffling, set the parameter to be the same as the
355 | # number of elements in the dataset.
356 | if self._dataset_flags != 'test':
357 | dataset = dataset.shuffle(buffer_size=1000)
358 | # repeat num epochs
359 | dataset = dataset.repeat()
360 |
361 | dataset = dataset.batch(batch_size, drop_remainder=True)
362 |
363 | iterator = dataset.make_one_shot_iterator()
364 |
365 | return iterator.get_next(name='{:s}_IteratorGetNext'.format(self._dataset_flags))
366 |
367 |
368 | if __name__ == '__main__':
369 | # init args
370 | args = init_args()
371 |
372 | assert ops.exists(args.dataset_dir), '{:s} not exist'.format(args.dataset_dir)
373 |
374 | producer = LaneNetDataProducer(dataset_dir=args.dataset_dir)
375 | producer.generate_tfrecords(save_dir=args.tfrecords_dir, step_size=1000)
376 |
--------------------------------------------------------------------------------
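A minimal sketch of consuming the LaneNetDataFeeder defined above from a TensorFlow 1.x session. The dataset path is illustrative, the tfrecords are assumed to have been generated already, and the repo root's parent is assumed to be on PYTHONPATH (matching the module's own import style).

```python
import tensorflow as tf

from LaneDetectionLaneNet.data_provider import lanenet_data_feed_pipline

# Build the input tensors for one training batch.
feeder = lanenet_data_feed_pipline.LaneNetDataFeeder(
    dataset_dir='./data/training_data_example', flags='train')
gt_images, gt_binary_labels, gt_instance_labels = feeder.inputs(batch_size=4, num_epochs=1)

with tf.Session() as sess:
    imgs, binary, instance = sess.run([gt_images, gt_binary_labels, gt_instance_labels])
    # With the default config this prints (4, 256, 512, 3) (4, 256, 512, 1) (4, 256, 512, 1).
    print(imgs.shape, binary.shape, instance.shape)
```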
/LaneDetectionLaneNet/data_provider/tf_io_pipline_tools.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # @Time : 19-4-23 下午3:53
4 | # @Author : MaybeShewill-CV
5 | # @Site : https://github.com/MaybeShewill-CV/lanenet-lane-detection
6 | # @File : tf_io_pipline_tools.py
7 | # @IDE: PyCharm
8 | """
9 | tensorflow io pip line tools
10 | """
11 | import os
12 | import os.path as ops
13 |
14 | import cv2
15 | import glog as log
16 | import numpy as np
17 | import tensorflow as tf
18 |
19 | from LaneDetectionLaneNet.config import global_config
20 |
21 | CFG = global_config.cfg
22 |
23 | RESIZE_IMAGE_HEIGHT = CFG.TRAIN.IMG_HEIGHT + CFG.TRAIN.CROP_PAD_SIZE
24 | RESIZE_IMAGE_WIDTH = CFG.TRAIN.IMG_WIDTH + CFG.TRAIN.CROP_PAD_SIZE
25 | CROP_IMAGE_HEIGHT = CFG.TRAIN.IMG_HEIGHT
26 | CROP_IMAGE_WIDTH = CFG.TRAIN.IMG_WIDTH
27 |
28 |
29 | def int64_feature(value):
30 | """
31 |
32 | :return:
33 | """
34 | return tf.train.Feature(int64_list=tf.train.Int64List(value=[value]))
35 |
36 |
37 | def bytes_feature(value):
38 | """
39 |
40 | :param value:
41 | :return:
42 | """
43 | return tf.train.Feature(bytes_list=tf.train.BytesList(value=[value]))
44 |
45 |
46 | def write_example_tfrecords(gt_images_paths, gt_binary_images_paths, gt_instance_images_paths, tfrecords_path):
47 | """
48 | write tfrecords
49 | :param gt_images_paths:
50 | :param gt_binary_images_paths:
51 | :param gt_instance_images_paths:
52 | :param tfrecords_path:
53 | :return:
54 | """
55 | _tfrecords_dir = ops.split(tfrecords_path)[0]
56 | os.makedirs(_tfrecords_dir, exist_ok=True)
57 |
58 | log.info('Writing {:s}....'.format(tfrecords_path))
59 |
60 | with tf.python_io.TFRecordWriter(tfrecords_path) as _writer:
61 | for _index, _gt_image_path in enumerate(gt_images_paths):
62 |
63 | # prepare gt image
64 | _gt_image = cv2.imread(_gt_image_path, cv2.IMREAD_UNCHANGED)
65 | if _gt_image.shape != (RESIZE_IMAGE_HEIGHT, RESIZE_IMAGE_WIDTH, 3):
66 | _gt_image = cv2.resize(
67 | _gt_image,
68 | dsize=(RESIZE_IMAGE_WIDTH, RESIZE_IMAGE_HEIGHT),
69 | interpolation=cv2.INTER_LINEAR
70 | )
71 | _gt_image_raw = _gt_image.tostring()
72 |
73 | # prepare gt binary image
74 | _gt_binary_image = cv2.imread(gt_binary_images_paths[_index], cv2.IMREAD_UNCHANGED)
75 | if _gt_binary_image.shape != (RESIZE_IMAGE_HEIGHT, RESIZE_IMAGE_WIDTH):
76 | _gt_binary_image = cv2.resize(
77 | _gt_binary_image,
78 | dsize=(RESIZE_IMAGE_WIDTH, RESIZE_IMAGE_HEIGHT),
79 | interpolation=cv2.INTER_NEAREST
80 | )
81 | _gt_binary_image = np.array(_gt_binary_image / 255.0, dtype=np.uint8)
82 | _gt_binary_image_raw = _gt_binary_image.tostring()
83 |
84 | # prepare gt instance image
85 | _gt_instance_image = cv2.imread(gt_instance_images_paths[_index], cv2.IMREAD_UNCHANGED)
86 | if _gt_instance_image.shape != (RESIZE_IMAGE_HEIGHT, RESIZE_IMAGE_WIDTH):
87 | _gt_instance_image = cv2.resize(
88 | _gt_instance_image,
89 | dsize=(RESIZE_IMAGE_WIDTH, RESIZE_IMAGE_HEIGHT),
90 | interpolation=cv2.INTER_NEAREST
91 | )
92 | _gt_instance_image_raw = _gt_instance_image.tostring()
93 |
94 | _example = tf.train.Example(
95 | features=tf.train.Features(
96 | feature={
97 | 'gt_image_raw': bytes_feature(_gt_image_raw),
98 | 'gt_binary_image_raw': bytes_feature(_gt_binary_image_raw),
99 | 'gt_instance_image_raw': bytes_feature(_gt_instance_image_raw)
100 | }))
101 | _writer.write(_example.SerializeToString())
102 |
103 | log.info('Writing {:s} complete'.format(tfrecords_path))
104 |
105 | return
106 |
107 |
108 | def decode(serialized_example):
109 | """
110 | Parses an image and label from the given `serialized_example`
111 | :param serialized_example:
112 | :return:
113 | """
114 | features = tf.parse_single_example(
115 | serialized_example,
116 | # Defaults are not specified since both keys are required.
117 | features={
118 | 'gt_image_raw': tf.FixedLenFeature([], tf.string),
119 | 'gt_binary_image_raw': tf.FixedLenFeature([], tf.string),
120 | 'gt_instance_image_raw': tf.FixedLenFeature([], tf.string)
121 | })
122 |
123 | # decode gt image
124 | gt_image_shape = tf.stack([RESIZE_IMAGE_HEIGHT, RESIZE_IMAGE_WIDTH, 3])
125 | gt_image = tf.decode_raw(features['gt_image_raw'], tf.uint8)
126 | gt_image = tf.reshape(gt_image, gt_image_shape)
127 |
128 | # decode gt binary image
129 | gt_binary_image_shape = tf.stack([RESIZE_IMAGE_HEIGHT, RESIZE_IMAGE_WIDTH, 1])
130 | gt_binary_image = tf.decode_raw(features['gt_binary_image_raw'], tf.uint8)
131 | gt_binary_image = tf.reshape(gt_binary_image, gt_binary_image_shape)
132 |
133 | # decode gt instance image
134 | gt_instance_image_shape = tf.stack([RESIZE_IMAGE_HEIGHT, RESIZE_IMAGE_WIDTH, 1])
135 | gt_instance_image = tf.decode_raw(features['gt_instance_image_raw'], tf.uint8)
136 | gt_instance_image = tf.reshape(gt_instance_image, gt_instance_image_shape)
137 |
138 | return gt_image, gt_binary_image, gt_instance_image
139 |
140 |
141 | def central_crop(image, crop_height, crop_width):
142 | """
143 | Performs central crops of the given image
144 | :param image:
145 | :param crop_height:
146 | :param crop_width:
147 | :return:
148 | """
149 | shape = tf.shape(input=image)
150 | height, width = shape[0], shape[1]
151 |
152 | amount_to_be_cropped_h = (height - crop_height)
153 | crop_top = amount_to_be_cropped_h // 2
154 | amount_to_be_cropped_w = (width - crop_width)
155 | crop_left = amount_to_be_cropped_w // 2
156 |
157 | return tf.slice(image, [crop_top, crop_left, 0], [crop_height, crop_width, -1])
158 |
159 |
160 | def augment_for_train(gt_image, gt_binary_image, gt_instance_image):
161 | """
162 |
163 | :param gt_image:
164 | :param gt_binary_image:
165 | :param gt_instance_image:
166 | :return:
167 | """
168 | # convert image from uint8 to float32
169 | gt_image = tf.cast(gt_image, tf.float32)
170 | gt_binary_image = tf.cast(gt_binary_image, tf.float32)
171 | gt_instance_image = tf.cast(gt_instance_image, tf.float32)
172 |
173 | # apply random color augmentation
174 | gt_image, gt_binary_image, gt_instance_image = random_color_augmentation(
175 | gt_image, gt_binary_image, gt_instance_image
176 | )
177 |
178 | # apply random flip augmentation
179 | gt_image, gt_binary_image, gt_instance_image = random_horizon_flip_batch_images(
180 | gt_image, gt_binary_image, gt_instance_image
181 | )
182 |
183 | # apply random crop image
184 | return random_crop_batch_images(
185 | gt_image=gt_image,
186 | gt_binary_image=gt_binary_image,
187 | gt_instance_image=gt_instance_image,
188 | cropped_size=[CROP_IMAGE_WIDTH, CROP_IMAGE_HEIGHT]
189 | )
190 |
191 |
192 | def augment_for_test(gt_image, gt_binary_image, gt_instance_image):
193 | """
194 |
195 | :param gt_image:
196 | :param gt_binary_image:
197 | :param gt_instance_image:
198 | :return:
199 | """
200 | # apply central crop
201 | gt_image = central_crop(
202 | image=gt_image, crop_height=CROP_IMAGE_HEIGHT, crop_width=CROP_IMAGE_WIDTH
203 | )
204 | gt_binary_image = central_crop(
205 | image=gt_binary_image, crop_height=CROP_IMAGE_HEIGHT, crop_width=CROP_IMAGE_WIDTH
206 | )
207 | gt_instance_image = central_crop(
208 | image=gt_instance_image, crop_height=CROP_IMAGE_HEIGHT, crop_width=CROP_IMAGE_WIDTH
209 | )
210 |
211 | return gt_image, gt_binary_image, gt_instance_image
212 |
213 |
214 | def normalize(gt_image, gt_binary_image, gt_instance_image):
215 | """
216 | Normalize the image data by scaling pixel values to the range [-1.0, 1.0]
217 | :param gt_image:
218 | :param gt_binary_image:
219 | :param gt_instance_image:
220 | :return:
221 | """
222 |
223 | if gt_image.get_shape().as_list()[-1] != 3 \
224 | or gt_binary_image.get_shape().as_list()[-1] != 1 \
225 | or gt_instance_image.get_shape().as_list()[-1] != 1:
226 | log.error(gt_image.get_shape())
227 | log.error(gt_binary_image.get_shape())
228 | log.error(gt_instance_image.get_shape())
229 | raise ValueError('Input must be of size [height, width, C>0]')
230 |
231 | gt_image = tf.subtract(tf.divide(gt_image, tf.constant(127.5, dtype=tf.float32)),
232 | tf.constant(1.0, dtype=tf.float32))
233 |
234 | return gt_image, gt_binary_image, gt_instance_image
235 |
236 |
237 | def random_crop_batch_images(gt_image, gt_binary_image, gt_instance_image, cropped_size):
238 | """
239 | Random crop image batch data for training
240 | :param gt_image:
241 | :param gt_binary_image:
242 | :param gt_instance_image:
243 | :param cropped_size:
244 | :return:
245 | """
246 | concat_images = tf.concat([gt_image, gt_binary_image, gt_instance_image], axis=-1)
247 |
248 | concat_cropped_images = tf.image.random_crop(
249 | concat_images,
250 | [cropped_size[1], cropped_size[0], tf.shape(concat_images)[-1]],
251 | seed=1234
252 | )
253 |
254 | cropped_gt_image = tf.slice(
255 | concat_cropped_images,
256 | begin=[0, 0, 0],
257 | size=[cropped_size[1], cropped_size[0], 3]
258 | )
259 | cropped_gt_binary_image = tf.slice(
260 | concat_cropped_images,
261 | begin=[0, 0, 3],
262 | size=[cropped_size[1], cropped_size[0], 1]
263 | )
264 | cropped_gt_instance_image = tf.slice(
265 | concat_cropped_images,
266 | begin=[0, 0, 4],
267 | size=[cropped_size[1], cropped_size[0], 1]
268 | )
269 |
270 | return cropped_gt_image, cropped_gt_binary_image, cropped_gt_instance_image
271 |
272 |
273 | def random_horizon_flip_batch_images(gt_image, gt_binary_image, gt_instance_image):
274 | """
275 | Random horizon flip image batch data for training
276 | :param gt_image:
277 | :param gt_binary_image:
278 | :param gt_instance_image:
279 | :return:
280 | """
281 | concat_images = tf.concat([gt_image, gt_binary_image, gt_instance_image], axis=-1)
282 |
283 | [image_height, image_width, _] = gt_image.get_shape().as_list()
284 |
285 | concat_flipped_images = tf.image.random_flip_left_right(
286 | image=concat_images,
287 | seed=1
288 | )
289 |
290 | flipped_gt_image = tf.slice(
291 | concat_flipped_images,
292 | begin=[0, 0, 0],
293 | size=[image_height, image_width, 3]
294 | )
295 | flipped_gt_binary_image = tf.slice(
296 | concat_flipped_images,
297 | begin=[0, 0, 3],
298 | size=[image_height, image_width, 1]
299 | )
300 | flipped_gt_instance_image = tf.slice(
301 | concat_flipped_images,
302 | begin=[0, 0, 4],
303 | size=[image_height, image_width, 1]
304 | )
305 |
306 | return flipped_gt_image, flipped_gt_binary_image, flipped_gt_instance_image
307 |
308 |
309 | def random_color_augmentation(gt_image, gt_binary_image, gt_instance_image):
310 | """
311 | Random color augmentation
312 | :param gt_image:
313 | :param gt_binary_image:
314 | :param gt_instance_image:
315 | :return:
316 | """
317 | # first apply random saturation augmentation
318 | gt_image = tf.image.random_saturation(gt_image, 0.8, 1.2)
319 | # second apply random brightness augmentation
320 | gt_image = tf.image.random_brightness(gt_image, 0.05)
321 | # third apply random contrast augmentation
322 | gt_image = tf.image.random_contrast(gt_image, 0.7, 1.3)
323 |
324 | gt_image = tf.clip_by_value(gt_image, 0.0, 255.0)
325 |
326 | return gt_image, gt_binary_image, gt_instance_image
327 |
--------------------------------------------------------------------------------
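Note that normalize() above does not subtract an ImageNet mean; it rescales pixel values to [-1.0, 1.0] by dividing by 127.5 and subtracting 1.0. A small helper like the one below (illustrative, not part of the repo) undoes that scaling when you want to visualize the network input:

```python
import numpy as np


def denormalize_image(normalized_image):
    """Map an image from the [-1.0, 1.0] range back to uint8 [0, 255] for visualization."""
    image = (normalized_image + 1.0) * 127.5
    return np.clip(image, 0, 255).astype(np.uint8)
```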
/LaneDetectionLaneNet/lanenet_model/lanenet.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | """
4 | Author: Mayur Sunil Jawalkar (mj8628)
5 | Kunjan Suresh Mhaske (km1556)
6 |
7 | Implement LaneNet Model
8 | """
9 | import tensorflow as tf
10 |
11 | from LaneDetectionLaneNet.config import global_config
12 | from LaneDetectionLaneNet.lanenet_model import lanenet_back_end
13 | from LaneDetectionLaneNet.lanenet_model import lanenet_front_end
14 | from LaneDetectionLaneNet.semantic_segmentation_zoo import cnn_basenet
15 |
16 | CFG = global_config.cfg
17 |
18 |
19 | class LaneNet(cnn_basenet.CNNBaseModel):
20 | """
21 |
22 | """
23 | def __init__(self, phase, net_flag='vgg', reuse=tf.AUTO_REUSE):
24 | """
26 | Initialize the model with a phase ('train' or 'test') and a frontend flag (currently only 'vgg')
26 | """
27 | super(LaneNet, self).__init__()
28 | self._net_flag = net_flag
29 | self._reuse = reuse
30 |
31 | self._frontend = lanenet_front_end.LaneNetFrondEnd(
32 | phase=phase, net_flag=net_flag
33 | )
34 | self._backend = lanenet_back_end.LaneNetBackEnd(
35 | phase=phase
36 | )
37 |
38 | def inference(self, input_tensor, name):
39 | """
40 | Run frontend feature extraction and the backend to get binary and instance segmentation predictions
41 | :param input_tensor:
42 | :param name:
43 | :return:
44 | """
45 | with tf.variable_scope(name_or_scope=name, reuse=self._reuse):
46 | # first extract image features
47 | extract_feats_result = self._frontend.build_model(
48 | input_tensor=input_tensor,
49 | name='{:s}_frontend'.format(self._net_flag),
50 | reuse=self._reuse
51 | )
52 |
53 | # second apply backend process
54 | binary_seg_prediction, instance_seg_prediction = self._backend.inference(
55 | binary_seg_logits=extract_feats_result['binary_segment_logits']['data'],
56 | instance_seg_logits=extract_feats_result['instance_segment_logits']['data'],
57 | name='{:s}_backend'.format(self._net_flag),
58 | reuse=self._reuse
59 | )
60 |
61 | if not self._reuse:
62 | self._reuse = True
63 |
64 | return binary_seg_prediction, instance_seg_prediction
65 |
66 | def compute_loss(self, input_tensor, binary_label, instance_label, name):
67 | """
68 | calculate lanenet loss for training
69 | :param input_tensor:
70 | :param binary_label:
71 | :param instance_label:
72 | :param name:
73 | :return:
74 | """
75 | with tf.variable_scope(name_or_scope=name, reuse=self._reuse):
76 | # first extract image features
77 | extract_feats_result = self._frontend.build_model(
78 | input_tensor=input_tensor,
79 | name='{:s}_frontend'.format(self._net_flag),
80 | reuse=self._reuse
81 | )
82 |
83 | # second apply backend process
84 | calculated_losses = self._backend.compute_loss(
85 | binary_seg_logits=extract_feats_result['binary_segment_logits']['data'],
86 | binary_label=binary_label,
87 | instance_seg_logits=extract_feats_result['instance_segment_logits']['data'],
88 | instance_label=instance_label,
89 | name='{:s}_backend'.format(self._net_flag),
90 | reuse=self._reuse
91 | )
92 |
93 | if not self._reuse:
94 | self._reuse = True
95 |
96 | return calculated_losses
97 |
--------------------------------------------------------------------------------
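A minimal inference-graph sketch for the LaneNet class above. The input size (1 x 256 x 512 x 3, the resolution the post-processing code rescales from), the variable scope name and the checkpoint path are illustrative assumptions, not values fixed by this file:

import tensorflow as tf

from LaneDetectionLaneNet.lanenet_model import lanenet

input_tensor = tf.placeholder(dtype=tf.float32, shape=[1, 256, 512, 3], name='input_tensor')
net = lanenet.LaneNet(phase='test', net_flag='vgg')
binary_seg_ret, instance_seg_ret = net.inference(input_tensor=input_tensor, name='lanenet_model')

saver = tf.train.Saver()
with tf.Session() as sess:
    saver.restore(sess=sess, save_path='model/tusimple_lanenet.ckpt')  # hypothetical checkpoint path
    # binary_mask, instance_embedding = sess.run(
    #     [binary_seg_ret, instance_seg_ret], feed_dict={input_tensor: preprocessed_batch})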
/LaneDetectionLaneNet/lanenet_model/lanenet_back_end.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # @Time    : 19-4-24 3:54 PM
4 | # @Author : MaybeShewill-CV
5 | # @Site : https://github.com/MaybeShewill-CV/lanenet-lane-detection
6 | # @File : lanenet_back_end.py
7 | # @IDE: PyCharm
8 | """
9 | LaneNet backend branch which is mainly used for binary and instance segmentation loss calculation
10 | """
11 | import tensorflow as tf
12 |
13 | from LaneDetectionLaneNet.config import global_config
14 | from LaneDetectionLaneNet.lanenet_model import lanenet_discriminative_loss
15 | from LaneDetectionLaneNet.semantic_segmentation_zoo import cnn_basenet
16 |
17 | CFG = global_config.cfg
18 |
19 |
20 | class LaneNetBackEnd(cnn_basenet.CNNBaseModel):
21 | """
22 | LaneNet backend branch which is mainly used for binary and instance segmentation loss calculation
23 | """
24 | def __init__(self, phase):
25 | """
26 | init lanenet backend
27 | :param phase: train or test
28 | """
29 | super(LaneNetBackEnd, self).__init__()
30 | self._phase = phase
31 | self._is_training = self._is_net_for_training()
32 |
33 | def _is_net_for_training(self):
34 | """
35 | if the net is used for training or not
36 | :return:
37 | """
38 | if isinstance(self._phase, tf.Tensor):
39 | phase = self._phase
40 | else:
41 | phase = tf.constant(self._phase, dtype=tf.string)
42 |
43 | return tf.equal(phase, tf.constant('train', dtype=tf.string))
44 |
45 | @classmethod
46 | def _compute_class_weighted_cross_entropy_loss(cls, onehot_labels, logits, classes_weights):
47 | """
48 | Softmax cross entropy loss where each pixel is weighted by the weight of its class
49 | :param onehot_labels:
50 | :param logits:
51 | :param classes_weights:
52 | :return:
53 | """
54 | loss_weights = tf.reduce_sum(tf.multiply(onehot_labels, classes_weights), axis=3)
55 |
56 | loss = tf.losses.softmax_cross_entropy(
57 | onehot_labels=onehot_labels,
58 | logits=logits,
59 | weights=loss_weights
60 | )
61 |
62 | return loss
63 |
64 | def compute_loss(self, binary_seg_logits, binary_label,
65 | instance_seg_logits, instance_label,
66 | name, reuse):
67 | """
68 | compute lanenet loss
69 | :param binary_seg_logits:
70 | :param binary_label:
71 | :param instance_seg_logits:
72 | :param instance_label:
73 | :param name:
74 | :param reuse:
75 | :return:
76 | """
77 | with tf.variable_scope(name_or_scope=name, reuse=reuse):
78 | # calculate class weighted binary seg loss
79 | with tf.variable_scope(name_or_scope='binary_seg'):
80 | binary_label_onehot = tf.one_hot(
81 | tf.reshape(
82 | tf.cast(binary_label, tf.int32),
83 | shape=[binary_label.get_shape().as_list()[0],
84 | binary_label.get_shape().as_list()[1],
85 | binary_label.get_shape().as_list()[2]]),
86 | depth=CFG.TRAIN.CLASSES_NUMS,
87 | axis=-1
88 | )
89 |
90 | binary_label_plain = tf.reshape(
91 | binary_label,
92 | shape=[binary_label.get_shape().as_list()[0] *
93 | binary_label.get_shape().as_list()[1] *
94 | binary_label.get_shape().as_list()[2] *
95 | binary_label.get_shape().as_list()[3]])
96 | unique_labels, unique_id, counts = tf.unique_with_counts(binary_label_plain)
97 | counts = tf.cast(counts, tf.float32)
98 | inverse_weights = tf.divide(
99 | 1.0,
100 | tf.log(tf.add(tf.divide(counts, tf.reduce_sum(counts)), tf.constant(1.02)))
101 | )
102 |
103 | binary_segmentation_loss = self._compute_class_weighted_cross_entropy_loss(
104 | onehot_labels=binary_label_onehot,
105 | logits=binary_seg_logits,
106 | classes_weights=inverse_weights
107 | )
108 |
109 | # calculate class weighted instance seg loss
110 | with tf.variable_scope(name_or_scope='instance_seg'):
111 |
112 | pix_bn = self.layerbn(
113 | inputdata=instance_seg_logits, is_training=self._is_training, name='pix_bn')
114 | pix_relu = self.relu(inputdata=pix_bn, name='pix_relu')
115 | pix_embedding = self.conv2d(
116 | inputdata=pix_relu,
117 | out_channel=CFG.TRAIN.EMBEDDING_FEATS_DIMS,
118 | kernel_size=1,
119 | use_bias=False,
120 | name='pix_embedding_conv'
121 | )
122 | pix_image_shape = (pix_embedding.get_shape().as_list()[1], pix_embedding.get_shape().as_list()[2])
123 | instance_segmentation_loss, l_var, l_dist, l_reg = \
124 | lanenet_discriminative_loss.discriminative_loss(
125 | pix_embedding, instance_label, CFG.TRAIN.EMBEDDING_FEATS_DIMS,
126 | pix_image_shape, 0.5, 3.0, 1.0, 1.0, 0.001
127 | )
128 |
129 | l2_reg_loss = tf.constant(0.0, tf.float32)
130 | for vv in tf.trainable_variables():
131 | if 'bn' in vv.name or 'gn' in vv.name:
132 | continue
133 | else:
134 | l2_reg_loss = tf.add(l2_reg_loss, tf.nn.l2_loss(vv))
135 | l2_reg_loss *= 0.001
136 | total_loss = binary_segmentation_loss + instance_segmentation_loss + l2_reg_loss
137 |
138 | ret = {
139 | 'total_loss': total_loss,
140 | 'binary_seg_logits': binary_seg_logits,
141 | 'instance_seg_logits': pix_embedding,
142 | 'binary_seg_loss': binary_segmentation_loss,
143 | 'discriminative_loss': instance_segmentation_loss
144 | }
145 |
146 | return ret
147 |
148 | def inference(self, binary_seg_logits, instance_seg_logits, name, reuse):
149 | """
150 | Produce the binary segmentation prediction and the pixel embedding used for instance segmentation
151 | :param binary_seg_logits:
152 | :param instance_seg_logits:
153 | :param name:
154 | :param reuse:
155 | :return:
156 | """
157 | with tf.variable_scope(name_or_scope=name, reuse=reuse):
158 |
159 | with tf.variable_scope(name_or_scope='binary_seg'):
160 | binary_seg_score = tf.nn.softmax(logits=binary_seg_logits)
161 | binary_seg_prediction = tf.argmax(binary_seg_score, axis=-1)
162 |
163 | with tf.variable_scope(name_or_scope='instance_seg'):
164 |
165 | pix_bn = self.layerbn(
166 | inputdata=instance_seg_logits, is_training=self._is_training, name='pix_bn')
167 | pix_relu = self.relu(inputdata=pix_bn, name='pix_relu')
168 | instance_seg_prediction = self.conv2d(
169 | inputdata=pix_relu,
170 | out_channel=CFG.TRAIN.EMBEDDING_FEATS_DIMS,
171 | kernel_size=1,
172 | use_bias=False,
173 | name='pix_embedding_conv'
174 | )
175 |
176 | return binary_seg_prediction, instance_seg_prediction
177 |
--------------------------------------------------------------------------------
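For reference, the inverse class weights built in compute_loss above follow a bounded inverse log-frequency scheme; restated in LaTeX (this is a transcription of the code, not an addition to it):

w_c = \frac{1}{\ln\left(\frac{n_c}{\sum_k n_k} + 1.02\right)}

where n_c is the pixel count of class c in the batch. The 1.02 offset keeps the weight finite for very rare classes, capping it at roughly 1 / ln(1.02) ≈ 50.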
/LaneDetectionLaneNet/lanenet_model/lanenet_discriminative_loss.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # @Time    : 18-5-11 3:48 PM
4 | # @Author : MaybeShewill-CV
5 | # @Site : https://github.com/MaybeShewill-CV/lanenet-lane-detection
6 | # @File : lanenet_discriminative_loss.py
7 | # @IDE: PyCharm Community Edition
8 | """
9 | Discriminative Loss for instance segmentation
10 | """
11 | import tensorflow as tf
12 |
13 |
14 | def discriminative_loss_single(
15 | prediction,
16 | correct_label,
17 | feature_dim,
18 | label_shape,
19 | delta_v,
20 | delta_d,
21 | param_var,
22 | param_dist,
23 | param_reg):
24 | """
25 | discriminative loss
26 | :param prediction: inference of network
27 | :param correct_label: instance label
28 | :param feature_dim: feature dimension of prediction
29 | :param label_shape: shape of label
30 | :param delta_v: cut off variance distance
31 | :param delta_d: cut off cluster distance
32 | :param param_var: weight for intra cluster variance
33 | :param param_dist: weight for inter cluster distances
34 | :param param_reg: weight regularization
35 | """
36 | correct_label = tf.reshape(
37 | correct_label, [label_shape[1] * label_shape[0]]
38 | )
39 | reshaped_pred = tf.reshape(
40 | prediction, [label_shape[1] * label_shape[0], feature_dim]
41 | )
42 |
43 | # calculate instance nums
44 | unique_labels, unique_id, counts = tf.unique_with_counts(correct_label)
45 | counts = tf.cast(counts, tf.float32)
46 | num_instances = tf.size(unique_labels)
47 |
48 | # calculate instance pixel embedding mean vec
49 | segmented_sum = tf.unsorted_segment_sum(
50 | reshaped_pred, unique_id, num_instances)
51 | mu = tf.div(segmented_sum, tf.reshape(counts, (-1, 1)))
52 | mu_expand = tf.gather(mu, unique_id)
53 |
54 | distance = tf.norm(tf.subtract(mu_expand, reshaped_pred), axis=1, ord=1)
55 | distance = tf.subtract(distance, delta_v)
56 | distance = tf.clip_by_value(distance, 0., distance)
57 | distance = tf.square(distance)
58 |
59 | l_var = tf.unsorted_segment_sum(distance, unique_id, num_instances)
60 | l_var = tf.div(l_var, counts)
61 | l_var = tf.reduce_sum(l_var)
62 | l_var = tf.divide(l_var, tf.cast(num_instances, tf.float32))
63 |
64 | mu_interleaved_rep = tf.tile(mu, [num_instances, 1])
65 | mu_band_rep = tf.tile(mu, [1, num_instances])
66 | mu_band_rep = tf.reshape(
67 | mu_band_rep,
68 | (num_instances *
69 | num_instances,
70 | feature_dim))
71 |
72 | mu_diff = tf.subtract(mu_band_rep, mu_interleaved_rep)
73 |
74 | intermediate_tensor = tf.reduce_sum(tf.abs(mu_diff), axis=1)
75 | zero_vector = tf.zeros(1, dtype=tf.float32)
76 | bool_mask = tf.not_equal(intermediate_tensor, zero_vector)
77 | mu_diff_bool = tf.boolean_mask(mu_diff, bool_mask)
78 |
79 | mu_norm = tf.norm(mu_diff_bool, axis=1, ord=1)
80 | mu_norm = tf.subtract(2. * delta_d, mu_norm)
81 | mu_norm = tf.clip_by_value(mu_norm, 0., mu_norm)
82 | mu_norm = tf.square(mu_norm)
83 |
84 | l_dist = tf.reduce_mean(mu_norm)
85 |
86 | l_reg = tf.reduce_mean(tf.norm(mu, axis=1, ord=1))
87 |
88 | param_scale = 1.
89 | l_var = param_var * l_var
90 | l_dist = param_dist * l_dist
91 | l_reg = param_reg * l_reg
92 |
93 | loss = param_scale * (l_var + l_dist + l_reg)
94 |
95 | return loss, l_var, l_dist, l_reg
96 |
97 |
98 | def discriminative_loss(prediction, correct_label, feature_dim, image_shape,
99 | delta_v, delta_d, param_var, param_dist, param_reg):
100 | """
101 | Batch-wise discriminative loss, computed by looping over the batch with tf.while_loop
102 | :return: discriminative loss and its three components
103 | """
104 |
105 | def cond(label, batch, out_loss, out_var, out_dist, out_reg, i):
106 | return tf.less(i, tf.shape(batch)[0])
107 |
108 | def body(label, batch, out_loss, out_var, out_dist, out_reg, i):
109 | disc_loss, l_var, l_dist, l_reg = discriminative_loss_single(
110 | prediction[i], correct_label[i], feature_dim, image_shape, delta_v, delta_d, param_var, param_dist, param_reg)
111 |
112 | out_loss = out_loss.write(i, disc_loss)
113 | out_var = out_var.write(i, l_var)
114 | out_dist = out_dist.write(i, l_dist)
115 | out_reg = out_reg.write(i, l_reg)
116 |
117 | return label, batch, out_loss, out_var, out_dist, out_reg, i + 1
118 |
119 | # TensorArray is a data structure that supports dynamic writes
120 | output_ta_loss = tf.TensorArray(
121 | dtype=tf.float32, size=0, dynamic_size=True)
122 | output_ta_var = tf.TensorArray(
123 | dtype=tf.float32, size=0, dynamic_size=True)
124 | output_ta_dist = tf.TensorArray(
125 | dtype=tf.float32, size=0, dynamic_size=True)
126 | output_ta_reg = tf.TensorArray(
127 | dtype=tf.float32, size=0, dynamic_size=True)
128 |
129 | _, _, out_loss_op, out_var_op, out_dist_op, out_reg_op, _ = tf.while_loop(
130 | cond, body, [
131 | correct_label, prediction, output_ta_loss, output_ta_var, output_ta_dist, output_ta_reg, 0])
132 | out_loss_op = out_loss_op.stack()
133 | out_var_op = out_var_op.stack()
134 | out_dist_op = out_dist_op.stack()
135 | out_reg_op = out_reg_op.stack()
136 |
137 | disc_loss = tf.reduce_mean(out_loss_op)
138 | l_var = tf.reduce_mean(out_var_op)
139 | l_dist = tf.reduce_mean(out_dist_op)
140 | l_reg = tf.reduce_mean(out_reg_op)
141 |
142 | return disc_loss, l_var, l_dist, l_reg
143 |
--------------------------------------------------------------------------------
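Written out, discriminative_loss_single above implements the discriminative loss of De Brabandere et al. (2017) with L1 distances. With C clusters, N_c pixels in cluster c, embeddings x_i, cluster means \mu_c, and the hinge [z]_+ = \max(z, 0):

L_{var}  = \frac{1}{C} \sum_{c=1}^{C} \frac{1}{N_c} \sum_{i=1}^{N_c} \big[\, \lVert \mu_c - x_i \rVert_1 - \delta_v \,\big]_+^2
L_{dist} = \frac{1}{C(C-1)} \sum_{c_A \neq c_B} \big[\, 2\delta_d - \lVert \mu_{c_A} - \mu_{c_B} \rVert_1 \,\big]_+^2
L_{reg}  = \frac{1}{C} \sum_{c=1}^{C} \lVert \mu_c \rVert_1
L = \text{param\_var} \cdot L_{var} + \text{param\_dist} \cdot L_{dist} + \text{param\_reg} \cdot L_{reg}

lanenet_back_end.py calls this with \delta_v = 0.5, \delta_d = 3.0 and weights 1.0, 1.0, 0.001.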
/LaneDetectionLaneNet/lanenet_model/lanenet_front_end.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # @Time    : 19-4-24 3:53 PM
4 | # @Author : MaybeShewill-CV
5 | # @Site : https://github.com/MaybeShewill-CV/lanenet-lane-detection
6 | # @File : lanenet_front_end.py
7 | # @IDE: PyCharm
8 | """
9 | LaneNet frontend branch which is mainly used for feature extraction
10 | """
11 | from LaneDetectionLaneNet.semantic_segmentation_zoo import cnn_basenet
12 | from LaneDetectionLaneNet.semantic_segmentation_zoo import vgg16_based_fcn
13 |
14 |
15 | class LaneNetFrondEnd(cnn_basenet.CNNBaseModel):
16 | """
17 | LaneNet frontend which is used to extract image features for the subsequent backend processing
18 | """
19 | def __init__(self, phase, net_flag):
20 | """
21 | Select the frontend network according to net_flag (currently only 'vgg')
22 | """
23 | super(LaneNetFrondEnd, self).__init__()
24 |
25 | self._frontend_net_map = {
26 | 'vgg': vgg16_based_fcn.VGG16FCN(phase=phase)
27 | }
28 |
29 | self._net = self._frontend_net_map[net_flag]
30 |
31 | def build_model(self, input_tensor, name, reuse):
32 | """
33 | Build the selected frontend network on top of the input tensor
34 | :param input_tensor:
35 | :param name:
36 | :param reuse:
37 | :return:
38 | """
39 |
40 | return self._net.build_model(
41 | input_tensor=input_tensor,
42 | name=name,
43 | reuse=reuse
44 | )
45 |
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/lanenet_model/lanenet_postprocess.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # @Time    : 18-5-30 10:04 AM
4 | # @Author : MaybeShewill-CV
5 | # @Site : https://github.com/MaybeShewill-CV/lanenet-lane-detection
6 | # @File : lanenet_postprocess.py
7 | # @IDE: PyCharm Community Edition
8 | """
9 | LaneNet model post process
10 | """
11 | import os.path as ops
12 | import math
13 |
14 | import cv2
15 | import glog as log
16 | import numpy as np
17 | from sklearn.cluster import DBSCAN
18 | from sklearn.preprocessing import StandardScaler
19 |
20 | from LaneDetectionLaneNet.config import global_config
21 |
22 | CFG = global_config.cfg
23 |
24 |
25 | def _morphological_process(image, kernel_size=5):
26 | """
27 | morphological process to fill the holes in the binary segmentation result
28 | :param image:
29 | :param kernel_size:
30 | :return:
31 | """
32 | if len(image.shape) == 3:
33 | raise ValueError('Binary segmentation result image should be a single channel image')
34 |
35 | if image.dtype != np.uint8:
36 | image = np.array(image, np.uint8)
37 |
38 | kernel = cv2.getStructuringElement(shape=cv2.MORPH_ELLIPSE, ksize=(kernel_size, kernel_size))
39 |
40 | # the closing operation fills holes
41 | closing = cv2.morphologyEx(image, cv2.MORPH_CLOSE, kernel, iterations=1)
42 |
43 | return closing
44 |
45 |
46 | def _connect_components_analysis(image):
47 | """
48 | connected components analysis to remove small components
49 | :param image:
50 | :return:
51 | """
52 | if len(image.shape) == 3:
53 | gray_image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
54 | else:
55 | gray_image = image
56 |
57 | return cv2.connectedComponentsWithStats(gray_image, connectivity=8, ltype=cv2.CV_32S)
58 |
59 |
60 | class _LaneFeat(object):
61 | """
62 | Container for a single lane's embedding features and pixel coordinates
63 | """
64 | def __init__(self, feat, coord, class_id=-1):
65 | """
66 | lane feat object
67 | :param feat: lane embedding feats [feature_1, feature_2, ...]
68 | :param coord: lane coordinates [x, y]
69 | :param class_id: lane class id
70 | """
71 | self._feat = feat
72 | self._coord = coord
73 | self._class_id = class_id
74 |
75 | @property
76 | def feat(self):
77 | """
78 |
79 | :return:
80 | """
81 | return self._feat
82 |
83 | @feat.setter
84 | def feat(self, value):
85 | """
86 |
87 | :param value:
88 | :return:
89 | """
90 | if not isinstance(value, np.ndarray):
91 | value = np.array(value, dtype=np.float64)
92 |
93 | if value.dtype != np.float64:
94 | value = np.array(value, dtype=np.float64)
95 |
96 | self._feat = value
97 |
98 | @property
99 | def coord(self):
100 | """
101 |
102 | :return:
103 | """
104 | return self._coord
105 |
106 | @coord.setter
107 | def coord(self, value):
108 | """
109 |
110 | :param value:
111 | :return:
112 | """
113 | if not isinstance(value, np.ndarray):
114 | value = np.array(value)
115 |
116 | if value.dtype != np.int32:
117 | value = np.array(value, dtype=np.int32)
118 |
119 | self._coord = value
120 |
121 | @property
122 | def class_id(self):
123 | """
124 |
125 | :return:
126 | """
127 | return self._class_id
128 |
129 | @class_id.setter
130 | def class_id(self, value):
131 | """
132 |
133 | :param value:
134 | :return:
135 | """
136 | if not isinstance(value, (int, np.integer)):
137 | raise ValueError('Class id must be integer')
138 |
139 | self._class_id = value
140 |
141 |
142 | class _LaneNetCluster(object):
143 | """
144 | Instance segmentation result cluster
145 | """
146 |
147 | def __init__(self):
148 | """
149 | Color map used to draw each clustered lane instance
150 | """
151 | self._color_map = [np.array([255, 0, 0]),
152 | np.array([0, 255, 0]),
153 | np.array([0, 0, 255]),
154 | np.array([125, 125, 0]),
155 | np.array([0, 125, 125]),
156 | np.array([125, 0, 125]),
157 | np.array([50, 100, 50]),
158 | np.array([100, 50, 100])]
159 |
160 | @staticmethod
161 | def _embedding_feats_dbscan_cluster(embedding_image_feats):
162 | """
163 | dbscan cluster
164 | :param embedding_image_feats:
165 | :return:
166 | """
167 | db = DBSCAN(eps=CFG.POSTPROCESS.DBSCAN_EPS, min_samples=CFG.POSTPROCESS.DBSCAN_MIN_SAMPLES)
168 | try:
169 | features = StandardScaler().fit_transform(embedding_image_feats)
170 | db.fit(features)
171 | except Exception as err:
172 | log.error(err)
173 | ret = {
174 | 'origin_features': None,
175 | 'cluster_nums': 0,
176 | 'db_labels': None,
177 | 'unique_labels': None,
178 | 'cluster_center': None
179 | }
180 | return ret
181 | db_labels = db.labels_
182 | unique_labels = np.unique(db_labels)
183 |
184 | num_clusters = len(unique_labels)
185 | cluster_centers = db.components_
186 |
187 | ret = {
188 | 'origin_features': features,
189 | 'cluster_nums': num_clusters,
190 | 'db_labels': db_labels,
191 | 'unique_labels': unique_labels,
192 | 'cluster_center': cluster_centers
193 | }
194 |
195 | return ret
196 |
197 | @staticmethod
198 | def _get_lane_embedding_feats(binary_seg_ret, instance_seg_ret):
199 | """
200 | get lane embedding features according to the binary seg result
201 | :param binary_seg_ret:
202 | :param instance_seg_ret:
203 | :return:
204 | """
205 | idx = np.where(binary_seg_ret == 255)
206 | lane_embedding_feats = instance_seg_ret[idx]
207 | # idx_scale = np.vstack((idx[0] / 256.0, idx[1] / 512.0)).transpose()
208 | # lane_embedding_feats = np.hstack((lane_embedding_feats, idx_scale))
209 | lane_coordinate = np.vstack((idx[1], idx[0])).transpose()
210 |
211 | assert lane_embedding_feats.shape[0] == lane_coordinate.shape[0]
212 |
213 | ret = {
214 | 'lane_embedding_feats': lane_embedding_feats,
215 | 'lane_coordinates': lane_coordinate
216 | }
217 |
218 | return ret
219 |
220 | def apply_lane_feats_cluster(self, binary_seg_result, instance_seg_result):
221 | """
222 | Cluster the lane embedding features with DBSCAN and build a colored lane mask
223 | :param binary_seg_result:
224 | :param instance_seg_result:
225 | :return:
226 | """
227 | # get embedding feats and coords
228 | get_lane_embedding_feats_result = self._get_lane_embedding_feats(
229 | binary_seg_ret=binary_seg_result,
230 | instance_seg_ret=instance_seg_result
231 | )
232 |
233 | # dbscan cluster
234 | dbscan_cluster_result = self._embedding_feats_dbscan_cluster(
235 | embedding_image_feats=get_lane_embedding_feats_result['lane_embedding_feats']
236 | )
237 |
238 | mask = np.zeros(shape=[binary_seg_result.shape[0], binary_seg_result.shape[1], 3], dtype=np.uint8)
239 | db_labels = dbscan_cluster_result['db_labels']
240 | unique_labels = dbscan_cluster_result['unique_labels']
241 | coord = get_lane_embedding_feats_result['lane_coordinates']
242 |
243 | if db_labels is None:
244 | return None, None
245 |
246 | lane_coords = []
247 |
248 | for index, label in enumerate(unique_labels.tolist()):
249 | if label == -1:
250 | continue
251 | idx = np.where(db_labels == label)
252 | pix_coord_idx = tuple((coord[idx][:, 1], coord[idx][:, 0]))
253 | mask[pix_coord_idx] = self._color_map[index]
254 | lane_coords.append(coord[idx])
255 |
256 | return mask, lane_coords
257 |
258 |
259 | class LaneNetPostProcessor(object):
260 | """
261 | lanenet post process for lane generation
262 | """
263 | def __init__(self, ipm_remap_file_path='./LaneDetectionLaneNet/data/tusimple_ipm_remap.yml'):
264 | """
265 |
266 | :param ipm_remap_file_path: ipm generate file path
267 | """
268 | assert ops.exists(ipm_remap_file_path), '{:s} not exist'.format(ipm_remap_file_path)
269 |
270 | self._cluster = _LaneNetCluster()
271 | self._ipm_remap_file_path = ipm_remap_file_path
272 |
273 | remap_file_load_ret = self._load_remap_matrix()
274 | self._remap_to_ipm_x = remap_file_load_ret['remap_to_ipm_x']
275 | self._remap_to_ipm_y = remap_file_load_ret['remap_to_ipm_y']
276 |
277 | self._color_map = [np.array([255, 0, 0]),
278 | np.array([0, 255, 0]),
279 | np.array([0, 0, 255]),
280 | np.array([125, 125, 0]),
281 | np.array([0, 125, 125]),
282 | np.array([125, 0, 125]),
283 | np.array([50, 100, 50]),
284 | np.array([100, 50, 100])]
285 |
286 | def _load_remap_matrix(self):
287 | """
288 | Load the inverse perspective mapping remap matrices from the yml file
289 | :return:
290 | """
291 | fs = cv2.FileStorage(self._ipm_remap_file_path, cv2.FILE_STORAGE_READ)
292 |
293 | remap_to_ipm_x = fs.getNode('remap_ipm_x').mat()
294 | remap_to_ipm_y = fs.getNode('remap_ipm_y').mat()
295 |
296 | ret = {
297 | 'remap_to_ipm_x': remap_to_ipm_x,
298 | 'remap_to_ipm_y': remap_to_ipm_y,
299 | }
300 |
301 | fs.release()
302 |
303 | return ret
304 |
305 | def postprocess(self, binary_seg_result, instance_seg_result=None,
306 | min_area_threshold=100, source_image=None,
307 | data_source='tusimple'):
308 | """
309 | Full post processing: morphology, connected component filtering, DBSCAN clustering and lane curve fitting
310 | :param binary_seg_result:
311 | :param instance_seg_result:
312 | :param min_area_threshold:
313 | :param source_image:
314 | :param data_source:
315 | :return:
316 | """
317 | # convert binary_seg_result
318 | binary_seg_result = np.array(binary_seg_result * 255, dtype=np.uint8)
319 |
320 | # apply an image morphology operation to fill in holes and remove small areas
321 | morphological_ret = _morphological_process(binary_seg_result, kernel_size=5)
322 |
323 | connect_components_analysis_ret = _connect_components_analysis(image=morphological_ret)
324 |
325 | labels = connect_components_analysis_ret[1]
326 | stats = connect_components_analysis_ret[2]
327 | for index, stat in enumerate(stats):
328 | if stat[4] <= min_area_threshold:
329 | idx = np.where(labels == index)
330 | morphological_ret[idx] = 0
331 |
332 | # apply embedding features cluster
333 | mask_image, lane_coords = self._cluster.apply_lane_feats_cluster(
334 | binary_seg_result=morphological_ret,
335 | instance_seg_result=instance_seg_result
336 | )
337 |
338 | if mask_image is None:
339 | return {
340 | 'mask_image': None,
341 | 'fit_params': None,
342 | 'source_image': None,
343 | }
344 |
345 | # lane line fit
346 | fit_params = []
347 | src_lane_pts = [] # lane pts every single lane
348 | for lane_index, coords in enumerate(lane_coords):
349 | if data_source == 'tusimple':
350 | tmp_mask = np.zeros(shape=(720, 1280), dtype=np.uint8)
351 | tmp_mask[tuple((np.int_(coords[:, 1] * 720 / 256), np.int_(coords[:, 0] * 1280 / 512)))] = 255
352 | elif data_source == 'beec_ccd':
353 | tmp_mask = np.zeros(shape=(1350, 2448), dtype=np.uint8)
354 | tmp_mask[tuple((np.int_(coords[:, 1] * 1350 / 256), np.int_(coords[:, 0] * 2448 / 512)))] = 255
355 | else:
356 | raise ValueError('Wrong data source, only tusimple and beec_ccd are supported')
357 | tmp_ipm_mask = cv2.remap(
358 | tmp_mask,
359 | self._remap_to_ipm_x,
360 | self._remap_to_ipm_y,
361 | interpolation=cv2.INTER_NEAREST
362 | )
363 | nonzero_y = np.array(tmp_ipm_mask.nonzero()[0])
364 | nonzero_x = np.array(tmp_ipm_mask.nonzero()[1])
365 |
366 | fit_param = np.polyfit(nonzero_y, nonzero_x, 2)
367 | fit_params.append(fit_param)
368 |
369 | [ipm_image_height, ipm_image_width] = tmp_ipm_mask.shape
370 | plot_y = np.linspace(10, ipm_image_height, ipm_image_height - 10)
371 | fit_x = fit_param[0] * plot_y ** 2 + fit_param[1] * plot_y + fit_param[2]
372 | # fit_x = fit_param[0] * plot_y ** 3 + fit_param[1] * plot_y ** 2 + fit_param[2] * plot_y + fit_param[3]
373 |
374 | lane_pts = []
375 | for index in range(0, plot_y.shape[0], 5):
376 | src_x = self._remap_to_ipm_x[
377 | int(plot_y[index]), int(np.clip(fit_x[index], 0, ipm_image_width - 1))]
378 | if src_x <= 0:
379 | continue
380 | src_y = self._remap_to_ipm_y[
381 | int(plot_y[index]), int(np.clip(fit_x[index], 0, ipm_image_width - 1))]
382 | src_y = src_y if src_y > 0 else 0
383 |
384 | lane_pts.append([src_x, src_y])
385 |
386 | src_lane_pts.append(lane_pts)
387 |
388 | # tusimple test data samples points along the y axis every 10 pixels
389 | source_image_width = source_image.shape[1]
390 | for index, single_lane_pts in enumerate(src_lane_pts):
391 | single_lane_pt_x = np.array(single_lane_pts, dtype=np.float32)[:, 0]
392 | single_lane_pt_y = np.array(single_lane_pts, dtype=np.float32)[:, 1]
393 | if data_source == 'tusimple':
394 | start_plot_y = 240
395 | end_plot_y = 720
396 | elif data_source == 'beec_ccd':
397 | start_plot_y = 820
398 | end_plot_y = 1350
399 | else:
400 | raise ValueError('Wrong data source, only tusimple and beec_ccd are supported')
401 | step = int(math.floor((end_plot_y - start_plot_y) / 10))
402 | for plot_y in np.linspace(start_plot_y, end_plot_y, step):
403 | diff = single_lane_pt_y - plot_y
404 | fake_diff_bigger_than_zero = diff.copy()
405 | fake_diff_smaller_than_zero = diff.copy()
406 | fake_diff_bigger_than_zero[np.where(diff <= 0)] = float('inf')
407 | fake_diff_smaller_than_zero[np.where(diff > 0)] = float('-inf')
408 | idx_low = np.argmax(fake_diff_smaller_than_zero)
409 | idx_high = np.argmin(fake_diff_bigger_than_zero)
410 |
411 | previous_src_pt_x = single_lane_pt_x[idx_low]
412 | previous_src_pt_y = single_lane_pt_y[idx_low]
413 | last_src_pt_x = single_lane_pt_x[idx_high]
414 | last_src_pt_y = single_lane_pt_y[idx_high]
415 |
416 | if previous_src_pt_y < start_plot_y or last_src_pt_y < start_plot_y or \
417 | fake_diff_smaller_than_zero[idx_low] == float('-inf') or \
418 | fake_diff_bigger_than_zero[idx_high] == float('inf'):
419 | continue
420 |
421 | interpolation_src_pt_x = (abs(previous_src_pt_y - plot_y) * previous_src_pt_x +
422 | abs(last_src_pt_y - plot_y) * last_src_pt_x) / \
423 | (abs(previous_src_pt_y - plot_y) + abs(last_src_pt_y - plot_y))
424 | interpolation_src_pt_y = (abs(previous_src_pt_y - plot_y) * previous_src_pt_y +
425 | abs(last_src_pt_y - plot_y) * last_src_pt_y) / \
426 | (abs(previous_src_pt_y - plot_y) + abs(last_src_pt_y - plot_y))
427 |
428 | if interpolation_src_pt_x > source_image_width or interpolation_src_pt_x < 10:
429 | continue
430 |
431 | lane_color = self._color_map[index].tolist()
432 | cv2.circle(source_image, (int(interpolation_src_pt_x),
433 | int(interpolation_src_pt_y)), 5, lane_color, -1)
434 | ret = {
435 | 'mask_image': mask_image,
436 | 'fit_params': fit_params,
437 | 'source_image': source_image,
438 | }
439 |
440 | return ret
441 |
--------------------------------------------------------------------------------
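A minimal usage sketch for the post-processor above. The two segmentation arrays stand in for the network outputs (binary mask with lane pixels set to 1, and the pixel embedding map), the constructor's default remap yml must exist on disk, and all variable names here are placeholders:

from LaneDetectionLaneNet.lanenet_model import lanenet_postprocess

postprocessor = lanenet_postprocess.LaneNetPostProcessor()

# binary_seg_image: H x W array with lane pixels set to 1 (postprocess() scales it to 255)
# instance_seg_image: H x W x EMBEDDING_FEATS_DIMS pixel embedding from the backend
postprocess_result = postprocessor.postprocess(
    binary_seg_result=binary_seg_image,
    instance_seg_result=instance_seg_image,
    source_image=source_image,  # original BGR frame, e.g. 720x1280 for tusimple
    data_source='tusimple'
)
mask_image = postprocess_result['mask_image']    # colored cluster mask
overlay = postprocess_result['source_image']     # source frame with fitted lane points drawn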
/LaneDetectionLaneNet/mnn_project/__init__.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # @Time    : 2019/11/5 5:03 PM
4 | # @Author : LuoYao
5 | # @Site : ICode
6 | # @File    : __init__.py
7 | # @IDE: PyCharm
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/mnn_project/config.ini:
--------------------------------------------------------------------------------
1 | [LaneNet]
2 | # model file path
3 | model_file_path=~/MNN-0.2.1.0/beec_task/lane_detection/model/lanenet_model.mnn
4 | # pixel embedding feature dims
5 | pix_embedding_feature_dims=4
6 | # dbscan neighborhood radius (eps) threshold
7 | dbscan_neighbor_radius=0.4
8 | # minimum number of samples for a dbscan core point
9 | dbscan_core_object_min_pts=500
10 |
--------------------------------------------------------------------------------
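The same INI file can be read from Python with the standard library, which is a quick way to confirm the values the C++ parser below will see (a sketch, not part of the repo; the path is assumed relative to the project root):

import configparser

cfg = configparser.ConfigParser()
cfg.read('LaneDetectionLaneNet/mnn_project/config.ini')

model_path = cfg['LaneNet']['model_file_path']
embedding_dims = cfg['LaneNet'].getint('pix_embedding_feature_dims')   # 4
dbscan_eps = cfg['LaneNet'].getfloat('dbscan_neighbor_radius')         # 0.4
dbscan_min_pts = cfg['LaneNet'].getint('dbscan_core_object_min_pts')   # 500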
/LaneDetectionLaneNet/mnn_project/config_parser.cpp:
--------------------------------------------------------------------------------
1 | /************************************************
2 | * Author: MaybeShewill-CV
3 | * File: configParser.cpp
4 | * Date: 2019/10/10 10:39 AM
5 | ************************************************/
6 |
7 | #include "config_parser.h"
8 |
9 | #include <fstream>
10 | #include <sstream>
11 | #include <string>
12 | #include <algorithm>
13 | #include <cctype>
14 | #include <stdexcept>
15 |
16 | namespace beec {
17 | namespace config_parse_utils {
18 |
19 | ConfigParser::ConfigParser(const std::string &filename) {
20 |
21 | std::ifstream fin(filename);
22 |
23 | if (fin.good()) {
24 | std::string line;
25 | std::string current_header = "";
26 | while (std::getline(fin, line)) {
27 | trim(line);
28 |
29 | // Skip empty lines
30 | if (line.size() == 0)
31 | continue;
32 |
33 | switch (line[0]) {
34 | case '#':
35 | case ';':
36 | // Ignore comments
37 | break;
38 | case '[':
39 | // Section header
40 | current_header = read_header(line);
41 | break;
42 | default:
43 | // Everything else will be configurations
44 | read_configuration(line, current_header);
45 | }
46 | }
47 | fin.close();
48 | } else {
49 | throw std::runtime_error("File `" + filename + "` does not exist");
50 | }
51 | }
52 |
53 | std::map<std::string, std::string> ConfigParser::get_section(const std::string &section_name) const {
54 |
55 | if (_m_sections.count(section_name) == 0) {
56 | std::string error = "No such key: `" + section_name + "`";
57 | throw std::out_of_range(error);
58 | }
59 | return _m_sections.at(section_name);
60 | }
61 |
62 | std::map<std::string, std::string> ConfigParser::operator[](const std::string &section_name) const {
63 |
64 | if (_m_sections.count(section_name) == 0) {
65 | std::string error = "No such key: `" + section_name + "`";
66 | throw std::out_of_range(error);
67 | }
68 | return _m_sections.at(section_name);
69 | }
70 |
71 | void ConfigParser::dump(FILE *log_file) {
72 |
73 | // Set up iterators
74 | std::map<std::string, std::string>::iterator itr1;
75 | std::map<std::string, std::map<std::string, std::string> >::iterator itr2;
76 | for (itr2 = _m_sections.begin(); itr2 != _m_sections.end(); itr2++) {
77 | fprintf(log_file, "[%s]\n", itr2->first.c_str());
78 | for (itr1 = itr2->second.begin(); itr1 != itr2->second.end(); itr1++) {
79 | fprintf(log_file, "%s=%s\n", itr1->first.c_str(), itr1->second.c_str());
80 | }
81 | }
82 | }
83 |
84 | std::string ConfigParser::read_header(const std::string &line) {
85 |
86 | if (line[line.size() - 1] != ']')
87 | throw std::runtime_error("Invalid section header: `" + line + "`");
88 | return trim_copy(line.substr(1, line.size() - 2));
89 | }
90 |
91 | void ConfigParser::read_configuration(const std::string &line, const std::string &header) {
92 | if (header == "") {
93 | std::string error = "No section provided for: `" + line + "`";
94 | throw std::runtime_error(error);
95 | }
96 |
97 | if (line.find('=') == std::string::npos) {
98 | std::string error = "Invalid configuration: `" + line + "`";
99 | throw std::runtime_error(error);
100 | }
101 |
102 | std::istringstream iss(line);
103 | std::string key;
104 | std::string val;
105 | std::getline(iss, key, '=');
106 |
107 | if (key.size() == 0) {
108 | std::string error = "No key found in configuration: `" + line + "`";
109 | throw std::runtime_error(error);
110 | }
111 |
112 | std::getline(iss, val);
113 |
114 | _m_sections[header][trim_copy(key)] = trim_copy(val);
115 | }
116 |
117 | // trim from start (in place)
118 | void ConfigParser::ltrim(std::string &s) {
119 | s.erase(s.begin(), std::find_if(s.begin(), s.end(), [](int ch) {
120 | return !std::isspace(ch);
121 | }));
122 | }
123 |
124 | // trim from end (in place)
125 | void ConfigParser::rtrim(std::string &s) {
126 | s.erase(std::find_if(s.rbegin(), s.rend(), [](int ch) {
127 | return !std::isspace(ch);
128 | }).base(), s.end());
129 | }
130 |
131 | // trim from both ends (in place)
132 | void ConfigParser::trim(std::string &s) {
133 | ltrim(s);
134 | rtrim(s);
135 | }
136 |
137 | // trim from start (copying)
138 | std::string ConfigParser::ltrim_copy(std::string s) {
139 | ltrim(s);
140 | return s;
141 | }
142 |
143 | // trim from end (copying)
144 | std::string ConfigParser::rtrim_copy(std::string s) {
145 | rtrim(s);
146 | return s;
147 | }
148 |
149 | // trim from both ends (copying)
150 | std::string ConfigParser::trim_copy(std::string s) {
151 | trim(s);
152 | return s;
153 | }
154 | }
155 | }
--------------------------------------------------------------------------------
/LaneDetectionLaneNet/mnn_project/config_parser.h:
--------------------------------------------------------------------------------
1 | /************************************************
2 | * Author: MaybeShewill-CV
3 | * File: configParser.h
4 | * Date: 2019/10/10 10:39 AM
5 | ************************************************/
6 |
7 | #ifndef MNN_CONFIGPARSER_H
8 | #define MNN_CONFIGPARSER_H
9 |
10 | // Config parser
11 |
12 | #include <string>
13 | #include <map>
14 | #include <fstream>
15 | #include <cstdio>