-
Notifications
You must be signed in to change notification settings - Fork 97
/
Copy pathcreating-train-and-test-txt-files.py
124 lines (96 loc) · 2.98 KB
/
creating-train-and-test-txt-files.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
"""
Course: Training YOLO v3 for Objects Detection with Custom Data
Section-3
Labelling new Dataset in YOLO format
File: creating-train-and-test-txt-files.py
"""
# Creating files train.txt and test.txt
# for training in Darknet framework
#
# Algorithm:
# Setting up full paths --> List of paths -->
# --> Extracting 15% of paths to save into test.txt file -->
# --> Writing paths into train and test txt files
#
# Result:
# Files train.txt and test.txt with full paths to images
# Importing needed library
import os
"""
Start of:
Setting up full path to directory with labelled images
"""
# Full or absolute path to the folder with images
# Find it with Py file getting-full-path.py
# Pay attention! If you're using Windows, yours path might looks like:
# r'C:\Users\my_name\Downloads\video-to-annotate'
# or:
# 'C:\\Users\\my_name\\Downloads\\video-to-annotate'
full_path_to_images = '/home/my_name/Downloads/video-to-annotate'
"""
End of:
Setting up full path to directory with labelled images
"""
"""
Start of:
Getting list of full paths to labelled images
"""
# Check point
# Getting the current directory
# print(os.getcwd())
# Changing the current directory
# to one with images
os.chdir(full_path_to_images)
# Check point
# Getting the current directory
# print(os.getcwd())
# Defining list to write paths in
p = []
# Using os.walk for going through all directories
# and files in them from the current directory
# Fullstop in os.walk('.') means the current directory
for current_dir, dirs, files in os.walk('.'):
# Going through all files
for f in files:
# Checking if filename ends with '.jpeg'
if f.endswith('.jpeg'):
# Preparing path to save into train.txt file
# Pay attention!
# If you're using Windows, it might need to change
# this: + '/' +
# to this: + '\' +
# or to this: + '\\' +
path_to_save_into_txt_files = full_path_to_images + '/' + f
# Appending the line into the list
# We use here '\n' to move to the next line
# when writing lines into txt files
p.append(path_to_save_into_txt_files + '\n')
# Slicing first 15% of elements from the list
# to write into the test.txt file
p_test = p[:int(len(p) * 0.15)]
# Deleting from initial list first 15% of elements
p = p[int(len(p) * 0.15):]
"""
End of:
Getting list of full paths to labelled images
"""
"""
Start of:
Creating train.txt and test.txt files
"""
# Creating file train.txt and writing 85% of lines in it
with open('train.txt', 'w') as train_txt:
# Going through all elements of the list
for e in p:
# Writing current path at the end of the file
train_txt.write(e)
# Creating file test.txt and writing 15% of lines in it
with open('test.txt', 'w') as test_txt:
# Going through all elements of the list
for e in p_test:
# Writing current path at the end of the file
test_txt.write(e)
"""
End of:
Creating train.txt and test.txt files
"""