-
Notifications
You must be signed in to change notification settings - Fork 0
/
data_generation.py
110 lines (94 loc) · 3.27 KB
/
data_generation.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
from PIL import Image
import os
#%% ------------------------------------- Create data directory to store CXR images ---------------------------------------
# os.path.dirname() is used here only to strip the trailing slash, so these
# names hold 'data', 'data/covid', 'data/normal' and 'data/pneumonia'.
# The root is called data_root (not `dir`) so the builtin dir() is not shadowed.
data_root = os.path.dirname('data/')
covid = os.path.dirname('data/covid/')          ## covid cases
normal = os.path.dirname('data/normal/')        ## normal cases
pneumonia = os.path.dirname('data/pneumonia/')  ## pneumonia cases

# exist_ok=True keeps the script safe to re-run and avoids the
# check-then-create race of a separate os.path.exists() test.
for output_dir in (data_root, covid, normal, pneumonia):
    os.makedirs(output_dir, exist_ok=True)
#%% ----------------------------- Convert images into PNG and save them into 3 folders -------------------------------------
def _convert_folder_to_png(src_dir, dst_dir):
    """Re-save every regular file in ``src_dir`` as a PNG inside ``dst_dir``.

    The output name is the source file name with its last extension replaced
    by ``.png``; a file without an extension keeps its full name as the stem.
    Entries that are not regular files (e.g. sub-directories) are skipped.
    An existing file with the same output name is overwritten.

    Args:
        src_dir: Directory whose files are opened with ``Image.open``.
        dst_dir: Existing directory the PNG files are written to.

    Returns:
        The number of files that were converted.

    Errors from ``os.listdir``, ``Image.open`` or ``Image.save`` are not
    caught here and propagate to the caller.
    """
    converted = 0
    # Sorted so the processing (and therefore overwrite) order is deterministic.
    for filename in sorted(os.listdir(src_dir)):
        src_path = os.path.join(src_dir, filename)
        if not os.path.isfile(src_path):
            continue
        stem = os.path.splitext(filename)[0]
        dst_path = os.path.join(dst_dir, stem + ".png")
        # The context manager closes the underlying file handle once the
        # image is saved, so handles do not pile up across large folders.
        with Image.open(src_path) as img:
            img.save(dst_path)
        converted += 1
    return converted


# (source folder, destination class folder), in processing order.
# NOTE(review): several sources feed the same class folder, so files that
# share a base name across datasets overwrite one another; later entries win.
_CONVERSION_JOBS = (
    # CXR_dataset
    ('CXR_dataset/normal/', normal),
    ('CXR_dataset/pneumonia/', pneumonia),
    # github_dataset
    ('github_dataset/covid/', covid),
    ('github_dataset/normal/', normal),
    ('github_dataset/pneumonia/', pneumonia),
    # COVID-19 Radiography
    ('COVID-19_radiography/covid/', covid),
    ('COVID-19_radiography/normal/', normal),
    ('COVID-19_radiography/pneumonia/', pneumonia),
    # RSNA dataset
    ('rsna_dataset/normal/', normal),
    ('rsna_dataset/pneumonia/', pneumonia),
)

for _src_dir, _dst_dir in _CONVERSION_JOBS:
    _convert_folder_to_png(_src_dir, _dst_dir)

print("Data generation process is completed.")