forked from Garvit244/Leetcode
-
Notifications
You must be signed in to change notification settings - Fork 0
/
crawl.py
54 lines (51 loc) · 1.57 KB
/
crawl.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
import json
import os
# Maps each extracted context string to the code string found after it in the
# same file; filled in by the crawl loop and dumped to context_example.json.
dictionary = {}
def is_dadada(line: str) -> bool:
    """Return True when *line* is a bare triple-single-quote delimiter line.

    The comparison is exact: the line must be ``'''`` immediately followed by
    a newline. Indented delimiters, delimiters with trailing whitespace, and a
    final line lacking its newline do not match.
    """
    return line == "'''\n"
rootdir = "/Users/yf/Documents/LeetcodeRawdata"

# A file whose code section grows past this many lines is dropped entirely.
MAX_CODE_LINES = 20


def _split_context_and_code(lines, max_code_lines=MAX_CODE_LINES):
    """Split the lines of one source file into ``(context, code)`` strings.

    The file must open with a ``'''`` delimiter line (as recognised by
    ``is_dadada``); otherwise ``("", "")`` is returned.

    * Context: the opening delimiter, the lines up to the next delimiter, and
      that delimiter itself. Blank lines are dropped, and so is everything
      from a line starting with ``"Example"`` up to the next delimiter.
    * Code: the lines after the context.

    Args:
        lines: Iterable of lines, each keeping its trailing newline.
        max_code_lines: Largest number of code lines accepted; one more and
            the whole file is rejected.

    Returns:
        ``(context, code)``. Both are empty when the file does not start with
        a delimiter or has too many code lines.
    """
    context_parts = []
    code_parts = []
    in_context = True
    skipping = False  # True while inside an "Example ..." section

    for index, line in enumerate(lines):
        delimiter = is_dadada(line)
        if index == 0:
            if not delimiter:
                # No leading docstring: nothing to extract from this file.
                break
            # The opening delimiter falls through and is recorded as context.
        elif delimiter:
            # NOTE: every later delimiter line (not only the one closing the
            # leading docstring) is appended to the context, ends any
            # "Example" skip and switches to code mode.
            context_parts.append(line)
            skipping = False
            in_context = False
            continue

        if in_context and line == "\n":
            continue
        if line.startswith("Example"):
            skipping = True
        if skipping:
            continue

        if in_context:
            context_parts.append(line)
            continue

        code_parts.append(line)
        # NOTE(review): the limit is applied to code lines only -- confirm
        # this matches the intended nesting of the original counter.
        if len(code_parts) > max_code_lines:
            return "", ""

    return "".join(context_parts), "".join(code_parts)


for subdir, dirs, files in os.walk(rootdir):
    for file in files:
        if not file.endswith(".py"):
            continue
        file_path = os.path.join(subdir, file)
        # The context manager closes each file instead of leaking the handle.
        with open(file_path, "r", encoding="utf-8") as f:
            context, code = _split_context_and_code(f)
        # Keep only files that produced both a context and a code section.
        if context and code:
            dictionary[context] = code

json_object = json.dumps(dictionary, indent=4)
# Writing to context_example.json
with open("context_example.json", "w", encoding="utf-8") as outfile:
    outfile.write(json_object)