-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathvision2.py
71 lines (59 loc) · 1.61 KB
/
vision2.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
# coding: utf-8
# ©2020 Jean-Hugues Roy. GNU GPL v3.
import csv, os, json
from collections import Counter
# Tally the categories, tags, celebrities, landmarks and captions found in
# every ``.json`` file of the current working directory, then print the 100
# most frequent categories, tags and celebrities with their totals.
#
# NOTE(review): the key layout read below ("categories"/"detail"/"landmarks",
# "description"/"captions", ...) looks like an image-analysis API response;
# confirm against whatever produced the files.

# NOTE(review): `fout` is not referenced anywhere in the visible script; it is
# kept so the module still exposes the name.
fout = "instaOUT.csv"
n = 0  # number of .json files processed
fichiers = os.listdir()  # entries of the current working directory
lieux = []  # landmark names
celebrites = []  # celebrity names
categories = []  # category names
etiquettes = []  # description tags
# Caption texts. This list was never initialised before, so every append
# raised a NameError that a bare ``except`` silently swallowed.
vignettes = []


def _noms(elements, cle):
    """Return ``element[cle]`` for each entry of *elements*, best effort.

    *elements* may be ``None`` or empty. Reading stops at the first malformed
    entry and whatever was gathered up to that point is returned.
    """
    noms = []
    try:
        for element in elements or ():
            noms.append(element[cle])
    except (KeyError, IndexError, TypeError):
        # Optional data with an unexpected shape: keep the partial result
        # instead of aborting the whole run.
        pass
    return noms


def extraire(donnees):
    """Extract the names of interest from one parsed JSON document.

    Args:
        donnees: the object returned by ``json.load`` for one file.

    Returns:
        A 5-tuple of lists
        ``(lieux, celebrites, categories, etiquettes, vignettes)``.

    Raises:
        KeyError: if ``donnees`` has no ``"categories"`` key, no
            ``"description"``/``"tags"`` keys, or a category has no
            ``"name"``. These fields are treated as mandatory.
    """
    # Landmarks and celebrities are only looked up in the first category;
    # their absence is normal and must not stop the run.
    try:
        detail = donnees["categories"][0]["detail"]
    except (KeyError, IndexError, TypeError):
        detail = {}
    if not isinstance(detail, dict):
        detail = {}

    noms_lieux = _noms(detail.get("landmarks"), "name")
    noms_celebrites = _noms(detail.get("celebrities"), "name")

    noms_categories = [cat["name"] for cat in donnees["categories"]]
    description = donnees["description"]
    tags = list(description["tags"])

    # Captions are optional.
    textes = _noms(description.get("captions"), "text")

    return noms_lieux, noms_celebrites, noms_categories, tags, textes


for fichier in fichiers:
    if not fichier.endswith(".json"):
        continue
    n += 1
    # JSON text is UTF-8; do not depend on the platform's default encoding.
    with open(fichier, encoding="utf-8") as lefichier:
        donnees = json.load(lefichier)
    (
        nouveaux_lieux,
        nouvelles_celebrites,
        nouvelles_categories,
        nouvelles_etiquettes,
        nouvelles_vignettes,
    ) = extraire(donnees)
    lieux.extend(nouveaux_lieux)
    celebrites.extend(nouvelles_celebrites)
    categories.extend(nouvelles_categories)
    etiquettes.extend(nouvelles_etiquettes)
    vignettes.extend(nouvelles_vignettes)

# NOTE(review): the original indentation was lost; the separator is assumed to
# be printed once, ahead of the summary, rather than once per file.
print("*"*8)

# NOTE(review): `lieux` and `vignettes` are collected but not reported; the
# printed output is kept identical to the original script.
freq = Counter(categories)
print(freq.most_common(100))
print(len(categories))

freq = Counter(etiquettes)
print(freq.most_common(100))
print(len(etiquettes))

freq = Counter(celebrites)
print(freq.most_common(100))
print(len(celebrites))