2010-07-31

This commit is contained in:
Ismo Vuorinen
2020-07-15 00:19:21 +03:00
parent 2502fffe37
commit d4383738cd
4 changed files with 36068 additions and 0 deletions

54
_process.py Normal file
View File

@@ -0,0 +1,54 @@
import codecs, re, sys
# Open the Graphviz graph and leave one blank line before the edge list.
# A parenthesised single-argument print emits the same bytes as the Python 2
# print statement and is also valid syntax on Python 3.
print("graph imdblinks {")  # start the project
print("")
def f8(seq):
    """Return the items of *seq* as a list without duplicates, in first-seen order.

    Order-preserving uniquifier after Dave Kirby.  Items must be hashable
    because a set tracks what has already been emitted.
    """
    seen = set()
    unique = []
    for item in seq:
        if item not in seen:
            seen.add(item)
            unique.append(item)
    return unique
def input_path(argv, default="movie-links.list.utf8"):
    """Return the file named after ``-f`` in *argv*, or *default* when absent."""
    if "-f" in argv:
        value_at = argv.index("-f") + 1
        if value_at < len(argv):
            return argv[value_at]
    return default


def _dot_quote(text):
    """Return *text* wrapped in double quotes for use as a DOT node name.

    Embedded double quotes are dropped (not escaped) and surrounding
    whitespace, including the trailing newline, is stripped.
    """
    return '"' + text.replace('"', "").strip() + '"'


def _reference_target(line):
    """Strip the ``(referenced in ...)`` wrapper from *line*, leaving the target."""
    target = line.replace("referenced in", "")
    target = target.replace("(", "", 1)  # opening paren of the wrapper
    return target.replace("))", ")")  # closing paren of the wrapper


def edge_lines(lines):
    """Yield one ``"title" -- "target";`` DOT edge per usable reference line.

    A line starting with a double quote sets the current title.  Lines
    containing ``{`` are treated as TV episodes: an episode title clears the
    current title so its references are dropped instead of being attached to
    the previous title, and an episode reference is skipped.  References seen
    before any title are skipped too (previously a NameError).

    NOTE(review): lines that neither start with a double quote nor contain
    "referenced in" are ignored and do not change the current title, so
    references listed under such entries are attributed to the last quoted
    title.  Confirm that this matches the input format.
    """
    title = None
    for line in lines:
        if line.startswith('"'):
            title = None if "{" in line else line
        elif "referenced in" in line and "{" not in line and title is not None:
            yield _dot_quote(title) + " -- " + _dot_quote(_reference_target(line)) + ";"


def _emit(text):
    """Print one output line as UTF-8 on both Python 2 and Python 3."""
    if not isinstance(text, str):
        # Python 2 only: ``text`` is ``unicode`` here.  Encode explicitly so
        # piped output does not go through the default ASCII codec.
        text = text.encode("utf-8")
    print(text)


def main(argv=None):
    """Print the de-duplicated edge list and the closing brace of the graph.

    The input is read from the path given with ``-f FILE`` or, without it,
    from ``movie-links.list.utf8`` in the current directory.
    """
    import io  # local import: io.open decodes text the same way on Python 2 and 3

    argv = sys.argv[1:] if argv is None else argv
    with io.open(input_path(argv), encoding="utf-8") as source:
        # f8 consumes the generator inside the ``with`` so the file is still open.
        edges = f8(edge_lines(source))
    for edge in edges:
        _emit("\t" + edge)
    _emit("")
    _emit("}")


if __name__ == "__main__":
    main()

35960
new.dot Normal file

File diff suppressed because it is too large Load Diff

36
process.py Normal file
View File

@@ -0,0 +1,36 @@
import codecs, re, sys
def input_path(argv, default="movie-links.list.utf8"):
    """Return the file named after ``-f`` in *argv*, or *default* when absent."""
    if "-f" in argv:
        value_at = argv.index("-f") + 1
        if value_at < len(argv):
            return argv[value_at]
    return default


def _dot_quote(text):
    """Return *text* wrapped in double quotes for use as a DOT node name.

    Embedded double quotes are dropped (not escaped) and surrounding
    whitespace, including the trailing newline, is stripped.
    """
    return '"' + text.replace('"', "").strip() + '"'


def _reference_target(line):
    """Strip the ``(referenced in ...)`` wrapper from *line*, leaving the target."""
    target = line.replace("referenced in", "")
    target = target.replace("(", "", 1)  # opening paren of the wrapper
    return target.replace("))", ")")  # closing paren of the wrapper


def edge_lines(lines):
    """Yield one ``"title" -- "target";`` DOT edge per usable reference line.

    A line starting with a double quote sets the current title.  Lines
    containing ``{`` are treated as TV episodes: an episode title clears the
    current title so its references are dropped instead of being attached to
    the previous title, and an episode reference is skipped.  References seen
    before any title are skipped too (previously a NameError).

    NOTE(review): lines that neither start with a double quote nor contain
    "referenced in" are ignored and do not change the current title, so
    references listed under such entries are attributed to the last quoted
    title.  Confirm that this matches the input format.
    """
    title = None
    for line in lines:
        if line.startswith('"'):
            title = None if "{" in line else line
        elif "referenced in" in line and "{" not in line and title is not None:
            yield _dot_quote(title) + " -- " + _dot_quote(_reference_target(line)) + ";"


def _emit(text):
    """Print one output line as UTF-8 on both Python 2 and Python 3."""
    if not isinstance(text, str):
        # Python 2 only: ``text`` is ``unicode`` here.  Encode explicitly so
        # piped output does not go through the default ASCII codec.
        text = text.encode("utf-8")
    print(text)


def main(argv=None):
    """Write the whole ``graph imdblinks { ... }`` document to stdout.

    The input is read from the path given with ``-f FILE`` (as run.sh passes
    it) or, without it, from ``movie-links.list.utf8`` in the current
    directory.  Edges are printed as they are found, without de-duplication.
    """
    import io  # local import: io.open decodes text the same way on Python 2 and 3

    argv = sys.argv[1:] if argv is None else argv
    _emit("graph imdblinks {")  # start the project
    _emit("")
    with io.open(input_path(argv), encoding="utf-8") as source:
        for edge in edge_lines(source):
            _emit("\t" + edge)
    _emit("")
    _emit("}")


if __name__ == "__main__":
    main()

18
run.sh Executable file
View File

@@ -0,0 +1,18 @@
#!/usr/bin/env bash
# Usage: run.sh SOURCE
# Re-encodes SOURCE from ISO-8859-1 to UTF-8 (written to SOURCE.utf8) and
# feeds the result to process.py, whose output is saved as SOURCE.dot.
# All expansions of $1 are quoted so paths containing spaces or glob
# characters are passed through unchanged.
if [ -n "$1" ]; then
	FROM=iso-8859-1
	TO=UTF-8
	# Stop if the conversion fails so process.py never reads a partial file.
	iconv -f "$FROM" -t "$TO" "$1" > "$1.utf8" || exit 1
	# process and create .dot
	python process.py -f "$1.utf8" > "$1.dot" || exit 1
	# do the image from the .dot
	#dot "$1.dot" -Tpng -v -o "$1.png"
	# iconv -f original_charset -t utf-8 originalfile > newfile
else
	# Usage errors go to stderr with a non-zero status so callers can detect them.
	echo "source needed" >&2
	exit 1
fi