# HG changeset patch
# User sem4j
# Date 1380091103 14400
# Node ID 75c072490c2d5007f71e89ea753abc8af776f382
# Parent dba28145ab27ada04fa4c9deeab39bdf26a0689d
# Uploaded
# (Script body of the changeset that adds tab2rdf.py:
#  diff -r dba28145ab27 -r 75c072490c2d, Wed Sep 25 02:38:23 2013 -0400.)

# tab2rdf.py version:0.1
# USAGE: python tab2rdf.py <input_file> <output_file> <output_format> <namespace>
#            <s_col> <predicate> <o_col> <o_is_uri> [<s_col> <predicate> <o_col> <o_is_uri> ...]
# (Placeholder names above are reconstructed from how the code reads sys.argv.)
# NOTE(review): the original header listed a second form,
# "python tab2rdf.py multi_namespaces ..", whose placeholders were lost; no
# such mode is implemented in this script -- confirm before relying on it.
"""Convert a tab-separated file into N-Triples-style RDF statements.

For every non-empty input row, one statement is written per
``<s_col> <predicate> <o_col> <o_is_uri>`` group given on the command line:

* ``s_col`` / ``o_col`` are 1-based column numbers of the subject and object.
* ``predicate`` is appended to the namespace to form the predicate IRI.
* ``o_is_uri`` is an integer flag: non-zero writes the object as
  ``<namespace + value>``, zero writes it as a double-quoted literal.

Requires Python 3 (text-mode ``csv`` input, floor division for the group
count). Input is read and output is written as UTF-8.
"""

import csv
import sqlite3  # not used below; kept from the original import line
import sys
import time  # not used below; kept from the original import line

_USAGE = (
    'USAGE: python tab2rdf.py <input_file> <output_file> <output_format> '
    '<namespace> [<s_col> <predicate> <o_col> <o_is_uri> ...]'
)

# Characters that must be backslash-escaped inside a quoted literal so the
# emitted statement stays well-formed.
_LITERAL_ESCAPES = str.maketrans({
    '\\': '\\\\',
    '"': '\\"',
    '\n': '\\n',
    '\r': '\\r',
    '\t': '\\t',
})


def _parse_triple_specs(args: list) -> list:
    """Group *args* into ``(s_index, predicate, o_index, o_is_uri)`` tuples.

    *args* are the command-line arguments after the namespace. They are
    consumed four at a time; a trailing incomplete group is ignored. Column
    numbers are converted from 1-based to 0-based indexes.

    Raises:
        ValueError: if a column number or the URI flag is not an integer.
    """
    specs = []
    # Floor division: a float count here is what broke range() on Python 3.
    for group in range(len(args) // 4):
        s_col, predicate, o_col, o_is_uri = args[4 * group:4 * group + 4]
        specs.append(
            (int(s_col) - 1, predicate, int(o_col) - 1, bool(int(o_is_uri)))
        )
    return specs


def _row_to_triples(row: list, ns: str, specs: list):
    """Yield one output line per spec for a single input *row*.

    Raises:
        IndexError: if a spec refers to a column the row does not have.
    """
    for s_index, predicate, o_index, o_is_uri in specs:
        s_val = row[s_index]
        o_val = row[o_index]
        if o_is_uri:
            obj = f'<{ns}{o_val}>'
        else:
            # Escape quotes/backslashes so the literal cannot break the line.
            obj = f'"{o_val.translate(_LITERAL_ESCAPES)}"'
        yield f'<{ns}{s_val}> <{ns}{predicate}> {obj} .\n'


def main(argv: list) -> None:
    """Run the conversion described by *argv* (same layout as ``sys.argv``).

    ``argv[1]`` is the input path, ``argv[2]`` the output path, ``argv[3]``
    the output format (accepted but not used by this version), ``argv[4]``
    the namespace prefix, followed by zero or more groups of four arguments
    describing the statements to emit per row.
    """
    if len(argv) < 5:
        sys.exit(_USAGE)

    input_file, output_file, _output_format, ns = argv[1:5]
    specs = _parse_triple_specs(argv[5:])
    print('Number of Triples for One Column: ' + str(len(specs)) + '\n')

    # newline='' is what the csv module requires for text-mode input; both
    # files are closed by the with-statement even if a row raises.
    with open(input_file, newline='', encoding='utf-8') as infile, \
            open(output_file, 'w', encoding='utf-8') as out:
        for row in csv.reader(infile, delimiter='\t'):
            if not row:
                # Blank input lines produce an empty row; nothing to emit.
                continue
            out.writelines(_row_to_triples(row, ns, specs))


if __name__ == '__main__':
    main(sys.argv)