Commit 6add27b9 authored by Your Name

test

parent 22e3735c
...@@ -201,14 +201,19 @@ if __name__ == "__main__": ...@@ -201,14 +201,19 @@ if __name__ == "__main__":
# #
# tf.logging.set_verbosity(tf.logging.INFO) # tf.logging.set_verbosity(tf.logging.INFO)
# #
te_files = [path + "nearby/part-r-00000"] # te_files = [path + "nearby/part-r-00000"]
# Build one single-element path list per part file, covering
# nearby/part-r-00000 through nearby/part-r-00099. %05d zero-pads the
# index to five digits, so a single pass handles both the one-digit and
# two-digit indices.
te_files = [[path + "nearby/part-r-%05d" % i] for i in range(100)]
# main(te_files) # main(te_files)
# te_files = [[path+"nearby/part-r-00000"],[path+"native/part-r-00000"]] # te_files = [[path+"nearby/part-r-00000"],[path+"native/part-r-00000"]]
rdd_te_files = spark.sparkContext.parallelize(te_files) rdd_te_files = spark.sparkContext.parallelize(te_files)
print("-"*100) print("-"*100)
print(rdd_te_files.collect()) print(rdd_te_files.collect())
print("-" * 100) print("-" * 100)
indices = rdd_te_files.map(lambda x: main(x)) indices = rdd_te_files.repartition(100).map(lambda x: main(x))
print(indices.collect()) print(indices.collect())
b = time.time() b = time.time()
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment