Commit bc6a703d authored by Ivan Tyagov

Improve check.

parent 5ddd7bf8
...@@ -3,18 +3,20 @@ ...@@ -3,18 +3,20 @@
is properly uploaded to Wendelin Data Lake. is properly uploaded to Wendelin Data Lake.
Format of is the same as md5sum's output: Format of is the same as md5sum's output:
<md5_sum> <filename> <md5_sum> <filename.extension>
""" """
data = str(context.file_system_checksum).strip() data = str(context.file_system_checksum).strip()
lines = data.split("\n") lines = data.split("\n")
print "Total files = ", len(lines)
for line in lines[:]: for line in lines[:]:
md5_checksum = line[:32].strip() md5_checksum = line[:32].strip()
filename = line[32:].strip() full_filename = line[32:].strip()
# check Data stream for this hash exists # check Data stream for this hash exists
reference = "/%s/jpg" %(data_set_reference, filename.replace(".jpg", "")) filename, extension = full_filename.split(".")
reference = "%s/%s/%s" %(data_set_reference, filename, extension)
catalog_kw = {"portal_type": "Data Stream", catalog_kw = {"portal_type": "Data Stream",
"reference": reference} "reference": reference}
data_stream = context.portal_catalog.getResultValue(**catalog_kw) data_stream = context.portal_catalog.getResultValue(**catalog_kw)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment