|
39 | 39 | .getOrCreate()
|
40 | 40 |
|
41 | 41 |
|
42 |
| -# s3keys are read from the verifySproxydKeys.js scripts output |
| 42 | +# s3keys are generated by the verifySproxydKeys.js script and processed by s3_fsck_p0.py |
43 | 43 | s3keys = "%s://%s/%s/s3fsck/s3-dig-keys.csv" % (PROTOCOL, PATH, RING)
|
44 |
| -# ringkeys are read from the listkeys.py (or ringsh dump) scripts output |
| 44 | +# ringkeys are generated by the listkeys.py (or ringsh dump) script and processed by s3_fsck_p1.py |
45 | 45 | ringkeys = "%s://%s/%s/s3fsck/arc-keys.csv" % (PROTOCOL, PATH, RING)
|
46 | 46 |
|
47 |
| -# reading with a header, the columns are named. The column _c1 will be whatever column the _c1 header is assigned to |
| 47 | +# reading with a header, the columns are named. |
| 48 | +# columns digkey, sproxyd input key, subkey are the actual column names of |
| 49 | +# columns 1, 2, 3 for the csv |
| 50 | +# input structure: (digkey, sproxyd input key, subkey) |
| 51 | +# e.g. 7359114991482315D0A5890000,BDE4B9BBEB45711EC2F1A9C78F6BCD59E02C6220,SINGLE |
| 52 | +# Required Fields: |
| 53 | +# - digkey |
| 54 | +# - sproxyd input key |
48 | 55 | dfs3keys = spark.read.format("csv").option("header", "true").option("inferSchema", "true").load(s3keys)
|
49 |
| -# reading with a header, the columns are named. The column _c1 will be whatever column the _c1 header is assigned to |
| 56 | + |
| 57 | + |
| 58 | +# reading with a header, the columns are named. |
| 59 | +# columns _c1, count, ringkey (main chunk) are the actual column names of |
| 60 | +# columns 1, 2, 3 for the csv (_c1 holds the digkey and is renamed to digkey below) |
| 61 | +# input structure: (digkey, count, ringkey (main chunk)) |
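| 62 | +# e.g. <digkey>,<count>,<ringkey (main chunk)> -- FIXME: the sample formerly here (7359114991482315D0A5890000,BDE4B9BBEB45711EC2F1A9C78F6BCD59E02C6220,SINGLE) is an s3keys row and does not match this structure |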
| 63 | +# Required Fields: |
| 64 | +# - digkey |
| 65 | +# - ringkey (main chunk) |
50 | 66 | dfringkeys = spark.read.format("csv").option("header", "true").option("inferSchema", "true").load(ringkeys)
|
51 | 67 |
|
52 | 68 | # rename the column _c1 to digkey so that the next write outputs a header that uses digkey instead of _c1
|
|
0 commit comments