Skip to content

Commit f3ef7ee

Browse files
Add files via upload
Added: - two identical tabular data files, one Excel file (.xlsx) and one tab-separated plain text file (.txt); - a JSON metadata file of the dataset. We'd like our depositors to be able to upload tabular data in the original file format (e.g. Excel; .xlsx) and in a preferred file format (tab-separated plain text; .txt). These files should have the same file names except for the file extension. Currently, such files are handled like this in Dataverse: - The Excel file is ingested. - Dataverse recognizes identical content in the Excel file and the .txt file. Therefore, a "1" is added to the file name of the .txt file. For more information, see this discussion in the Dataverse Google Group: https://groups.google.com/forum/?hl=no#!topic/dataverse-community/_2Tm2B2sQhc
1 parent 98808ed commit f3ef7ee

3 files changed

Lines changed: 45 additions & 0 deletions

File tree

data/Tabular_Sample_Data.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
{"id":1101620,"identifier":"FK2/0MVCBM","persistentUrl":"https://doi.org/10.70122/FK2/0MVCBM","protocol":"doi","authority":"10.70122","publisher":"Demo Dataverse","publicationDate":"2020-06-08","storageIdentifier":"file://10.70122/FK2/0MVCBM","datasetVersion":{"id":134195,"datasetId":1101620,"datasetPersistentId":"doi:10.70122/FK2/0MVCBM","storageIdentifier":"file://10.70122/FK2/0MVCBM","versionNumber":1,"versionMinorNumber":0,"versionState":"RELEASED","UNF":"UNF:6:eFXLLKw9zMMIcjPRZOLhPg==","lastUpdateTime":"2020-06-08T05:52:18Z","releaseTime":"2020-06-08T05:52:18Z","createTime":"2020-06-04T09:06:36Z","license":"CC0","termsOfUse":"CC0 Waiver","fileAccessRequest":false,"metadataBlocks":{"citation":{"displayName":"Citation Metadata","fields":[{"typeName":"title","multiple":false,"typeClass":"primitive","value":"Testing Tabular File Ingest - Excel and tab-separated .txt"},{"typeName":"author","multiple":true,"typeClass":"compound","value":[{"authorName":{"typeName":"authorName","multiple":false,"typeClass":"primitive","value":"Test User 1, UiT"},"authorAffiliation":{"typeName":"authorAffiliation","multiple":false,"typeClass":"primitive","value":"UiT The Arctic University of Norway"}}]},{"typeName":"datasetContact","multiple":true,"typeClass":"compound","value":[{"datasetContactName":{"typeName":"datasetContactName","multiple":false,"typeClass":"primitive","value":"Test User 1, UiT"},"datasetContactAffiliation":{"typeName":"datasetContactAffiliation","multiple":false,"typeClass":"primitive","value":"UiT The Arctic University of Norway"},"datasetContactEmail":{"typeName":"datasetContactEmail","multiple":false,"typeClass":"primitive","value":"philipp.conzett@uit.no"}}]},{"typeName":"dsDescription","multiple":true,"typeClass":"compound","value":[{"dsDescriptionValue":{"typeName":"dsDescriptionValue","multiple":false,"typeClass":"primitive","value":"Testing ingest of tabular files in 
Dataverse."},"dsDescriptionDate":{"typeName":"dsDescriptionDate","multiple":false,"typeClass":"primitive","value":"2020-06-04"}}]},{"typeName":"subject","multiple":true,"typeClass":"controlledVocabulary","value":["Social Sciences"]},{"typeName":"keyword","multiple":true,"typeClass":"compound","value":[{"keywordValue":{"typeName":"keywordValue","multiple":false,"typeClass":"primitive","value":"testing"}},{"keywordValue":{"typeName":"keywordValue","multiple":false,"typeClass":"primitive","value":"file ingest"}}]},{"typeName":"depositor","multiple":false,"typeClass":"primitive","value":"Test User 1, UiT"},{"typeName":"dateOfDeposit","multiple":false,"typeClass":"primitive","value":"2020-06-04"}]},"geospatial":{"displayName":"Geospatial Metadata","fields":[]},"journal":{"displayName":"Journal Metadata","fields":[]}},"files":[{"description":"Excel file","label":"Tabular_Sample_Data.tab","restricted":false,"version":3,"datasetVersionId":134195,"dataFile":{"id":1104456,"persistentId":"doi:10.70122/FK2/0MVCBM/LISFFL","pidURL":"https://doi.org/10.70122/FK2/0MVCBM/LISFFL","filename":"Tabular_Sample_Data.tab","contentType":"text/tab-separated-values","filesize":2200,"description":"Excel file","storageIdentifier":"file://17282ef3127-d8ed28281ac7","originalFileFormat":"application/vnd.openxmlformats-officedocument.spreadsheetml.sheet","originalFormatLabel":"MS Excel Spreadsheet","originalFileSize":12751,"UNF":"UNF:6:eFXLLKw9zMMIcjPRZOLhPg==","rootDataFileId":-1,"md5":"45a5a81537c772485a640a030b12bd33","checksum":{"type":"MD5","value":"45a5a81537c772485a640a030b12bd33"},"creationDate":"2020-06-05"}},{"description":"Tab-separated plain text file","label":"Tabular_Sample_Data.txt","restricted":false,"version":1,"datasetVersionId":134195,"dataFile":{"id":1104457,"persistentId":"doi:10.70122/FK2/0MVCBM/IYDYQR","pidURL":"https://doi.org/10.70122/FK2/0MVCBM/IYDYQR","filename":"Tabular_Sample_Data.txt","contentType":"text/plain","filesize":2060,"description":"Tab-separated plain text 
file","storageIdentifier":"file://17282ee8e22-382bc0edc2d6","rootDataFileId":-1,"md5":"b2a1624bcf972094c48d639d4aa67c9e","checksum":{"type":"MD5","value":"b2a1624bcf972094c48d639d4aa67c9e"},"creationDate":"2020-06-05"}}],"citation":"Test User 1, UiT, 2020, \"Testing Tabular File Ingest - Excel and tab-separated .txt\", https://doi.org/10.70122/FK2/0MVCBM, Demo Dataverse, V1, UNF:6:eFXLLKw9zMMIcjPRZOLhPg== [fileUNF]"}}

data/Tabular_Sample_Data.txt

Lines changed: 44 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,44 @@
1+
OrderDate Region Rep Item Units UnitCost Total
2+
01.06.2019 East Jones Pencil 95 1,99 189,05
3+
02.06.2019 Central Kivell Binder 50 19,99 999,5
4+
03.06.2019 Central Jardine Pencil 36 4,99 179,64
5+
04.06.2019 Central Gill Pen 27 19,99 539,73
6+
05.06.2019 West Sorvino Pencil 56 2,99 167,44
7+
06.06.2019 East Jones Binder 60 4,99 299,4
8+
07.06.2019 Central Andrews Pencil 75 1,99 149,25
9+
08.06.2019 Central Jardine Pencil 90 4,99 449,1
10+
09.06.2019 West Thompson Pencil 32 1,99 63,68
11+
10.06.2019 East Jones Binder 60 8,99 539,4
12+
11.06.2019 Central Morgan Pencil 90 4,99 449,1
13+
12.06.2019 East Howard Binder 29 1,99 57,71
14+
13.06.2019 East Parent Binder 81 19,99 1619,19
15+
14.06.2019 East Jones Pencil 35 4,99 174,65
16+
15.06.2019 Central Smith Desk 2 125 250
17+
16.06.2019 East Jones Pen Set 16 15,99 255,84
18+
17.06.2019 Central Morgan Binder 28 8,99 251,72
19+
18.06.2019 East Jones Pen 64 8,99 575,36
20+
19.06.2019 East Parent Pen 15 19,99 299,85
21+
20.06.2019 Central Kivell Pen Set 96 4,99 479,04
22+
21.06.2019 Central Smith Pencil 67 1,29 86,43
23+
22.06.2019 East Parent Pen Set 74 15,99 1183,26
24+
23.06.2019 Central Gill Binder 46 8,99 413,54
25+
24.06.2019 Central Smith Binder 87 15 1305
26+
25.06.2019 East Jones Binder 4 4,99 19,96
27+
26.06.2019 West Sorvino Binder 7 19,99 139,93
28+
27.06.2019 Central Jardine Pen Set 50 4,99 249,5
29+
28.06.2019 Central Andrews Pencil 66 1,99 131,34
30+
29.06.2019 East Howard Pen 96 4,99 479,04
31+
30.06.2019 Central Gill Pencil 53 1,29 68,37
32+
01.07.2019 Central Gill Binder 80 8,99 719,2
33+
02.07.2019 Central Kivell Desk 5 125 625
34+
03.07.2019 East Jones Pen Set 62 4,99 309,38
35+
04.07.2019 Central Morgan Pen Set 55 12,49 686,95
36+
05.07.2019 Central Kivell Pen Set 42 23,95 1005,9
37+
06.07.2019 West Sorvino Desk 3 275 825
38+
07.07.2019 Central Gill Pencil 7 1,29 543,02
39+
08.07.2019 West Sorvino Pen 76 1,99 151,24
40+
09.07.2019 West Thompson Binder 57 19,99 1139,43
41+
10.07.2019 Central Andrews Pencil 14 1,29 325,56
42+
11.07.2019 Central Jardine Binder 11 4,99 54,89
43+
12.07.2019 Central Jardine Binder 94 19,99 1879,06
44+
13.07.2019 Central Andrews Binder 28 4,99 139,72

data/Tabular_Sample_Data.xlsx

12.5 KB
Binary file not shown.

0 commit comments

Comments
 (0)