-
Notifications
You must be signed in to change notification settings - Fork 11
/
Copy pathHelpers.gs
137 lines (106 loc) · 3.63 KB
/
Helpers.gs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
/**
 * Builds the table resource object passed to BigQuery when inserting a table.
 *
 * @param {Object} thisTableData - Table description; its `tableId` and
 *     `schema` properties are copied into the result.
 * @param {string} thisProjectId - Project that will own the table.
 * @param {string} thisDatasetId - Dataset that will contain the table.
 * @return {Object} Object with a `tableReference` (projectId, datasetId,
 *     tableId) and the `schema` taken from `thisTableData`.
 */
function constructTableJson(thisTableData, thisProjectId, thisDatasetId) {
  // Fully-qualified location of the table: project -> dataset -> table.
  var reference = {
    projectId: thisProjectId,
    datasetId: thisDatasetId,
    tableId: thisTableData.tableId
  };

  var tableJson = {
    tableReference: reference,
    schema: thisTableData.schema
  };
  return tableJson;
}
/**
 * Creates a BigQuery table and logs the id of the table that was created.
 *
 * @param {string} thisTableId - Table id; used only for the log message.
 * @param {string} thisProjectId - Project in which the table is created.
 * @param {string} thisDataSetId - Dataset in which the table is created.
 * @param {Object} tableReferenceJson - Table resource passed to
 *     `BigQuery.Tables.insert` (e.g. the object built by constructTableJson).
 * @return {Object} Whatever `BigQuery.Tables.insert` returned.
 */
function createTable(thisTableId, thisProjectId, thisDataSetId, tableReferenceJson) {
  // Declared locally: assigning to an undeclared `table` leaked a global
  // (and is a ReferenceError in strict mode).
  var table = BigQuery.Tables.insert(tableReferenceJson, thisProjectId, thisDataSetId);
  Logger.log('Table created: %s', thisTableId);
  return table;
}
/**
 * Loads a CSV file stored in Drive into a BigQuery table.
 *
 * The job appends to the destination table (`WRITE_APPEND`) and skips one
 * leading row of the file (`skipLeadingRows: 1`, presumably the header).
 * The job is only submitted here; this function does not wait for it to
 * finish.
 *
 * @param {string} thisProjectId - Project that owns the destination table
 *     and under which the load job is submitted.
 * @param {string} thisDatasetId - Dataset of the destination table.
 * @param {string} thisTableId - Destination table id.
 * @param {string} csvFileId - Drive file id of the CSV to upload.
 * @return {Object} Whatever `BigQuery.Jobs.insert` returned.
 */
function bqLoadCsv(thisProjectId, thisDatasetId, thisTableId, csvFileId) {
  // Load CSV data from Drive and convert to the correct format for upload.
  var file = DriveApp.getFileById(csvFileId);
  var data = file.getBlob().setContentType('application/octet-stream');

  // Create the data upload job.
  var myJob = {
    configuration: {
      load: {
        destinationTable: {
          projectId: thisProjectId,
          datasetId: thisDatasetId,
          tableId: thisTableId
        },
        skipLeadingRows: 1,
        writeDisposition: 'WRITE_APPEND'
      }
    }
  };

  // Declared locally: assigning to an undeclared `loadJob` leaked a global.
  var loadJob = BigQuery.Jobs.insert(myJob, thisProjectId, data);

  // Link to the project the job was actually submitted to, rather than to an
  // unrelated global project id that may differ from (or not exist next to)
  // the `thisProjectId` argument.
  Logger.log('Load job started. Check on the status of it here: ' +
      'https://console.cloud.google.com/bigquery?project=%s&page=jobs', thisProjectId);
  return loadJob;
}
/**
 * Parses delimiter-separated text into an array of rows, each row being an
 * array of field strings.
 *
 * Fields may be wrapped in double quotes; inside a quoted field a doubled
 * quote ("") stands for one literal quote, and delimiters / line breaks are
 * kept as part of the value. Rows are separated by \n, \r\n or \r. Text that
 * ends with a line break yields a final row holding one empty string.
 *
 * @param {string} strData - The text to parse.
 * @param {number=} rowLimit - Maximum number of rows to return. When omitted
 *     or not a positive number, all rows are parsed.
 * @param {string=} strDelimiter - Field delimiter; defaults to a comma. It is
 *     spliced into the pattern behind a backslash, so it should be a single
 *     punctuation or whitespace character.
 * @return {Array<Array<string>>} The parsed rows.
 */
function CSVToArray(strData, rowLimit, strDelimiter) {
  // Check to see if the delimiter is defined. If not,
  // then default to COMMA.
  strDelimiter = (strDelimiter || ",");

  // Only a positive number acts as a limit; undefined, null, 0 or NaN all
  // mean "parse everything".
  var maxRows = Number(rowLimit);
  var hasRowLimit = maxRows > 0;

  // Create a regular expression to parse the CSV values.
  var objPattern = new RegExp(
    (
      // Delimiters.
      "(\\" + strDelimiter + "|\\r?\\n|\\r|^)" +
      // Quoted fields.
      "(?:\"([^\"]*(?:\"\"[^\"]*)*)\"|" +
      // Standard fields.
      "([^\"\\" + strDelimiter + "\\r\\n]*))"
    ),
    "gi"
  );

  // Create an array to hold our data. Give the array
  // a default empty first row.
  var arrData = [
    []
  ];

  // Holds the capture groups of the current match:
  // [1] delimiter, [2] quoted value, [3] unquoted value.
  var arrMatches = null;

  // Keep looping over the regular expression matches until there are none
  // left (or the row limit is reached). The assignment is parenthesised so
  // that arrMatches is always a match array inside the loop body.
  while ((arrMatches = objPattern.exec(strData)) !== null) {
    // A zero-length match (start of string followed by an empty field) does
    // not advance lastIndex, so step over it by hand to avoid looping
    // forever on empty input.
    if (arrMatches[0].length === 0) {
      objPattern.lastIndex++;
    }

    // Get the delimiter that was found.
    var strMatchedDelimiter = arrMatches[1];

    // A real delimiter at the very start of the text means an empty field
    // came before it; record that field instead of dropping it.
    if (strMatchedDelimiter.length && arrMatches.index === 0) {
      arrData[0].push("");
    }

    // A non-empty delimiter that is not the field delimiter is a row
    // delimiter, so a new row begins here.
    if (
      strMatchedDelimiter.length &&
      (strMatchedDelimiter !== strDelimiter)
    ) {
      // Stop before opening a row beyond the requested limit.
      if (hasRowLimit && arrData.length >= maxRows) {
        break;
      }
      arrData.push([]);
    }

    // Now that we have our delimiter out of the way, check which kind of
    // value we captured. Compare against undefined rather than truthiness so
    // that an empty quoted field ("") is kept as an empty string.
    var strMatchedValue;
    if (arrMatches[2] !== undefined) {
      // Quoted value: unescape any doubled double quotes.
      strMatchedValue = arrMatches[2].replace(
        new RegExp("\"\"", "g"),
        "\""
      );
    } else {
      // Non-quoted value.
      strMatchedValue = arrMatches[3];
    }

    // Add the value to the current (last) row.
    arrData[arrData.length - 1].push(strMatchedValue);
  }

  // Return the parsed data.
  return (arrData);
}