-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathsentiment_analysis.js
112 lines (91 loc) · 3.47 KB
/
sentiment_analysis.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
const fs = require('fs');
const readline = require('readline');
const createCsvWriter = require('csv-writer').createObjectCsvWriter;
const language = require('@google-cloud/language');
async function analyzeSentimentWithRetry(text, maxRetries = 3) {
let retries = 0;
while (retries < maxRetries) {
try {
const client = new language.LanguageServiceClient({
timeout: 900000, // Increase timeout to 15 minutes (900000 milliseconds)
});
const document = {
content: text,
type: 'PLAIN_TEXT',
};
const [result] = await client.analyzeSentiment({ document: document });
const sentiment = result.documentSentiment;
return {
'Sentiment score': sentiment.score,
'Sentiment magnitude': sentiment.magnitude,
};
} catch (error) {
console.error('Error analyzing sentiment:', error);
retries++;
}
}
return {
'Sentiment score': 'N/A',
'Sentiment magnitude': 'N/A',
};
}
async function processCSV(inputFilePath, outputFilePath, chunkSize) {
try {
const fileStream = fs.createReadStream(inputFilePath);
const rl = readline.createInterface({
input: fileStream,
crlfDelay: Infinity,
});
const header = (await rl[Symbol.asyncIterator]().next()).value.split(',');
const csvWriter = createCsvWriter({
path: outputFilePath,
header: [
{ id: 'label', title: 'Label'},
{ id: 'text', title: 'Text' },
{ id: 'Sentiment score', title: 'Sentiment score' },
{ id: 'Sentiment magnitude', title: 'Sentiment magnitude' },
],
});
let recordsWithSentiment = [];
let rowCount = 0;
for await (const line of rl) {
const recordValues = line.split(',');
const record = {};
for (let i = 0; i < header.length; i++) {
record[header[i]] = recordValues[i];
}
const text = record['text'];
const sentimentResults = await analyzeSentimentWithRetry(text);
recordsWithSentiment.push({
...record,
...sentimentResults,
});
rowCount++;
if (rowCount >= chunkSize) {
await csvWriter.writeRecords(recordsWithSentiment);
console.log(`Sentiment scores added to the new CSV file for ${rowCount} rows.`);
recordsWithSentiment = [];
rowCount = 0;
}
}
// Write remaining records
if (recordsWithSentiment.length > 0) {
await csvWriter.writeRecords(recordsWithSentiment);
console.log(`Sentiment scores added to the new CSV file for the remaining rows.`);
}
console.log(`Sentiment scores added to the new CSV file (${outputFilePath}).`);
// Close file stream explicitly
fileStream.close();
} catch (error) {
console.error('Error processing CSV:', error);
}
}
async function quickstart() {
const chunkSize = 1000;
for (let i = 3; i >= 1; i--) {
const inputFilePath = `tweets-labels-processed-${i}.csv`;
const outputFilePath = `sentiment-analysis-tweets-labels-processed-${i}.csv`;
await processCSV(inputFilePath, outputFilePath, chunkSize);
}
}
quickstart();