-
Notifications
You must be signed in to change notification settings - Fork 452
/
Copy pathPKPTemporaryTotalsDAO.php
320 lines (300 loc) · 16.6 KB
/
PKPTemporaryTotalsDAO.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
<?php
/**
* @file classes/statistics/PKPTemporaryTotalsDAO.php
*
* Copyright (c) 2022 Simon Fraser University
* Copyright (c) 2022 John Willinsky
* Distributed under the GNU GPL v3. For full terms see the file docs/COPYING.
*
* @class PKPTemporaryTotalsDAO
*
* @ingroup statistics
*
* @brief Operations for retrieving and adding total usage.
*
* It considers:
* context index page views,
* submission abstract, primary and supp file views,
* geo submission usage,
* COUNTER submission stats.
*/
namespace PKP\statistics;
use APP\core\Application;
use DateTimeImmutable;
use Illuminate\Support\Facades\DB;
use PKP\config\Config;
use PKP\db\DAORegistry;
abstract class PKPTemporaryTotalsDAO
{
/**
* The name of the table. This table contains all usage events.
*/
public string $table = 'usage_stats_total_temporary_records';
/**
* Add the passed usage statistic record.
*/
public function insert(object $entryData, int $lineNumber, string $loadId): void
{
$insertData = $this->getInsertData($entryData);
$insertData['line_number'] = $lineNumber;
$insertData['load_id'] = $loadId;
DB::table($this->table)->insert($insertData);
}
/**
* Get Laravel optimized array of data to insert into the table based on the log entry
*/
protected function getInsertData(object $entryData): array
{
return [
'date' => $entryData->time,
'ip' => $entryData->ip,
'user_agent' => substr($entryData->userAgent, 0, 255),
'canonical_url' => $entryData->canonicalUrl,
'context_id' => $entryData->contextId,
'submission_id' => $entryData->submissionId,
'representation_id' => $entryData->representationId,
'submission_file_id' => $entryData->submissionFileId,
'assoc_type' => $entryData->assocType,
'file_type' => $entryData->fileType,
'country' => !empty($entryData->country) ? $entryData->country : '',
'region' => !empty($entryData->region) ? $entryData->region : '',
'city' => !empty($entryData->city) ? $entryData->city : '',
];
}
/**
* Delete all temporary records associated
* with the passed load id.
*/
public function deleteByLoadId(string $loadId): void
{
DB::table($this->table)->where('load_id', '=', $loadId)->delete();
}
/**
* Remove Double Clicks according to COUNTER guidelines
* Remove the potential of over-counting which could occur when a user clicks the same link multiple times.
* Double-clicks, i.e. two clicks in succession, on a link by the same user within a 30-second period MUST be counted as one action.
* When two actions are made for the same URL within 30 seconds the first request MUST be removed and the second retained.
* A user is identified by IP address combined with the browser’s user-agent.
*
* See https://www.projectcounter.org/code-of-practice-five-sections/7-processing-rules-underlying-counter-reporting-data/#doubleclick
*/
public function removeDoubleClicks(string $loadId, int $counterDoubleClickTimeFilter): void
{
if (substr(Config::getVar('database', 'driver'), 0, strlen('postgres')) === 'postgres') {
DB::statement(
"
DELETE FROM {$this->table} ust
WHERE EXISTS (
SELECT * FROM (
SELECT 1 FROM {$this->table} ustt
WHERE ust.load_id = ? AND ustt.load_id = ust.load_id AND
ustt.context_id = ust.context_id AND
ustt.ip = ust.ip AND ustt.user_agent = ust.user_agent AND ustt.canonical_url = ust.canonical_url AND
EXTRACT(EPOCH FROM (ustt.date - ust.date)) < ? AND
EXTRACT(EPOCH FROM (ustt.date - ust.date)) > 0 AND
ust.line_number < ustt.line_number) AS tmp
)
",
[$loadId, $counterDoubleClickTimeFilter]
);
} else {
DB::statement(
"
DELETE FROM ust USING {$this->table} ust
INNER JOIN {$this->table} ustt ON (
ustt.load_id = ust.load_id AND
ustt.context_id = ust.context_id AND
ustt.ip = ust.ip AND
ustt.user_agent = ust.user_agent AND
ustt.canonical_url = ust.canonical_url
)
WHERE ust.load_id = ? AND
TIMESTAMPDIFF(SECOND, ust.date, ustt.date) < ? AND
TIMESTAMPDIFF(SECOND, ust.date, ustt.date) > 0 AND
ust.line_number < ustt.line_number
",
[$loadId, $counterDoubleClickTimeFilter]
);
}
}
/**
* Load usage for context index pages
*/
public function compileContextMetrics(string $loadId): void
{
$date = DateTimeImmutable::createFromFormat('Ymd', substr($loadId, -12, 8));
DB::table('metrics_context')->where('load_id', '=', $loadId)->orWhereDate('date', '=', $date)->delete();
$selectContextMetrics = DB::table($this->table)
->select(DB::raw('load_id, context_id, DATE(date) as date, count(*) as metric'))
->where('load_id', '=', $loadId)
->where('assoc_type', '=', Application::getContextAssocType())
->groupBy(DB::raw('load_id, context_id, DATE(date)'));
DB::table('metrics_context')->insertUsing(['load_id', 'context_id', 'date', 'metric'], $selectContextMetrics);
}
/**
* Load usage for submissions (abstract, primary and supp files)
*/
public function compileSubmissionMetrics(string $loadId): void
{
$date = DateTimeImmutable::createFromFormat('Ymd', substr($loadId, -12, 8));
DB::table('metrics_submission')->where('load_id', '=', $loadId)->orWhereDate('date', '=', $date)->delete();
$selectSubmissionMetrics = DB::table($this->table)
->select(DB::raw('load_id, context_id, submission_id, assoc_type, DATE(date) as date, count(*) as metric'))
->where('load_id', '=', $loadId)
->where('assoc_type', '=', Application::ASSOC_TYPE_SUBMISSION)
->groupBy(DB::raw('load_id, context_id, submission_id, assoc_type, DATE(date)'));
DB::table('metrics_submission')->insertUsing(['load_id', 'context_id', 'submission_id', 'assoc_type', 'date', 'metric'], $selectSubmissionMetrics);
$selectSubmissionFileMetrics = DB::table($this->table)
->select(DB::raw('load_id, context_id, submission_id, representation_id, submission_file_id, file_type, assoc_type, DATE(date) as date, count(*) as metric'))
->where('load_id', '=', $loadId)
->where('assoc_type', '=', Application::ASSOC_TYPE_SUBMISSION_FILE)
->groupBy(DB::raw('load_id, context_id, submission_id, representation_id, submission_file_id, file_type, assoc_type, DATE(date)'));
DB::table('metrics_submission')->insertUsing(['load_id', 'context_id', 'submission_id', 'representation_id', 'submission_file_id', 'file_type', 'assoc_type', 'date', 'metric'], $selectSubmissionFileMetrics);
$selectSubmissionSuppFileMetrics = DB::table($this->table)
->select(DB::raw('load_id, context_id, submission_id, representation_id, submission_file_id, file_type, assoc_type, DATE(date) as date, count(*) as metric'))
->where('load_id', '=', $loadId)
->where('assoc_type', '=', Application::ASSOC_TYPE_SUBMISSION_FILE_COUNTER_OTHER)
->groupBy(DB::raw('load_id, context_id, submission_id, representation_id, submission_file_id, file_type, assoc_type, DATE(date)'));
DB::table('metrics_submission')->insertUsing(['load_id', 'context_id', 'submission_id', 'representation_id', 'submission_file_id', 'file_type', 'assoc_type', 'date', 'metric'], $selectSubmissionSuppFileMetrics);
}
// For the DB tables that contain also the unique metrics, this deletion by loadId is in a separate function,
// differently to the deletion for the tables above (metrics_context, metrics_issue and metrics_submission)
// The total metrics will be loaded here (s. load... functions below), unique metrics are loaded in UnsageStatsUnique... classes
public function deleteSubmissionGeoDailyByLoadId(string $loadId): void
{
$date = DateTimeImmutable::createFromFormat('Ymd', substr($loadId, -12, 8));
DB::table('metrics_submission_geo_daily')->where('load_id', '=', $loadId)->orWhereDate('date', '=', $date)->delete();
}
public function deleteCounterSubmissionDailyByLoadId(string $loadId): void
{
$date = DateTimeImmutable::createFromFormat('Ymd', substr($loadId, -12, 8));
DB::table('metrics_counter_submission_daily')->where('load_id', '=', $loadId)->orWhereDate('date', '=', $date)->delete();
}
public function deleteCounterSubmissionInstitutionDailyByLoadId(string $loadId): void
{
$date = DateTimeImmutable::createFromFormat('Ymd', substr($loadId, -12, 8));
DB::table('metrics_counter_submission_institution_daily')->where('load_id', '=', $loadId)->orWhereDate('date', '=', $date)->delete();
}
/**
* Load total geographical usage on the submission level
*/
public function compileSubmissionGeoDailyMetrics(string $loadId): void
{
// construct metric upsert
$metricUpsertSql = "
INSERT INTO metrics_submission_geo_daily (load_id, context_id, submission_id, date, country, region, city, metric, metric_unique)
SELECT * FROM (SELECT load_id, context_id, submission_id, DATE(date) as date, country, region, city, count(*) as metric_tmp, 0 as metric_unique
FROM {$this->table}
WHERE load_id = ? AND submission_id IS NOT NULL AND (country <> '' OR region <> '' OR city <> '')
GROUP BY load_id, context_id, submission_id, DATE(date), country, region, city) AS t
";
if (substr(Config::getVar('database', 'driver'), 0, strlen('postgres')) === 'postgres') {
$metricUpsertSql .= '
ON CONFLICT ON CONSTRAINT msgd_uc_load_context_submission_c_r_c_date DO UPDATE
SET metric = excluded.metric;
';
} else {
$metricUpsertSql .= '
ON DUPLICATE KEY UPDATE metric = metric_tmp;
';
}
DB::statement($metricUpsertSql, [$loadId]);
}
/**
* Load total COUNTER submission usage (investigations and requests)
*/
public function compileCounterSubmissionDailyMetrics(string $loadId): void
{
// construct metric_investigations upsert
$metricInvestigationsUpsertSql = "
INSERT INTO metrics_counter_submission_daily (load_id, context_id, submission_id, date, metric_investigations, metric_investigations_unique, metric_requests, metric_requests_unique)
SELECT * FROM (SELECT load_id, context_id, submission_id, DATE(date) as date, count(*) as metric, 0 as metric_investigations_unique, 0 as metric_requests, 0 as metric_requests_unique
FROM {$this->table}
WHERE load_id = ? AND submission_id IS NOT NULL
GROUP BY load_id, context_id, submission_id, DATE(date)) AS t
";
if (substr(Config::getVar('database', 'driver'), 0, strlen('postgres')) === 'postgres') {
$metricInvestigationsUpsertSql .= '
ON CONFLICT ON CONSTRAINT msd_uc_load_id_context_id_submission_id_date DO UPDATE
SET metric_investigations = excluded.metric_investigations;
';
} else {
$metricInvestigationsUpsertSql .= '
ON DUPLICATE KEY UPDATE metric_investigations = metric;
';
}
DB::statement($metricInvestigationsUpsertSql, [$loadId]);
// construct metric_requests upsert
$metricRequestsUpsertSql = "
INSERT INTO metrics_counter_submission_daily (load_id, context_id, submission_id, date, metric_investigations, metric_investigations_unique, metric_requests, metric_requests_unique)
SELECT * FROM (SELECT load_id, context_id, submission_id, DATE(date) as date, 0 as metric_investigations, 0 as metric_investigations_unique, count(*) as metric, 0 as metric_requests_unique
FROM {$this->table}
WHERE load_id = ? AND assoc_type = ?
GROUP BY load_id, context_id, submission_id, DATE(date)) AS t
";
if (substr(Config::getVar('database', 'driver'), 0, strlen('postgres')) === 'postgres') {
$metricRequestsUpsertSql .= '
ON CONFLICT ON CONSTRAINT msd_uc_load_id_context_id_submission_id_date DO UPDATE
SET metric_requests = excluded.metric_requests;
';
} else {
$metricRequestsUpsertSql .= '
ON DUPLICATE KEY UPDATE metric_requests = metric;
';
}
DB::statement($metricRequestsUpsertSql, [$loadId, Application::ASSOC_TYPE_SUBMISSION_FILE]);
}
/**
* Load total institutional COUNTER submission usage (investigations and requests)
*/
public function compileCounterSubmissionInstitutionDailyMetrics(string $loadId): void
{
// construct metric_investigations upsert
$metricInvestigationsUpsertSql = "
INSERT INTO metrics_counter_submission_institution_daily (load_id, context_id, submission_id, date, institution_id, metric_investigations, metric_investigations_unique, metric_requests, metric_requests_unique)
SELECT * FROM (
SELECT ustt.load_id, ustt.context_id, ustt.submission_id, DATE(ustt.date) as date, usit.institution_id, count(*) as metric, 0 as metric_investigations_unique, 0 as metric_requests, 0 as metric_requests_unique
FROM {$this->table} ustt
JOIN usage_stats_institution_temporary_records usit on (usit.load_id = ustt.load_id AND usit.line_number = ustt.line_number)
WHERE ustt.load_id = ? AND submission_id IS NOT NULL AND usit.institution_id = ?
GROUP BY ustt.load_id, ustt.context_id, ustt.submission_id, DATE(ustt.date), usit.institution_id) AS t
";
if (substr(Config::getVar('database', 'driver'), 0, strlen('postgres')) === 'postgres') {
$metricInvestigationsUpsertSql .= '
ON CONFLICT ON CONSTRAINT msid_uc_load_id_context_id_submission_id_institution_id_date DO UPDATE
SET metric_investigations = excluded.metric_investigations;
';
} else {
$metricInvestigationsUpsertSql .= '
ON DUPLICATE KEY UPDATE metric_investigations = metric;
';
}
// construct metric_requests upsert
$metricRequestsUpsertSql = "
INSERT INTO metrics_counter_submission_institution_daily (load_id, context_id, submission_id, date, institution_id, metric_investigations, metric_investigations_unique, metric_requests, metric_requests_unique)
SELECT * FROM (
SELECT ustt.load_id, ustt.context_id, ustt.submission_id, DATE(ustt.date) as date, usit.institution_id, 0 as metric_investigations, 0 as metric_investigations_unique, count(*) as metric, 0 as metric_requests_unique
FROM {$this->table} ustt
JOIN usage_stats_institution_temporary_records usit on (usit.load_id = ustt.load_id AND usit.line_number = ustt.line_number)
WHERE ustt.load_id = ? AND ustt.assoc_type = ? AND usit.institution_id = ?
GROUP BY ustt.load_id, ustt.context_id, ustt.submission_id, DATE(ustt.date), usit.institution_id) AS t
";
if (substr(Config::getVar('database', 'driver'), 0, strlen('postgres')) === 'postgres') {
$metricRequestsUpsertSql .= '
ON CONFLICT ON CONSTRAINT msid_uc_load_id_context_id_submission_id_institution_id_date DO UPDATE
SET metric_requests = excluded.metric_requests;
';
} else {
$metricRequestsUpsertSql .= '
ON DUPLICATE KEY UPDATE metric_requests = metric;
';
}
/** @var TemporaryInstitutionsDAO */
$temporaryInstitutionsDAO = DAORegistry::getDAO('TemporaryInstitutionsDAO');
$institutionIds = $temporaryInstitutionsDAO->getInstitutionIdsByLoadId($loadId);
foreach ($institutionIds as $institutionId) {
DB::statement($metricInvestigationsUpsertSql, [$loadId, (int) $institutionId]);
DB::statement($metricRequestsUpsertSql, [$loadId, Application::ASSOC_TYPE_SUBMISSION_FILE, (int) $institutionId]);
}
}
}