1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
|
# -*- text -*-
#
# main/mysql/process-radacct.sql -- Schema extensions for processing radacct entries
#
# $Id$
-- ---------------------------------
-- - Per-user data usage over time -
-- ---------------------------------
--
-- An extension to the standard schema to hold per-user data usage statistics
-- for arbitrary periods.
--
-- The data_usage_by_period table is populated by periodically calling the
-- fr_new_data_usage_period stored procedure.
--
-- This table can be queried in various ways to produce reports of aggregate
-- data use over time. For example, if the fr_new_data_usage_period SP is
-- invoked one per day just after midnight, to produce usage data with daily
-- granularity, then a reasonably accurate monthly bandwidth summary for a
-- given user could be obtained with:
--
-- SELECT
-- DATE_FORMAT(period_start, '%Y-%M') AS month,
-- SUM(acctinputoctets)/1000/1000/1000 AS GB_in,
-- SUM(acctoutputoctets)/1000/1000/1000 AS GB_out
-- FROM
-- data_usage_by_period
-- WHERE
-- username='bob' AND
-- period_end IS NOT NULL
-- GROUP BY
-- YEAR(period_start), MONTH(period_start);
--
-- +----------------+----------------+-----------------+
-- | month | GB_in | GB_out |
-- +----------------+----------------+-----------------+
-- | 2019-July | 5.782279230000 | 50.545664820000 |
-- | 2019-August | 4.230543340000 | 48.523096420000 |
-- | 2019-September | 4.847360590000 | 48.631835480000 |
-- | 2019-October | 6.456763250000 | 51.686231930000 |
-- | 2019-November | 6.362537730000 | 52.385710570000 |
-- | 2019-December | 4.301524440000 | 50.762240270000 |
-- | 2020-January | 5.436280540000 | 49.067775280000 |
-- +----------------+----------------+-----------------+
-- 7 rows in set (0.000 sec)
--
CREATE TABLE data_usage_by_period (
username VARCHAR(64),
period_start DATETIME,
period_end DATETIME,
acctinputoctets BIGINT(20),
acctoutputoctets BIGINT(20),
PRIMARY KEY (username,period_start)
);
CREATE INDEX idx_data_usage_by_period_period_start ON data_usage_by_period (period_start);
CREATE INDEX idx_data_usage_by_period_period_end ON data_usage_by_period (period_end);
--
-- Stored procedure that when run with some arbitrary frequency, say
-- once per day by cron, will process the recent radacct entries to extract
-- time-windowed data containing acct{input,output}octets ("data usage") per
-- username, per period.
--
-- Each invocation will create new rows in the data_usage_by_period tables
-- containing the data used by each user since the procedure was last invoked.
-- The intervals do not need to be identical but care should be taken to
-- ensure that the start/end of each period aligns well with any intended
-- reporting intervals.
--
-- It can be invoked by running:
--
-- CALL fr_new_data_usage_period();
--
--
DELIMITER $$
DROP PROCEDURE IF EXISTS fr_new_data_usage_period;
CREATE PROCEDURE fr_new_data_usage_period ()
SQL SECURITY INVOKER
BEGIN
DECLARE v_start DATETIME;
DECLARE v_end DATETIME;
DECLARE EXIT HANDLER FOR SQLEXCEPTION
BEGIN
ROLLBACK;
RESIGNAL;
END;
SELECT IFNULL(DATE_ADD(MAX(period_end), INTERVAL 1 SECOND), FROM_UNIXTIME(0)) INTO v_start FROM data_usage_by_period;
SELECT NOW() INTO v_end;
START TRANSACTION;
--
-- Add the data usage for the sessions that were active in the current
-- period to the table. Include all sessions that finished since the start
-- of this period as well as those still ongoing.
--
INSERT INTO data_usage_by_period (username, period_start, period_end, acctinputoctets, acctoutputoctets)
SELECT *
FROM (
SELECT
username,
v_start,
v_end,
SUM(acctinputoctets) AS acctinputoctets,
SUM(acctoutputoctets) AS acctoutputoctets
FROM ((
SELECT
username, acctinputoctets, acctoutputoctets
FROM
radacct
WHERE
acctstoptime > v_start
) UNION ALL (
SELECT
username, acctinputoctets, acctoutputoctets
FROM
radacct
WHERE
acctstoptime IS NULL
)) AS a
GROUP BY
username
) AS s
ON DUPLICATE KEY UPDATE
acctinputoctets = data_usage_by_period.acctinputoctets + s.acctinputoctets,
acctoutputoctets = data_usage_by_period.acctoutputoctets + s.acctoutputoctets,
period_end = v_end;
--
-- Create an open-ended "next period" for all ongoing sessions and carry a
-- negative value of their data usage to avoid double-accounting when we
-- process the next period. Their current data usage has already been
-- allocated to the current and possibly previous periods.
--
INSERT INTO data_usage_by_period (username, period_start, period_end, acctinputoctets, acctoutputoctets)
SELECT *
FROM (
SELECT
username,
DATE_ADD(v_end, INTERVAL 1 SECOND),
NULL,
0 - SUM(acctinputoctets),
0 - SUM(acctoutputoctets)
FROM
radacct
WHERE
acctstoptime IS NULL
GROUP BY
username
) AS s;
COMMIT;
END$$
DELIMITER ;
-- ------------------------------------------------------
-- - "Lightweight" Accounting-On/Off strategy resources -
-- ------------------------------------------------------
--
-- The following resources are for use only when the "lightweight"
-- Accounting-On/Off strategy is enabled in queries.conf.
--
-- Instead of bulk closing the radacct sessions belonging to a reloaded NAS,
-- this strategy leaves them open and records the NAS reload time in the
-- nasreload table.
--
-- Where applicable, the onus is on the administator to:
--
-- * Consider the nas reload times when deriving a list of
-- active/inactive sessions, and when determining the duration of sessions
-- interrupted by a NAS reload. (Refer to the view below.)
--
-- * Close the affected sessions out of band. (Refer to the SP below.)
--
--
-- The radacct_with_reloads view presents the radacct table with two additional
-- columns: acctstoptime_with_reloads and acctsessiontime_with_reloads
--
-- Where the session isn't closed (acctstoptime IS NULL), yet it started before
-- the last reload of the NAS (radacct.acctstarttime < nasreload.reloadtime),
-- the derived columns are set based on the reload time of the NAS (effectively
-- the point in time that the session was interrupted.)
--
CREATE VIEW radacct_with_reloads AS
SELECT
a.*,
COALESCE(a.acctstoptime,
IF(a.acctstarttime < n.reloadtime, n.reloadtime, NULL)
) AS acctstoptime_with_reloads,
COALESCE(a.acctsessiontime,
IF(a.acctstoptime IS NULL AND a.acctstarttime < n.reloadtime,
UNIX_TIMESTAMP(n.reloadtime) - UNIX_TIMESTAMP(a.acctstarttime), NULL)
) AS acctsessiontime_with_reloads
FROM radacct a
LEFT OUTER JOIN nasreload n USING (nasipaddress);
--
-- It may be desirable to periodically "close" radacct sessions belonging to a
-- reloaded NAS, replicating the "bulk close" Accounting-On/Off behaviour,
-- just not in real time.
--
-- The fr_radacct_close_after_reload SP will set radacct.acctstoptime to
-- nasreload.reloadtime, calculate the corresponding radacct.acctsessiontime,
-- and set acctterminatecause to "NAS reboot" for interrupted sessions. It
-- does so in batches, which avoids long-lived locks on the affected rows.
--
-- It can be invoked as follows:
--
-- CALL fr_radacct_close_after_reload();
--
-- Note: This SP walks radacct in strides of v_batch_size. It will typically
-- skip closed and ongoing sessions at a rate significantly faster than
-- 100,000 rows per second and process batched updates faster than 20,000
-- orphaned sessions per second. If this isn't fast enough then you should
-- really consider using a custom schema that includes partitioning by
-- nasipaddress or acct{start,stop}time.
--
DELIMITER $$
DROP PROCEDURE IF EXISTS fr_radacct_close_after_reload;
CREATE PROCEDURE fr_radacct_close_after_reload ()
SQL SECURITY INVOKER
BEGIN
DECLARE v_a BIGINT(21);
DECLARE v_z BIGINT(21);
DECLARE v_updated BIGINT(21) DEFAULT 0;
DECLARE v_last_report DATETIME DEFAULT 0;
DECLARE v_last BOOLEAN DEFAULT FALSE;
DECLARE v_batch_size INT(12);
--
-- This works for many circumstances
--
SET v_batch_size = 2500;
SELECT MIN(radacctid) INTO v_a FROM radacct WHERE acctstoptime IS NULL;
update_loop: LOOP
SET v_z = NULL;
SELECT radacctid INTO v_z FROM radacct WHERE radacctid > v_a ORDER BY radacctid LIMIT v_batch_size,1;
IF v_z IS NULL THEN
SELECT MAX(radacctid) INTO v_z FROM radacct;
SET v_last = TRUE;
END IF;
UPDATE radacct a INNER JOIN nasreload n USING (nasipaddress)
SET
acctstoptime = n.reloadtime,
acctsessiontime = UNIX_TIMESTAMP(n.reloadtime) - UNIX_TIMESTAMP(acctstarttime),
acctterminatecause = 'NAS reboot'
WHERE
radacctid BETWEEN v_a AND v_z
AND acctstoptime IS NULL
AND acctstarttime < n.reloadtime;
SET v_updated = v_updated + ROW_COUNT();
SET v_a = v_z + 1;
--
-- Periodically report how far we've got
--
IF v_last_report != NOW() OR v_last THEN
SELECT v_z AS latest_radacctid, v_updated AS sessions_closed;
SET v_last_report = NOW();
END IF;
IF v_last THEN
LEAVE update_loop;
END IF;
END LOOP;
END$$
DELIMITER ;
|