DB utils update for db initialization
[dmaap/datarouter.git] / datarouter-prov / src / main / java / org / onap / dmaap / datarouter / provisioning / utils / LogfileLoader.java
1 /*******************************************************************************\r
2  * ============LICENSE_START==================================================\r
3  * * org.onap.dmaap\r
4  * * ===========================================================================\r
5  * * Copyright © 2017 AT&T Intellectual Property. All rights reserved.\r
6  * * ===========================================================================\r
7  * * Licensed under the Apache License, Version 2.0 (the "License");\r
8  * * you may not use this file except in compliance with the License.\r
9  * * You may obtain a copy of the License at\r
10  * * \r
11  *  *      http://www.apache.org/licenses/LICENSE-2.0\r
12  * * \r
13  *  * Unless required by applicable law or agreed to in writing, software\r
14  * * distributed under the License is distributed on an "AS IS" BASIS,\r
15  * * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\r
16  * * See the License for the specific language governing permissions and\r
17  * * limitations under the License.\r
18  * * ============LICENSE_END====================================================\r
19  * *\r
20  * * ECOMP is a trademark and service mark of AT&T Intellectual Property.\r
21  * *\r
22  ******************************************************************************/\r
23 \r
24 \r
25 package org.onap.dmaap.datarouter.provisioning.utils;\r
26 \r
27 import java.io.File;\r
28 import java.io.FileInputStream;\r
29 import java.io.FileNotFoundException;\r
30 import java.io.FileReader;\r
31 import java.io.FilenameFilter;\r
32 import java.io.IOException;\r
33 import java.io.InputStreamReader;\r
34 import java.io.LineNumberReader;\r
35 import java.io.Reader;\r
36 import java.sql.Connection;\r
37 import java.sql.PreparedStatement;\r
38 import java.sql.ResultSet;\r
39 import java.sql.SQLException;\r
40 import java.sql.Statement;\r
41 import java.text.ParseException;\r
42 import java.util.Date;\r
43 import java.util.HashMap;\r
44 import java.util.Iterator;\r
45 import java.util.Map;\r
46 import java.util.TreeSet;\r
47 import java.util.zip.GZIPInputStream;\r
48 \r
49 import org.apache.log4j.Logger;\r
50 import org.onap.dmaap.datarouter.provisioning.BaseServlet;\r
51 import org.onap.dmaap.datarouter.provisioning.beans.DeliveryExtraRecord;\r
52 import org.onap.dmaap.datarouter.provisioning.beans.DeliveryRecord;\r
53 import org.onap.dmaap.datarouter.provisioning.beans.ExpiryRecord;\r
54 import org.onap.dmaap.datarouter.provisioning.beans.Loadable;\r
55 import org.onap.dmaap.datarouter.provisioning.beans.LogRecord;\r
56 import org.onap.dmaap.datarouter.provisioning.beans.Parameters;\r
57 import org.onap.dmaap.datarouter.provisioning.beans.PubFailRecord;\r
58 import org.onap.dmaap.datarouter.provisioning.beans.PublishRecord;\r
59 \r
60 /**\r
61  * This class provides methods that run in a separate thread, in order to process logfiles uploaded into the spooldir.\r
62  * These logfiles are loaded into the MariaDB LOG_RECORDS table. In a running provisioning server, there should only be\r
63  * two places where records can be loaded into this table; here, and in the method DB.retroFit4() which may be run at\r
64  * startup to load the old (1.0) style log tables into LOG_RECORDS;\r
65  * <p>This method maintains an {@link RLEBitSet} which can be used to easily see what records are presently in the\r
66  * database.\r
67  * This bit set is used to synchronize between provisioning servers.</p>\r
68  *\r
69  * @author Robert Eby\r
70  * @version $Id: LogfileLoader.java,v 1.22 2014/03/12 19:45:41 eby Exp $\r
71  */\r
72 public class LogfileLoader extends Thread {\r
73         /** Default number of log records to keep when pruning.  Keep 10M by default. */\r
74         public static final long DEFAULT_LOG_RETENTION = 10000000L;\r
75         /** NOT USED: Percentage of free space required before old records are removed. */\r
76         public static final int REQUIRED_FREE_PCT = 20;\r
77 \r
78         /** This is a singleton -- there is only one LogfileLoader object in the server */\r
79         private static LogfileLoader p;\r
80 \r
81         /**\r
82          * Get the singleton LogfileLoader object, and start it if it is not running.\r
83          * @return the LogfileLoader\r
84          */\r
85         public static synchronized LogfileLoader getLoader() {\r
86                 if (p == null)\r
87                         p = new LogfileLoader();\r
88                 if (!p.isAlive())\r
89                         p.start();\r
90                 return p;\r
91         }\r
92 \r
93         /** The PreparedStatement which is loaded by a <i>Loadable</i>. */\r
94         public static final String INSERT_SQL = "insert into LOG_RECORDS values (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)";\r
95         /** Each server can assign this many IDs */\r
96         private static final long SET_SIZE = (1L << 56);\r
97 \r
98         private final Logger logger;\r
99         private final DB db;\r
100         private final String spooldir;\r
101         private final long set_start;\r
102         private final long set_end;\r
103         private RLEBitSet seq_set;\r
104         private long nextid;\r
105         private boolean idle;\r
106 \r
107         private LogfileLoader() {\r
108                 this.logger   = Logger.getLogger("org.onap.dmaap.datarouter.provisioning.internal");\r
109                 this.db       = new DB();\r
110                 this.spooldir = db.getProperties().getProperty("org.onap.dmaap.datarouter.provserver.spooldir");\r
111                 this.set_start = getIdRange();\r
112                 this.set_end   = set_start + SET_SIZE - 1;\r
113                 this.seq_set  = new RLEBitSet();\r
114                 this.nextid   = 0;\r
115                 this.idle     = false;\r
116 \r
117                 // This is a potentially lengthy operation, so has been moved to run()\r
118                 //initializeNextid();\r
119                 this.setDaemon(true);\r
120                 this.setName("LogfileLoader");\r
121         }\r
122 \r
123         private long getIdRange() {\r
124                 long n;\r
125                 if (BaseServlet.isInitialActivePOD())\r
126                         n = 0;\r
127                 else if (BaseServlet.isInitialStandbyPOD())\r
128                         n = SET_SIZE;\r
129                 else\r
130                         n = SET_SIZE * 2;\r
131                 String r = String.format("[%X .. %X]", n, n+SET_SIZE-1);\r
132                 logger.debug("This server shall assign RECORD_IDs in the range "+r);\r
133                 return n;\r
134         }\r
135         /**\r
136          * Return the bit set representing the record ID's that are loaded in this database.\r
137          * @return the bit set\r
138          */\r
139         public RLEBitSet getBitSet() {\r
140                 return seq_set;\r
141         }\r
142         /**\r
143          * True if the LogfileLoader is currently waiting for work.\r
144          * @return true if idle\r
145          */\r
146         public boolean isIdle() {\r
147                 return idle;\r
148         }\r
149         /**\r
150          * Run continuously to look for new logfiles in the spool directory and import them into the DB.\r
151          * The spool is checked once per second.  If free space on the MariaDB filesystem falls below\r
152          * REQUIRED_FREE_PCT (normally 20%) then the oldest logfile entries are removed and the LOG_RECORDS\r
153          * table is compacted until free space rises above the threshold.\r
154          */\r
155         @Override\r
156         public void run() {\r
157                 initializeNextid();     // moved from the constructor\r
158                 while (true) {\r
159                         try {\r
160                                 File dirfile = new File(spooldir);\r
161                                 while (true) {\r
162                                         // process IN files\r
163                                         File[] infiles = dirfile.listFiles(new FilenameFilter() {\r
164                                                 @Override\r
165                                                 public boolean accept(File dir, String name) {\r
166                                                         return name.startsWith("IN.");\r
167                                                 }\r
168                                         });\r
169 \r
170                                         if (infiles.length == 0) {\r
171                                                 idle = true;\r
172                                                 try {\r
173                                                         Thread.sleep(1000L);\r
174                                                 } catch (InterruptedException e) {\r
175                                                 }\r
176                                                 idle = false;\r
177                                         } else {\r
178                                                 // Remove old rows\r
179                                                 if (pruneRecords()) {\r
180                                                         // Removed at least some entries, recompute the bit map\r
181                                                         initializeNextid();\r
182                                                 }\r
183 \r
184                                                 // Process incoming logfiles\r
185                                                 for (File f : infiles) {\r
186                                                         if (logger.isDebugEnabled())\r
187                                                                 logger.debug("PROV8001 Starting " + f + " ...");\r
188                                                         long time = System.currentTimeMillis();\r
189                                                         int[] n = process(f);\r
190                                                         time = System.currentTimeMillis() - time;\r
191                                                         logger.info(String\r
192                                                                         .format("PROV8000 Processed %s in %d ms; %d of %d records.",\r
193                                                                                         f.toString(), time, n[0], n[1]));\r
194                                                         f.delete();\r
195                                                 }\r
196                                         }\r
197                                 }\r
198                         } catch (Exception e) {\r
199                                 logger.warn("PROV0020: Caught exception in LogfileLoader: " + e);\r
200                                 e.printStackTrace();\r
201                         }\r
202                 }\r
203         }\r
204         private boolean pruneRecords() {\r
205                 boolean did1 = false;\r
206                 long count = countRecords();\r
207                 long threshold = DEFAULT_LOG_RETENTION;\r
208                 Parameters param = Parameters.getParameter(Parameters.PROV_LOG_RETENTION);\r
209                 if (param != null) {\r
210                         try {\r
211                                 long n = Long.parseLong(param.getValue());\r
212                                 // This check is to prevent inadvertent errors from wiping the table out\r
213                                 if (n > 1000000L)\r
214                                         threshold = n;\r
215                         } catch (NumberFormatException e) {\r
216                                 // ignore\r
217                         }\r
218                 }\r
219                 logger.debug("Pruning LOG_RECORD table: records in DB="+count+", threshold="+threshold);\r
220                 if (count > threshold) {\r
221                         count -= threshold;                                             // we need to remove this many records;\r
222                         Map<Long,Long> hist = getHistogram();   // histogram of records per day\r
223                         // Determine the cutoff point to remove the needed number of records\r
224                         long sum = 0;\r
225                         long cutoff = 0;\r
226                         for (Long day : new TreeSet<Long>(hist.keySet())) {\r
227                                 sum += hist.get(day);\r
228                                 cutoff = day;\r
229                                 if (sum >= count)\r
230                                         break;\r
231                         }\r
232                         cutoff++;\r
233                         cutoff *= 86400000L;            // convert day to ms\r
234                         logger.debug("  Pruning records older than="+(cutoff/86400000L)+" ("+new Date(cutoff)+")");\r
235 \r
236                         Connection conn = null;\r
237                         try {\r
238                                 // Limit to a million at a time to avoid typing up the DB for too long.\r
239                                 conn = db.getConnection();\r
240                                 PreparedStatement ps = conn.prepareStatement("DELETE from LOG_RECORDS where EVENT_TIME < ? limit 1000000");\r
241                                 ps.setLong(1, cutoff);\r
242                                 while (count > 0) {\r
243                                         if (!ps.execute()) {\r
244                                                 int dcount = ps.getUpdateCount();\r
245                                                 count -= dcount;\r
246                                                 logger.debug("  "+dcount+" rows deleted.");\r
247                                                 did1 |= (dcount!=0);\r
248                                                 if (dcount == 0)\r
249                                                         count = 0;      // prevent inf. loops\r
250                                         } else {\r
251                                                 count = 0;      // shouldn't happen!\r
252                                         }\r
253                                 }\r
254                                 ps.close();\r
255                                 Statement stmt = conn.createStatement();\r
256                                 stmt.execute("OPTIMIZE TABLE LOG_RECORDS");\r
257                                 stmt.close();\r
258                         } catch (SQLException e) {\r
259                                 System.err.println(e);\r
260                                 e.printStackTrace();\r
261                         } finally {\r
262                                 db.release(conn);\r
263                         }\r
264                 }\r
265                 return did1;\r
266         }\r
267         private long countRecords() {\r
268                 long count = 0;\r
269                 Connection conn = null;\r
270                 try {\r
271                         conn = db.getConnection();\r
272                         Statement stmt = conn.createStatement();\r
273                         ResultSet rs = stmt.executeQuery("SELECT COUNT(*) as COUNT from LOG_RECORDS");\r
274                         if (rs.next()) {\r
275                                 count = rs.getLong("COUNT");\r
276                         }\r
277                         rs.close();\r
278                         stmt.close();\r
279                 } catch (SQLException e) {\r
280                         System.err.println(e);\r
281                         e.printStackTrace();\r
282                 } finally {\r
283                         db.release(conn);\r
284                 }\r
285                 return count;\r
286         }\r
287         private Map<Long,Long> getHistogram() {\r
288                 Map<Long,Long> map = new HashMap<Long,Long>();\r
289                 Connection conn = null;\r
290                 try {\r
291                         logger.debug("  LOG_RECORD table histogram...");\r
292                         conn = db.getConnection();\r
293                         Statement stmt = conn.createStatement();\r
294                         ResultSet rs = stmt.executeQuery("SELECT FLOOR(EVENT_TIME/86400000) AS DAY, COUNT(*) AS COUNT FROM LOG_RECORDS GROUP BY DAY");\r
295                         while (rs.next()) {\r
296                                 long day = rs.getLong("DAY");\r
297                                 long cnt = rs.getLong("COUNT");\r
298                                 map.put(day, cnt);\r
299                                 logger.debug("  "+day + "  "+cnt);\r
300                         }\r
301                         rs.close();\r
302                         stmt.close();\r
303                 } catch (SQLException e) {\r
304                         System.err.println(e);\r
305                         e.printStackTrace();\r
306                 } finally {\r
307                         db.release(conn);\r
308                 }\r
309                 return map;\r
310         }\r
311         private void initializeNextid() {\r
312                 Connection conn = null;\r
313                 try {\r
314                         conn = db.getConnection();\r
315                         Statement stmt = conn.createStatement();\r
316                         // Build a bitset of all records in the LOG_RECORDS table\r
317                         // We need to run this SELECT in stages, because otherwise we run out of memory!\r
318                         RLEBitSet nbs = new RLEBitSet();\r
319                         final long stepsize = 6000000L;\r
320                         boolean go_again = true;\r
321                         for (long i = 0; go_again; i += stepsize) {\r
322                                 String sql = String.format("select RECORD_ID from LOG_RECORDS LIMIT %d,%d", i, stepsize);\r
323                                 ResultSet rs = stmt.executeQuery(sql);\r
324                                 go_again = false;\r
325                                 while (rs.next()) {\r
326                                         long n = rs.getLong("RECORD_ID");\r
327                                         nbs.set(n);\r
328                                         go_again = true;\r
329                                 }\r
330                                 rs.close();\r
331                         }\r
332                         stmt.close();\r
333                         seq_set = nbs;\r
334 \r
335                         // Compare with the range for this server\r
336                         // Determine the next ID for this set of record IDs\r
337                         RLEBitSet tbs = (RLEBitSet) nbs.clone();\r
338                         RLEBitSet idset = new RLEBitSet();\r
339                         idset.set(set_start, set_start+SET_SIZE);\r
340                         tbs.and(idset);\r
341                         long t = tbs.length();\r
342                         nextid = (t == 0) ? set_start : (t - 1);\r
343                         if (nextid >= set_start+SET_SIZE) {\r
344                                 // Handle wraparound, when the IDs reach the end of our "range"\r
345                                 Long[] last = null;\r
346                                 Iterator<Long[]> li = tbs.getRangeIterator();\r
347                                 while (li.hasNext()) {\r
348                                         last = li.next();\r
349                                 }\r
350                                 if (last != null) {\r
351                                         tbs.clear(last[0], last[1]+1);\r
352                                         t = tbs.length();\r
353                                         nextid = (t == 0) ? set_start : (t - 1);\r
354                                 }\r
355                         }\r
356                         logger.debug(String.format("initializeNextid, next ID is %d (%x)", nextid, nextid));\r
357                 } catch (SQLException e) {\r
358                         System.err.println(e);\r
359                         e.printStackTrace();\r
360                 } finally {\r
361                         db.release(conn);\r
362                 }\r
363         }\r
364 \r
365         @SuppressWarnings("resource")\r
366         private int[] process(File f) {\r
367                 int ok = 0, total = 0;\r
368                 try {\r
369                         Connection conn = db.getConnection();\r
370                         PreparedStatement ps = conn.prepareStatement(INSERT_SQL);\r
371                         Reader r = f.getPath().endsWith(".gz")\r
372                                 ? new InputStreamReader(new GZIPInputStream(new FileInputStream(f)))\r
373                                 : new FileReader(f);\r
374                         LineNumberReader in = new LineNumberReader(r);\r
375                         String line;\r
376                         while ((line = in.readLine()) != null) {\r
377                                 try {\r
378                                         for (Loadable rec : buildRecords(line)) {\r
379                                                 rec.load(ps);\r
380                                                 if (rec instanceof LogRecord) {\r
381                                                         LogRecord lr = ((LogRecord)rec);\r
382                                                         if (!seq_set.get(lr.getRecordId())) {\r
383                                                                 ps.executeUpdate();\r
384                                                                 seq_set.set(lr.getRecordId());\r
385                                                         } else\r
386                                                                 logger.debug("Duplicate record ignored: "+lr.getRecordId());\r
387                                                 } else {\r
388                                                         if (++nextid > set_end)\r
389                                                                 nextid = set_start;\r
390                                                         ps.setLong(18, nextid);\r
391                                                         ps.executeUpdate();\r
392                                                         seq_set.set(nextid);\r
393                                                 }\r
394                                                 ps.clearParameters();\r
395                                                 ok++;\r
396                                         }\r
397                                 } catch (SQLException e) {\r
398                                         logger.warn("PROV8003 Invalid value in record: "+line);\r
399                                         logger.debug(e);\r
400                                         e.printStackTrace();\r
401                                 } catch (NumberFormatException e) {\r
402                                         logger.warn("PROV8004 Invalid number in record: "+line);\r
403                                         logger.debug(e);\r
404                                         e.printStackTrace();\r
405                                 } catch (ParseException e) {\r
406                                         logger.warn("PROV8005 Invalid date in record: "+line);\r
407                                         logger.debug(e);\r
408                                         e.printStackTrace();\r
409                                 } catch (Exception e) {\r
410                                         logger.warn("PROV8006 Invalid pattern in record: "+line);\r
411                                         logger.debug(e);\r
412                                         e.printStackTrace();\r
413                                 }\r
414                                 total++;\r
415                         }\r
416                         in.close();\r
417                         ps.close();\r
418                         db.release(conn);\r
419                         conn = null;\r
420                 } catch (FileNotFoundException e) {\r
421                         logger.warn("PROV8007 Exception reading "+f+": "+e);\r
422                 } catch (IOException e) {\r
423                         logger.warn("PROV8007 Exception reading "+f+": "+e);\r
424                 } catch (SQLException e) {\r
425                         logger.warn("PROV8007 Exception reading "+f+": "+e);\r
426                 }\r
427                 return new int[] { ok, total };\r
428         }\r
429         private Loadable[] buildRecords(String line) throws ParseException {\r
430                 String[] pp = line.split("\\|");\r
431                 if (pp != null && pp.length >= 7) {\r
432                         String rtype = pp[1].toUpperCase();\r
433                         if (rtype.equals("PUB") && pp.length == 11) {\r
434                                 // Fields are: date|PUB|pubid|feedid|requrl|method|ctype|clen|srcip|user|status\r
435                                 return new Loadable[] { new PublishRecord(pp) };\r
436                         }\r
437                         if (rtype.equals("DEL") && pp.length == 12) {\r
438                                 // Fields are: date|DEL|pubid|feedid|subid|requrl|method|ctype|clen|user|status|xpubid\r
439                                 String[] subs = pp[4].split("\\s+");\r
440                                 if (subs != null) {\r
441                                         Loadable[] rv = new Loadable[subs.length];\r
442                                         for (int i = 0; i < subs.length; i++) {\r
443                                                 // create a new record for each individual sub\r
444                                                 pp[4] = subs[i];\r
445                                                 rv[i] = new DeliveryRecord(pp);\r
446                                         }\r
447                                         return rv;\r
448                                 }\r
449                         }\r
450                         if (rtype.equals("EXP") && pp.length == 11) {\r
451                                 // Fields are: date|EXP|pubid|feedid|subid|requrl|method|ctype|clen|reason|attempts\r
452                                 ExpiryRecord e = new ExpiryRecord(pp);\r
453                                 if (e.getReason().equals("other"))\r
454                                         logger.info("Invalid reason '"+pp[9]+"' changed to 'other' for record: "+e.getPublishId());\r
455                                 return new Loadable[] { e };\r
456                         }\r
457                         if (rtype.equals("PBF") && pp.length == 12) {\r
458                                 // Fields are: date|PBF|pubid|feedid|requrl|method|ctype|clen-expected|clen-received|srcip|user|error\r
459                                 return new Loadable[] { new PubFailRecord(pp) };\r
460                         }\r
461                         if (rtype.equals("DLX") && pp.length == 7) {\r
462                                 // Fields are: date|DLX|pubid|feedid|subid|clen-tosend|clen-sent\r
463                                 return new Loadable[] { new DeliveryExtraRecord(pp) };\r
464                         }\r
465                         if (rtype.equals("LOG") && (pp.length == 19 || pp.length == 20)) {\r
466                                 // Fields are: date|LOG|pubid|feedid|requrl|method|ctype|clen|type|feedFileid|remoteAddr|user|status|subid|fileid|result|attempts|reason|record_id\r
467                                 return new Loadable[] { new LogRecord(pp) };\r
468                         }\r
469                 }\r
470                 logger.warn("PROV8002 bad record: "+line);\r
471                 return new Loadable[0];\r
472         }\r
473 \r
474         /**\r
475          * The LogfileLoader can be run stand-alone by invoking the main() method of this class.\r
476          * @param a ignored\r
477          * @throws InterruptedException\r
478          */\r
479         public static void main(String[] a) throws InterruptedException {\r
480                 LogfileLoader.getLoader();\r
481                 Thread.sleep(200000L);\r
482         }\r
483 }\r