/* * [ImportQuotesFromHTML.java] * * Summary: Imports quote collection from HTML to the database. * * Copyright: (c) 2014-2017 Roedy Green, Canadian Mind Products, http://mindprod.com * * Licence: This software may be copied and used freely for any purpose but military. * http://mindprod.com/contact/nonmil.html * * Requires: JDK 1.8+ * * Created with: JetBrains IntelliJ IDEA IDE http://www.jetbrains.com/idea/ * * Version History: * 1.0 2014-08-08 initial version */ package com.mindprod.quotedb; import com.mindprod.common18.BigDate; import com.mindprod.common18.Chunkify; import com.mindprod.common18.EIO; import com.mindprod.hunkio.HunkIO; import java.io.File; import java.io.IOException; import java.sql.Connection; import java.util.regex.Matcher; import java.util.regex.Pattern; /** * Imports quote collection from HTML to the database. * * @author Roedy Green, Canadian Mind Products * @version 1.0 2014-08-08 initial version * @since 2014-08-08 */ public class ImportQuotesFromHTML { private static final Pattern AUTHOR_EXTRACTOR = Pattern.compile( "([ -;=\\?-~])" ); private static final Pattern BIRTH_EXTRACTOR = Pattern.compile( "