IndexerServiceImpl

/*
 * Copyright 2011 The Kuali Foundation.
 *
 * Licensed under the Educational Community License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.opensource.org/licenses/ecl2.php
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.kuali.ole.docstore.discovery.service;

import java.io.BufferedReader;
import java.io.File;
import java.io.FileReader;
import java.io.FilenameFilter;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.OutputStreamWriter;
import java.io.StringWriter;
import java.net.HttpURLConnection;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.ArrayList;
import java.util.Date;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.UUID;
import javax.xml.stream.XMLInputFactory;
import javax.xml.stream.XMLStreamConstants;
import javax.xml.stream.XMLStreamReader;
import javax.xml.transform.OutputKeys;
import javax.xml.transform.Transformer;
import javax.xml.transform.TransformerFactory;
import javax.xml.transform.stax.StAXSource;
import javax.xml.transform.stream.StreamResult;

import org.apache.commons.io.FileUtils;
import org.apache.commons.lang.time.StopWatch;
import org.apache.solr.client.solrj.SolrQuery;
import org.apache.solr.client.solrj.SolrServer;
import org.apache.solr.client.solrj.SolrServerException;
import org.apache.solr.client.solrj.impl.CommonsHttpSolrServer;
import org.apache.solr.client.solrj.response.QueryResponse;
import org.apache.solr.client.solrj.response.UpdateResponse;
import org.apache.solr.client.solrj.util.ClientUtils;
import org.apache.solr.common.SolrDocument;
import org.apache.solr.common.SolrInputDocument;
import org.apache.solr.common.SolrInputField;
import org.kuali.ole.docstore.discovery.solr.security.patron.oleml.SecurityPatronOlemlDocBuilder;
import org.kuali.ole.docstore.discovery.solr.work.bib.WorkBibCommonFields;
import org.kuali.ole.docstore.discovery.solr.work.bib.dublin.WorkBibDublinDocBuilder;
import org.kuali.ole.docstore.discovery.solr.work.bib.dublin.unqualified.WorkBibDublinUnQualifiedDocBuilder;
import org.kuali.ole.docstore.discovery.solr.work.bib.marc.WorkBibMarcDocBuilder;
import org.kuali.ole.docstore.discovery.solr.work.instance.oleml.WorkInstanceOlemlDocBuilder;
import org.kuali.ole.docstore.discovery.solr.work.license.binary.WorkLicenseBinaryDocBuilder;
import org.kuali.ole.docstore.discovery.solr.work.license.onixpl.WorkLicenseOnixplDocBuilder;
import org.kuali.ole.docstore.discovery.util.PropertyUtil;
import org.kuali.ole.docstore.model.enums.DocCategory;
import org.kuali.ole.docstore.model.enums.DocFormat;
import org.kuali.ole.docstore.model.enums.DocType;
import org.kuali.ole.docstore.model.xmlpojo.ingest.RequestDocument;
import org.kuali.ole.docstore.model.xmlpojo.work.bib.dublin.WorkBibDublinRecord;
import org.kuali.ole.docstore.model.xmlpojo.work.instance.oleml.Instance;
import org.kuali.ole.docstore.model.xmlpojo.work.instance.oleml.InstanceCollection;
import org.kuali.ole.docstore.model.xstream.work.bib.dublin.WorkBibDublinRecordProcessor;
import org.kuali.ole.docstore.model.xstream.work.bib.dublin.unqualified.WorkBibDublinUnQualifiedRecordProcessor;
import org.kuali.ole.docstore.model.xstream.work.bib.marc.WorkBibMarcRecordProcessor;
import org.kuali.ole.docstore.utility.BatchIngestStatistics;
import org.kuali.ole.docstore.utility.BulkIngestStatistics;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

/**
 * This class implements the {@link IndexerService} methods.
 * <p>
 * All updates to the Solr indexes should ideally take place through this class.
 * Some important notes about Solr:
 * Unlike a database, Solr has no distinct sessions (i.e. transactions) per client;
 * instead there is, in effect, one global modification state.
 * For that reason there should be only one process updating Solr.
 * It is recommended to explicitly optimize the Solr index at an opportune time
 * like after a bulk load of data and/or a daily interval in off-peak hours.
 * </p>
 */
public class IndexerServiceImpl
        implements IndexerService {
    /** Logger shared by all methods of this class. */
    private static final Logger LOG                   = LoggerFactory.getLogger(IndexerServiceImpl.class);
    /**
     * File-name marker: when a source file name contains this suffix, the part of the name
     * before it is used as the document id while indexing from files.
     */
    public static final  String UUID_FILE_NAME_SUFFIX = "_UUID_.xml";

    //    private static      String         docSearchUrl            = null;
    /** Lazily created singleton instance handed out by {@link #getInstance()}. */
    private static      IndexerService indexerService      = null;
    // NOTE(review): presumably a prefix for generated document ids - not referenced in this part of the file.
    public static final String         ID_FIELD_PREFIX     = "id_disc_";
    // NOTE(review): presumably a batch size for bulk operations - not referenced in this part of the file.
    public static final int            BATCH_SIZE          = 10000;
    // The following names are not referenced in this part of the file; they look like
    // field/category names used elsewhere in the class - confirm before changing.
    private final       String         BIBLIOGRAPHIC       = "bibliographic";
    private final       String         DOC_TYPE            = "DocType";
    private final       String         DOC_FORMAT          = "DocFormat";
    private final       String         HOLDINGS_IDENTIFIER = "holdingsIdentifier";
    private final       String         ITEM_IDENTIFIER     = "itemIdentifier";
    private final       String         INSTANCE            = "instance";


    /**
     * Private constructor: instances are obtained through {@link #getInstance()}.
     * Runs {@link #init()} as part of construction.
     */
    private IndexerServiceImpl() {
        this.init();
    }

    /**
     * Returns the shared {@link IndexerService}, creating it on first use.
     * <p>
     * NOTE(review): the lazy creation is not synchronized; confirm callers obtain the
     * instance from a single thread or that a duplicate instance is harmless.
     * </p>
     *
     * @return the singleton indexer service
     */
    public static IndexerService getInstance() {
        if (indexerService != null) {
            return indexerService;
        }
        indexerService = new IndexerServiceImpl();
        return indexerService;
    }

    /**
     * Initialization hook invoked from the constructor. Currently it only writes a debug log entry;
     * the former lookup of the "docSearchURL" property is kept below, commented out.
     */
    protected void init() {
        final String message = "IndexerServiceImpl init ";
        LOG.debug(message);
        // Disabled property lookup, retained for reference:
        //        docSearchUrl = PropertyUtil.getPropertyUtil().getProperty("docSearchURL");
        //        if ((null != docSearchUrl) && !docSearchUrl.endsWith("/")) {
        //            docSearchUrl = docSearchUrl + "/";
        //        }
    }

    /**
     * Deletes the documents identified by the given UUIDs by delegating to
     * {@code deleteDocumentsByUUIDList}.
     *
     * @param docCategory category of the documents to delete
     * @param uuidList    UUIDs of the documents to delete
     * @return the result string produced by {@code deleteDocumentsByUUIDList}
     * @throws MalformedURLException declared by this method; see the delegate for the cause
     * @throws SolrServerException   declared by this method; see the delegate for the cause
     */
    public String deleteDocuments(String docCategory, List<String> uuidList)
            throws MalformedURLException, SolrServerException {
        return deleteDocumentsByUUIDList(uuidList, docCategory);
    }

    /**
     * Deletes a single document by delegating to {@code deleteDocumentByUUID}.
     *
     * @param docCategory category of the document to delete
     * @param uuid        UUID of the document to delete
     * @return the result string produced by {@code deleteDocumentByUUID}
     */
    public String deleteDocument(String docCategory, String uuid) {
        return deleteDocumentByUUID(uuid, docCategory);
    }

    /**
     * Indexes the given Solr documents with the commit flag set to {@code true}.
     *
     * @param solrDocs documents to index
     * @return the result of {@link #indexSolrDocuments(List, boolean)}
     */
    public String indexSolrDocuments(List<SolrInputDocument> solrDocs) {
        final boolean commit = true;
        return indexSolrDocuments(solrDocs, commit);
    }

    /**
     * Indexes the given Solr documents and logs how long the operation took.
     * Any exception is caught, logged, and converted into a failure message.
     *
     * @param solrDocs documents to index
     * @param commit   commit flag forwarded to the three-argument overload
     * @return the result of the three-argument overload, or a failure message built by
     *         {@code buildFailureMsg} if an exception occurred
     */
    public String indexSolrDocuments(List<SolrInputDocument> solrDocs, boolean commit) {
        final StopWatch stopWatch = new StopWatch();
        stopWatch.start();
        String outcome;
        try {
            outcome = indexSolrDocuments(solrDocs, commit, false);
            stopWatch.stop();
            final int docCount = solrDocs.size();
            LOG.info("Time taken for indexing " + docCount + " Solr docs:" + stopWatch.toString());
        }
        catch (Exception e) {
            outcome = buildFailureMsg(null, "Indexing failed. " + e.getMessage());
            LOG.error(outcome, e);
        }
        return outcome;
    }

    /**
     * Indexes every {@code *.xml} file (hidden "dot" files excluded) found directly in the given directory
     * by delegating to {@link #indexDocumentsFromFiles(String, String, String, List)}.
     *
     * @param docCategory category of the documents expected in the files
     * @param docType     type of the documents expected in the files
     * @param docFormat   format of the documents expected in the files
     * @param dataDir     path of the directory holding the files; {@code null} is reported as invalid
     * @return the result of {@code indexDocumentsFromFiles}, or a failure message when the directory is
     *         invalid or contains no matching files
     */
    @Override
    public String indexDocumentsFromDirBySolrDoc(String docCategory, String docType, String docFormat, String dataDir) {
        // new File(null) would throw a NullPointerException, so reject a null path up front.
        if (dataDir == null) {
            return buildFailureMsg(null, "Invalid data directory:" + dataDir);
        }
        File srcDir = new File(dataDir);
        if (!srcDir.isDirectory()) {
            return buildFailureMsg(null, "Invalid data directory:" + dataDir);
        }
        FilenameFilter filter = new FilenameFilter() {
            public boolean accept(File dir, String name) {
                return (!name.startsWith(".") && (name.endsWith(".xml")));
            }
        };

        // File.list returns null on an I/O error, hence the explicit null check.
        String[] srcFileNames = srcDir.list(filter);
        if ((null == srcFileNames) || (srcFileNames.length == 0)) {
            return buildFailureMsg(null, "No data files found in data dir:" + dataDir);
        }
        List<File> fileList = new ArrayList<File>(srcFileNames.length);
        for (String srcFileName : srcFileNames) {
            fileList.add(new File(srcDir, srcFileName));
        }
        return indexDocumentsFromFiles(docCategory, docType, docFormat, fileList);
    }

    /**
     * Indexes documents supplied as an XML string. The content is written (UTF-8) to a temporary file,
     * indexed through {@link #indexDocumentsFromFileBySolrDoc(String, String, String, String)}, and the
     * temporary file is removed afterwards.
     *
     * @param docCategory category of the documents in {@code data}
     * @param docType     type of the documents in {@code data}
     * @param docFormat   format of the documents in {@code data}
     * @param data        XML content to index
     * @return the result of {@code indexDocumentsFromFileBySolrDoc}
     * @throws IOException if the temporary file cannot be created or written
     */
    @Override
    public String indexDocumentsFromStringBySolrDoc(String docCategory, String docType, String docFormat, String data)
            throws IOException {

        File file = File.createTempFile("marc.xml", ".tmp");
        try {
            FileUtils.writeStringToFile(file, data, "UTF-8");
            return indexDocumentsFromFileBySolrDoc(docCategory, docType, docFormat, file.getAbsolutePath());
        }
        finally {
            // Without this cleanup every call leaves a file behind in the temp directory.
            if (!file.delete()) {
                // Deletion can fail (e.g. file still open on some platforms); retry at JVM exit.
                file.deleteOnExit();
                LOG.warn("Unable to delete temporary file: " + file.getAbsolutePath());
            }
        }
    }

    /**
     * Indexes the documents contained in a single file by wrapping it in a one-element list and
     * delegating to {@link #indexDocumentsFromFiles(String, String, String, List)}.
     *
     * @param docCategory category of the documents expected in the file
     * @param docType     type of the documents expected in the file
     * @param docFormat   format of the documents expected in the file
     * @param filePath    path of the file to index
     * @return the result of {@code indexDocumentsFromFiles}
     */
    @Override
    public String indexDocumentsFromFileBySolrDoc(String docCategory, String docType, String docFormat,
                                                  String filePath) {
        final List<File> singleFile = new ArrayList<File>(0);
        final File source = new File(filePath);
        singleFile.add(source);
        return indexDocumentsFromFiles(docCategory, docType, docFormat, singleFile);
    }


    /**
     * Indexes the records (of the given docCategory, docType and docFormat) contained in the given files.
     * <p>
     * This is a utility method to use Discovery separately from DocStore.
     * </p>
     * <p>
     * Each file is read with a StAX reader, converted to Solr documents, and sent to Solr in batches.
     * One commit is issued after all files have been processed. If a file cannot be processed, a Solr
     * rollback is attempted and a failure message is returned.
     * </p>
     *
     * @param docCategory category of the documents expected in the input files
     * @param docType     type of the documents expected in the input files
     * @param docFormat   format of the documents expected in the input files
     * @param fileList    list of files to be indexed
     * @return {@code SUCCESS + "-" + <number of documents>} on success, otherwise a failure message built by
     *         {@code buildFailureMsg}
     */
    @Override
    public String indexDocumentsFromFiles(String docCategory, String docType, String docFormat, List<File> fileList) {
        // TODO: Modify this method so that if dataDir is a file, it should be indexed.
        String result = null;
        String xmlContent = "";
        try {
            // Timers are started and immediately suspended so that they can be resumed/suspended
            // around the individual phases; StopWatch.resume() is only legal on a suspended watch.
            StopWatch indexingTimer = new StopWatch();
            StopWatch conversionTimer = new StopWatch();
            StopWatch fileIOTimer = new StopWatch();
            StopWatch totalTimer = new StopWatch();
            totalTimer.start();
            fileIOTimer.start();
            fileIOTimer.suspend();

            if ((null == fileList) || (fileList.size() == 0)) {
                result = buildFailureMsg(null, "No  files found in data dir:" + fileList);
                return result;
            }
            int numFiles = fileList.size();
            int numDocs = 0;
            SolrServer solr = SolrServerManager.getInstance().getSolrServer();
            // NOTE(review): JDK-internal Xalan factory is referenced directly; kept as-is because the
            // reason for pinning this implementation is not visible here.
            TransformerFactory tf = new com.sun.org.apache.xalan.internal.xsltc.trax.TransformerFactoryImpl();
            Transformer t = tf.newTransformer();
            t.setOutputProperty(OutputKeys.OMIT_XML_DECLARATION, "yes");
            t.setOutputProperty(OutputKeys.INDENT, "yes");
            conversionTimer.start();
            conversionTimer.suspend();
            indexingTimer.start();
            indexingTimer.suspend();
            for (int i = 0; i < fileList.size(); i++) {
                File srcFile = fileList.get(i);
                LOG.info("Processing File: " + srcFile.getAbsolutePath());
                String srcFileName = srcFile.getName();

                // Get the id of the doc from the file name if Exists.
                String idFromFileName = null;
                List<String> idFromFileNameList = null;
                int suffixIndex = srcFileName.indexOf(UUID_FILE_NAME_SUFFIX);
                if (suffixIndex > 0) {
                    idFromFileName = srcFileName.substring(0, suffixIndex);
                    idFromFileNameList = new ArrayList<String>(1);
                    idFromFileNameList.add(idFromFileName);
                }

                int recordsProcessedInFile = 0;
                FileReader fileReader = null;
                XMLStreamReader xsr = null;
                try {
                    XMLInputFactory xif = XMLInputFactory.newInstance();
                    // NOTE(review): FileReader decodes with the platform default charset - confirm input encoding.
                    fileReader = new FileReader(srcFile);
                    xsr = xif.createXMLStreamReader(fileReader);
                    xsr.nextTag();
                    List<SolrInputDocument> solrDocsToAdd = new ArrayList<SolrInputDocument>();
                    while (xsr.hasNext()) {
                        int eventType = xsr.next();
                        if (eventType != XMLStreamConstants.START_ELEMENT) {
                            continue;
                        }
                        // Scoped per element so that documents of a previous record are never added twice.
                        List<SolrInputDocument> solrDocs = null;
                        if (DocFormat.MARC.isEqualTo(docFormat)) {
                            recordsProcessedInFile++;
                            LOG.debug("Processing Record(" + recordsProcessedInFile + ") of File: " + srcFileName);
                            fileIOTimer.resume();
                            StringWriter str = new StringWriter();
                            str.append("<collection>");
                            t.transform(new StAXSource(xsr), new StreamResult(str));
                            str.append("</collection>");
                            xmlContent = str.getBuffer().toString();
                            fileIOTimer.suspend();
                            conversionTimer.resume();
                            solrDocs = convertToSolrDocs(docCategory, docType, docFormat, xmlContent);
                            if ((null == solrDocs) || (solrDocs.size() == 0)) {
                                // Suspend before skipping; otherwise the next resume() throws IllegalStateException.
                                conversionTimer.suspend();
                                continue;
                            }
                            if (idFromFileName == null) {
                                assignUUIDs(solrDocs, null);
                            }
                            else {
                                assignUUIDs(solrDocs.subList(0, 1), idFromFileNameList);
                            }
                            conversionTimer.suspend();
                            numDocs += solrDocs.size();
                        }
                        else if (DocFormat.DUBLIN_CORE.isEqualTo(docFormat)) {
                            // The whole file is converted in one go, so the element loop ends here.
                            // TODO: May be moved out of while loop?
                            conversionTimer.resume();
                            solrDocs = convertToSolrDocs(docCategory, docType, docFormat,
                                                         FileUtils.readFileToString(srcFile, "UTF-8"));
                            assignUUIDs(solrDocs, null);
                            conversionTimer.suspend();
                            solrDocsToAdd.addAll(solrDocs);
                            numDocs += solrDocs.size();
                            break;
                        }
                        else if (DocFormat.DUBLIN_UNQUALIFIED.isEqualTo(docFormat)) {
                            if (xsr.getName().getLocalPart().equalsIgnoreCase("record")) {
                                conversionTimer.resume();
                                StringWriter str = new StringWriter();
                                str.append("<OAI-PMH><ListRecords>");
                                t.transform(new StAXSource(xsr), new StreamResult(str));
                                str.append("</ListRecords></OAI-PMH>");
                                xmlContent = str.getBuffer().toString();
                                solrDocs = convertToSolrDocs(docCategory, docType, docFormat, xmlContent);
                                assignUUIDs(solrDocs, null);
                                conversionTimer.suspend();
                                numDocs += solrDocs.size();
                            }
                        }
                        else {
                            throw new Exception("Unsupported Document Format: " + docFormat);
                        }

                        if (solrDocs != null) {
                            solrDocsToAdd.addAll(solrDocs);
                        }
                        if (solrDocsToAdd.size() < 500) {
                            // Keep collecting until the batch is large enough to be worth sending.
                            // TODO: Handle the case when the size of the batch is too high. Do a check on the size.
                            continue;
                        }
                        indexingTimer.resume();
                        solr.add(solrDocsToAdd);
                        indexingTimer.suspend();
                        solrDocsToAdd.clear();
                        if (recordsProcessedInFile % 10000 == 0) {
                            totalTimer.split();
                            LOG.info("Records processed in file " + srcFileName + ":" + recordsProcessedInFile
                                     + "; Time elapsed:" + totalTimer.toSplitString());
                        }
                        if (idFromFileName != null || DocFormat.DUBLIN_CORE.isEqualTo(docFormat)) {
                            break;
                        }
                    }
                    // Send whatever is left over from the last, incomplete batch.
                    if (solrDocsToAdd.size() > 0) {
                        indexingTimer.resume();
                        solr.add(solrDocsToAdd);
                        indexingTimer.suspend();
                        solrDocsToAdd.clear();
                    }
                }
                catch (Exception ex) {
                    String message = "Failure while processing file '" + srcFile.getAbsolutePath() + "' \nat Record: "
                                     + recordsProcessedInFile + "\n" + xmlContent;
                    LOG.error(message, ex);
                    try {
                        solr.rollback();
                    }
                    catch (Exception rollbackEx) {
                        // Do not let a failing rollback hide the original cause.
                        LOG.error("Solr rollback failed after indexing error.", rollbackEx);
                    }
                    throw ex;
                }
                finally {
                    // XMLStreamReader.close() does not close the underlying reader, so close both.
                    if (xsr != null) {
                        try {
                            xsr.close();
                        }
                        catch (Exception closeEx) {
                            LOG.warn("Unable to close XML reader for file: " + srcFile.getAbsolutePath(), closeEx);
                        }
                    }
                    if (fileReader != null) {
                        try {
                            fileReader.close();
                        }
                        catch (IOException closeEx) {
                            LOG.warn("Unable to close file: " + srcFile.getAbsolutePath(), closeEx);
                        }
                    }
                }
                totalTimer.split();
                if (recordsProcessedInFile > 0) {
                    // Records are only counted for MARC input; skip the summary when nothing was counted.
                    LOG.info("Records processed in file " + srcFileName + ":" + recordsProcessedInFile
                             + "; Time elapsed:" + totalTimer.toSplitString());
                }
            }
            // commit after all docs are added.
            if (numDocs > 0) {
                indexingTimer.resume();
                solr.commit();
                indexingTimer.suspend();
            }

            conversionTimer.stop();
            fileIOTimer.stop();
            indexingTimer.stop();
            totalTimer.stop();
            LOG.info("Num of files processed:" + numFiles + "; Num of documents processed:" + numDocs);
            LOG.info("Time taken for reading files:" + fileIOTimer.toString()
                     + "; Time taken for parsing and converting to Solr Docs:" + conversionTimer.toString());
            LOG.info(
                    "Time taken for indexing Solr docs:" + indexingTimer.toString() + "; Total time taken:" + totalTimer
                            .toString());
            result = SUCCESS + "-" + numDocs;
        }
        catch (Exception e) {
            result = buildFailureMsg(null, "Indexing failed. " + e.getMessage());
            LOG.error(result, e);
        }
        return result;
    }

    //    public String indexDocuments(List<RequestDocument> requestDocuments) {
    //        for (RequestDocument requestDocument : requestDocuments) {
    //            indexDocument(requestDocument);
    //        }
    //        return null;
    //    }

    /**
     * Indexes a single request document with the commit flag set to {@code true}.
     *
     * @param requestDocument document to index
     * @return the result of {@link #indexDocument(RequestDocument, boolean)}
     */
    public String indexDocument(RequestDocument requestDocument) {
        final boolean commit = true;
        return indexDocument(requestDocument, commit);
    }

    /**
     * Indexes a single request document by wrapping it in a one-element list and delegating to
     * {@link #indexDocuments(List, boolean)}. A {@code null} document is forwarded as a {@code null} list.
     *
     * @param requestDocument document to index, may be {@code null}
     * @param commit          commit flag forwarded to {@code indexDocuments}
     * @return the result of {@code indexDocuments}
     */
    public String indexDocument(RequestDocument requestDocument, boolean commit) {
        if (requestDocument == null) {
            return indexDocuments((List<RequestDocument>) null, commit);
        }
        final List<RequestDocument> singleDocument = new ArrayList<RequestDocument>(1);
        singleDocument.add(requestDocument);
        return indexDocuments(singleDocument, commit);
    }

    /**
     * Indexes the given request documents with the commit flag set to {@code true}.
     *
     * @param requestDocuments documents to index
     * @return the result of {@link #indexDocuments(List, boolean)}
     */
    @Override
    public String indexDocuments(List<RequestDocument> requestDocuments) {
        final boolean commit = true;
        return indexDocuments(requestDocuments, commit);
    }

    /**
     * Converts the given request documents to Solr input documents, choosing the document builder from
     * each document's category, type and format, and indexes the result.
     * <p>
     * {@code null} entries in the list are skipped. An unsupported category, type or format, or any other
     * error during conversion, aborts the whole call: nothing is indexed and a failure message is returned.
     * </p>
     *
     * @param requestDocuments documents to convert and index; {@code null} is treated as empty input
     * @param commit           commit flag forwarded to {@link #indexSolrDocuments(List, boolean)}
     * @return the result of {@code indexSolrDocuments}, the literal {@code "success"} for a
     *         source-holdings OLEML document, or a failure message built by {@code buildFailureMsg}
     */
    @Override
    public String indexDocuments(List<RequestDocument> requestDocuments, boolean commit) {
        if (requestDocuments == null) {
            // A null list previously ended in this same message, via a caught NullPointerException.
            return buildFailureMsg(null, "No valid documents found in input.");
        }
        StopWatch timer = new StopWatch();
        StopWatch buildSolrInputDocTime = new StopWatch();
        StopWatch xmlToObjTime = new StopWatch();
        // Started and suspended here; passed to the MARC builder together with the documents.
        buildSolrInputDocTime.start();
        buildSolrInputDocTime.suspend();
        xmlToObjTime.start();
        xmlToObjTime.suspend();
        timer.start();
        List<SolrInputDocument> solrInputDocuments = new ArrayList<SolrInputDocument>();
        try {
            for (RequestDocument requestDocument : requestDocuments) {
                if (requestDocument == null) {
                    continue;
                }
                if (DocCategory.WORK.isEqualTo(requestDocument.getCategory())) {
                    if (DocType.BIB.isEqualTo(requestDocument.getType())) { // Bibliographic
                        if (DocFormat.MARC.isEqualTo(requestDocument.getFormat())) {
                            new WorkBibMarcDocBuilder()
                                    .buildSolrInputDocument(requestDocument, solrInputDocuments, buildSolrInputDocTime,
                                                            xmlToObjTime);
                        }
                        else if (DocFormat.DUBLIN_CORE.isEqualTo(requestDocument.getFormat())) {
                            new WorkBibDublinDocBuilder().buildSolrInputDocument(requestDocument, solrInputDocuments);
                        }
                        else if (DocFormat.DUBLIN_UNQUALIFIED.isEqualTo(requestDocument.getFormat())) {
                            new WorkBibDublinUnQualifiedDocBuilder()
                                    .buildSolrInputDocument(requestDocument, solrInputDocuments);
                        }
                        else {
                            throw new Exception(
                                    "Unsupported Document Format : " + requestDocument.getFormat() + " Called.");
                        }
                    }
                    else if (DocType.LICENSE.isEqualTo(requestDocument.getType())) { // License
                        if (DocFormat.ONIXPL.isEqualTo((requestDocument.getFormat()))) { // ONIX-PL
                            new WorkLicenseOnixplDocBuilder()
                                    .buildSolrInputDocument(requestDocument, solrInputDocuments);
                        }
                        else if ((DocFormat.PDF.isEqualTo((requestDocument.getFormat()))) || DocFormat.DOC.isEqualTo(
                                requestDocument.getFormat()) || DocFormat.XSLT.isEqualTo(
                                requestDocument.getFormat())) { // binary license formats: PDF, DOC, XSLT
                            new WorkLicenseBinaryDocBuilder()
                                    .buildSolrInputDocument(requestDocument, solrInputDocuments);
                        }
                        else {
                            throw new Exception(
                                    "Unsupported Document Format : " + requestDocument.getFormat() + " Called.");
                        }
                    }
                    else if (DocType.INSTANCE.isEqualTo(requestDocument.getType())
                             || DocType.HOLDINGS.isEqualTo(requestDocument.getType())
                             || DocType.ITEM.isEqualTo(requestDocument.getType())) {
                        // Instance, holdings and item documents all go through the same OLEML builder.
                        if (DocFormat.OLEML.isEqualTo(requestDocument.getFormat())) {
                            new WorkInstanceOlemlDocBuilder()
                                    .buildSolrInputDocument(requestDocument, solrInputDocuments);
                        }
                        else {
                            throw new Exception(
                                    "Unsupported Document Format : " + requestDocument.getFormat() + " Called.");
                        }
                    }
                    else if (DocType.SOURCEHOLDINGS.isEqualTo(requestDocument.getType())) { // Source holdings
                        if (DocFormat.OLEML.isEqualTo(requestDocument.getFormat())) {
                            // NOTE(review): returns immediately - remaining documents are skipped and the
                            // documents converted so far are not indexed. Kept as in the original.
                            return "success";
                        }
                        else {
                            throw new Exception(
                                    "Unsupported Document Format : " + requestDocument.getFormat() + " Called.");
                        }
                    }
                    else {
                        throw new Exception("Unsupported Document Type : " + requestDocument.getType() + " Called.");
                    }
                }
                else if (DocCategory.SECURITY.isEqualTo(requestDocument.getCategory())) {
                    if (DocType.PATRON.isEqualTo(requestDocument.getType())) {
                        if (DocFormat.OLEML.isEqualTo(requestDocument.getFormat())) {
                            new SecurityPatronOlemlDocBuilder()
                                    .buildSolrInputDocument(requestDocument, solrInputDocuments);
                        }
                        else {
                            throw new Exception(
                                    "Unsupported Document Format : " + requestDocument.getFormat() + " Called.");
                        }
                    }
                    else {
                        throw new Exception("Unsupported Document Type : " + requestDocument.getType() + " Called.");
                    }
                }
                else {
                    throw new Exception(
                            "Unsupported Document Category : " + requestDocument.getCategory() + " Called.");
                }
                assignUUIDs(solrInputDocuments, null);
            }
        }
        catch (Exception e1) {
            // Report the failure instead of overwriting it or indexing a partially converted batch.
            String failure = buildFailureMsg(null, "Indexing failed. " + e1.getMessage());
            LOG.error(failure, e1);
            return failure;
        }
        timer.stop();
        if (solrInputDocuments.isEmpty()) {
            return buildFailureMsg(null, "No valid documents found in input.");
        }
        int numDocs = solrInputDocuments.size();
        LOG.info("Conversion to Solr docs- Num:" + numDocs + ": Time taken:" + timer.toString());
        return indexSolrDocuments(solrInputDocuments, commit);
    }

    public String bulkIndexDocuments(List<RequestDocument> requestDocuments, boolean isCommit) {
        String result = "success";
        Map<String, SolrInputDocument> bibIdToDocMap = new HashMap<String, SolrInputDocument>();
        BatchIngestStatistics batchStatistics = BulkIngestStatistics.getInstance().getCurrentBatch();
        if (requestDocuments != null && requestDocuments.size() > 0) {
            StopWatch timer = new StopWatch();
            StopWatch buildSolrInputDocTimer = new StopWatch();
            StopWatch xmlToPojoTimer = new StopWatch();
            timer.start();
            buildSolrInputDocTimer.start();
            buildSolrInputDocTimer.suspend();
            xmlToPojoTimer.start();
            xmlToPojoTimer.suspend();

            List<SolrInputDocument> solrInputDocuments = new ArrayList<SolrInputDocument>();
            try {
                if (DocCategory.WORK.isEqualTo(requestDocuments.get(0).getCategory())) {
                    if (DocType.BIB.isEqualTo(requestDocuments.get(0).getType())) {
                        if (DocFormat.MARC.isEqualTo(requestDocuments.get(0).getFormat())) {
                            WorkBibMarcDocBuilder marcBuilder = new WorkBibMarcDocBuilder();
                            for (RequestDocument requestDocument : requestDocuments) {
                                marcBuilder.buildSolrInputDocument(requestDocument, solrInputDocuments,
                                                                   buildSolrInputDocTimer, xmlToPojoTimer);
                            }
                        }
                        else if (DocFormat.DUBLIN_CORE.isEqualTo(requestDocuments.get(0).getFormat())) {
                            WorkBibDublinDocBuilder dublinBuilder = new WorkBibDublinDocBuilder();
                            for (RequestDocument requestDocument : requestDocuments) {
                                dublinBuilder.buildSolrInputDocument(requestDocument, solrInputDocuments);
                            }
                        }
                        else if (DocFormat.DUBLIN_UNQUALIFIED.isEqualTo(requestDocuments.get(0).getFormat())) {
                            WorkBibDublinUnQualifiedDocBuilder dublinUnqBuilder
                                    = new WorkBibDublinUnQualifiedDocBuilder();
                            for (RequestDocument requestDocument : requestDocuments) {
                                dublinUnqBuilder.buildSolrInputDocument(requestDocument, solrInputDocuments);
                            }
                        }
                    }
                    else if (DocType.INSTANCE.isEqualTo(requestDocuments.get(0).getType())) {
                        WorkInstanceOlemlDocBuilder oleMlDocBuilder = new WorkInstanceOlemlDocBuilder();
                        for (RequestDocument requestDocument : requestDocuments) {
                            Instance instance = ((InstanceCollection) requestDocument.getContent().getContentObject())
                                    .getInstance().get(0);
                            for (String rId : instance.getResourceIdentifier()) {
                                List<SolrDocument> docs = getSolrDocumentBySolrId(rId);
                                for (SolrDocument solrDoc : docs) {
                                    SolrInputDocument bibSolrIDoc = ClientUtils.toSolrInputDocument(solrDoc);
                                    String bibId = bibSolrIDoc.getFieldValue(WorkBibCommonFields.UNIQUE_ID).toString();
                                    if (bibIdToDocMap.get(bibId) == null) {
                                        bibIdToDocMap.put(bibId, bibSolrIDoc);
                                    }
                                    bibIdToDocMap.get(bibId)
                                                 .addField("instanceIdentifier", instance.getInstanceIdentifier());
                                }
                            }
                            oleMlDocBuilder.buildSolrInputDocuments(requestDocument, solrInputDocuments);
                        }
                    }
                }
                if (DocCategory.SECURITY.isEqualTo(requestDocuments.get(0).getCategory())) {
                    if (DocType.PATRON.isEqualTo(requestDocuments.get(0).getType())) {
                        if (DocFormat.OLEML.isEqualTo(requestDocuments.get(0).getFormat())) {
                            SecurityPatronOlemlDocBuilder patronBuilder = new SecurityPatronOlemlDocBuilder();
                            for (RequestDocument requestDocument : requestDocuments) {
                                patronBuilder.buildSolrInputDocument(requestDocument, solrInputDocuments);
                            }
                        }
                    }
                }
                assignUUIDs(solrInputDocuments, null);
                solrInputDocuments.addAll(bibIdToDocMap.values());
            }
            catch (Exception e1) {
                result = buildFailureMsg(null, "Bulk Indexing failed. " + e1.getMessage());
                LOG.error(result, e1);
                return result;
            }
            timer.stop();
            if (solrInputDocuments.isEmpty()) {
                result = buildFailureMsg(null, "No valid documents found in input.");
                return result;
            }
            int numDocs = solrInputDocuments.size();
            batchStatistics.setTimeToConvertXmlToPojo(xmlToPojoTimer.getTime());
            batchStatistics.setTimeToConvertToSolrInputDocs(buildSolrInputDocTimer.getTime());
            StopWatch indexingTimer = new StopWatch();
            indexingTimer.start();
            try {
                result = indexSolrDocuments(solrInputDocuments, isCommit, false, false, false);
                indexingTimer.stop();
                //                batchStatistics.setTimeToIndexSolrInputDocs(indexingTimer.toString());
            }
            catch (Exception e) {
                result = buildFailureMsg(null, "Indexing failed. " + e.getMessage());
                LOG.error(result, e);
            }
            LOG.debug("Time Consumptions...:\txmlToObj(" + numDocs + "):" + xmlToPojoTimer + "\tbuildSolrInputDoc("
                      + numDocs + "):" + buildSolrInputDocTimer + "\tTotal(" + numDocs + "):" + timer.toString()
                      + "\t indexingTime(" + solrInputDocuments.size() + "):" + indexingTimer.toString());
        }
        return result;
    }

    /**
     * Queries the Solr server obtained from {@link SolrServerManager} for documents whose
     * {@code WorkBibCommonFields.UNIQUE_ID} field matches the given value.
     * <p>
     * The value is placed into the query string as-is (no escaping is applied here).
     *
     * @param uniqueId value to match against the unique-id field.
     * @return the matching documents; an empty list if the query fails or yields no result list.
     *         Failures are logged, not propagated.
     */
    public List<SolrDocument> getSolrDocumentBySolrId(String uniqueId) {
        try {
            String args = "(" + WorkBibCommonFields.UNIQUE_ID + ":" + uniqueId + ")";
            SolrServer solr = SolrServerManager.getInstance().getSolrServer();
            SolrQuery query = new SolrQuery();
            query.setQuery(args);
            QueryResponse response = solr.query(query);
            List<SolrDocument> results = response.getResults();
            if (results != null) {
                return results;
            }
        }
        catch (Exception e) {
            // Previously the failure was logged and then a null response was dereferenced (NPE).
            LOG.error(buildFailureMsg(), e);
        }
        return new ArrayList<SolrDocument>();
    }

    /**
     * Queries the Solr server obtained from {@link SolrServerManager} for documents in which the
     * given field matches the given value.
     * <p>
     * Field name and value are placed into the query string as-is (no escaping is applied here).
     *
     * @param fieldName  name of the Solr field to search.
     * @param fieldValue value to match in that field.
     * @return the matching documents; an empty list if the query fails or yields no result list.
     *         Failures are logged, not propagated.
     */
    public List<SolrDocument> getSolrDocument(String fieldName, String fieldValue) {
        try {
            String args = "(" + fieldName + ":" + fieldValue + ")";
            SolrServer solr = SolrServerManager.getInstance().getSolrServer();
            SolrQuery query = new SolrQuery();
            query.setQuery(args);
            QueryResponse response = solr.query(query);
            List<SolrDocument> results = response.getResults();
            if (results != null) {
                return results;
            }
        }
        catch (Exception e) {
            // Previously the failure was logged and then a null response was dereferenced (NPE).
            LOG.error(buildFailureMsg(), e);
        }
        return new ArrayList<SolrDocument>();
    }

    /**
     * Assigns UUIDs for each document (that does not have an "id" field) in the given list.
     * Also makes sure "uniqueId" field is present. The UUIDs generated by this method start
     * with ID_FIELD_PREFIX for easy identification. Optionally takes a list
     * of UUIDs to be used to set/override the "id" field values of the documents.
     * <p>
     * A {@code null} entry in {@code ids} is treated as "no id supplied" for the document at that position.
     *
     * @param solrDocs documents to process; {@code null} or empty is a no-op.
     * @param ids      List of id values (optional) to be used for the given documents.
     * @throws Exception if {@code ids} is given but has fewer entries than {@code solrDocs}.
     */
    protected void assignUUIDs(List<SolrInputDocument> solrDocs, List<String> ids) throws Exception {
        if ((null == solrDocs) || solrDocs.isEmpty()) {
            return;
        }
        if ((null != ids) && (ids.size() < solrDocs.size())) {
            throw new Exception(
                    "Insufficient UUIDs(" + ids.size() + ") specified for documents(" + solrDocs.size() + ").");
        }
        for (int i = 0; i < solrDocs.size(); i++) {
            SolrInputDocument solrInputDocument = solrDocs.get(i);
            SolrInputField idField = solrInputDocument.getField("id");
            // Supplied UUID for this position, if any.
            String uuid = (null != ids) ? ids.get(i) : null;
            if (null == idField) {
                if (null == uuid) {
                    // Generate UUID; the prefix identifies ids generated by the discovery module.
                    uuid = ID_FIELD_PREFIX + UUID.randomUUID().toString();
                }
                solrInputDocument.addField("id", uuid);
                solrInputDocument.addField("uniqueId", uuid);
            }
            else if (null != uuid) {
                // Use the supplied UUID, overriding whatever the document carried.
                solrInputDocument.setField("id", uuid);
                solrInputDocument.setField("uniqueId", uuid);
            }
            else {
                // Leave the existing id value and make sure uniqueId is set.
                Object existingId = idField.getValue();
                if (existingId instanceof List) {
                    // Multi-valued id: use the first entry; tolerate empty lists and non-String entries.
                    List<?> idValues = (List<?>) existingId;
                    if (!idValues.isEmpty() && (null != idValues.get(0))) {
                        uuid = idValues.get(0).toString();
                    }
                }
                else if (existingId instanceof String) {
                    uuid = (String) existingId;
                }
                if (null == uuid) {
                    // The id field exists but holds no usable value: generate one.
                    uuid = ID_FIELD_PREFIX + UUID.randomUUID().toString();
                    idField.setValue(uuid, 1.0f);
                }
                // setField creates the field when absent and replaces it when present.
                solrInputDocument.setField("uniqueId", uuid);
            }
        }
    }

    /**
     * Issues a commit on the Solr server obtained from {@link SolrServerManager},
     * passing {@code false} for both the waitFlush and waitSearcher arguments.
     *
     * @throws Exception if the server cannot be obtained or the commit fails.
     */
    @Override
    public void commit() throws Exception {
        SolrServer solrServer = SolrServerManager.getInstance().getSolrServer();
        // Arguments: waitFlush = false, waitSearcher = false.
        solrServer.commit(false, false);
    }

    /**
     * Issues a rollback on the Solr server obtained from {@link SolrServerManager}.
     *
     * @throws Exception if the server cannot be obtained or the rollback fails.
     */
    @Override
    public void rollback() throws Exception {
        SolrServerManager.getInstance().getSolrServer().rollback();
    }

    /**
     * Sends the given documents to Solr, optionally committing and optimizing afterwards, and records
     * the indexing and commit timings on the current batch statistics.
     * <p>
     * Lists larger than {@code BATCH_SIZE} are sent in consecutive slices of at most {@code BATCH_SIZE}
     * documents; smaller lists are sent in a single call.
     *
     * @param solrDocs     documents to index; {@code null} or empty returns immediately.
     * @param commit       whether to commit after adding the documents.
     * @param optimize     whether to optimize the index afterwards.
     * @param waitFlush    passed through to the Solr commit/optimize calls.
     * @param waitSearcher passed through to the Solr commit/optimize calls.
     * @return {@code SUCCESS + "-" + <number of documents>} ({@code SUCCESS + "-0"} for no input).
     * @throws Exception if the server cannot be obtained or any Solr call fails.
     */
    protected String indexSolrDocuments(List<SolrInputDocument> solrDocs, boolean commit, boolean optimize,
                                        boolean waitFlush, boolean waitSearcher) throws Exception {
        BulkIngestStatistics bulkLoadStatistics = BulkIngestStatistics.getInstance();
        BatchIngestStatistics batchStatistics = bulkLoadStatistics.getCurrentBatch();
        StopWatch indexSolrDocsTime = new StopWatch();
        StopWatch solrCommitTime = new StopWatch();
        indexSolrDocsTime.start();
        if ((null == solrDocs) || (solrDocs.isEmpty())) {
            return SUCCESS + "-0";
        }
        SolrServer solr = SolrServerManager.getInstance().getSolrServer();
        if (solrDocs.size() > BATCH_SIZE) {
            int numSolrDocs = solrDocs.size();
            for (int fromIndex = 0; fromIndex < numSolrDocs; fromIndex += BATCH_SIZE) {
                int toIndex = Math.min(fromIndex + BATCH_SIZE, numSolrDocs);
                List<SolrInputDocument> batchSolrDocs = solrDocs.subList(fromIndex, toIndex);
                LOG.info("Indexing records. fromIndex=" + fromIndex + ", toIndex=" + toIndex);
                // Send only the current slice; sending the full list here would re-add every
                // document once per batch.
                solr.add(batchSolrDocs);
            }
        }
        else {
            LOG.debug("Indexing records. size=" + solrDocs.size());
            solr.add(solrDocs);
        }
        indexSolrDocsTime.stop();
        solrCommitTime.start();
        if (commit) {
            LOG.info("Bulk ingest: Index commit started. Number of records being committed: " + bulkLoadStatistics
                    .getCommitRecCount());
            solr.commit(waitFlush, waitSearcher);
        }
        // The commit timer is stopped before the optional optimize, so optimize time is not included in it.
        solrCommitTime.stop();
        if (optimize) {
            solr.optimize(waitFlush, waitSearcher);
        }

        LOG.debug("Time Consumptions...: Solr input docs of size ..." + solrDocs.size()
                  + "\t time taken to index solr Input Docs" + indexSolrDocsTime + "solrcommit & Optimize"
                  + solrCommitTime);
        batchStatistics.setTimeToIndexSolrInputDocs(indexSolrDocsTime.getTime());
        batchStatistics.setTimeToSolrCommit(solrCommitTime.getTime());
        return SUCCESS + "-" + solrDocs.size();
    }

    /**
     * Convenience overload that indexes the given documents with both the waitFlush and
     * waitSearcher arguments set to {@code true}.
     *
     * @param solrDocs documents to index.
     * @param commit   whether to commit after adding the documents.
     * @param optimize whether to optimize the index afterwards.
     * @return the status string produced by the five-argument overload.
     * @throws Exception if indexing fails.
     */
    protected String indexSolrDocuments(List<SolrInputDocument> solrDocs, boolean commit, boolean optimize)
            throws Exception {
        final boolean waitFlush = true;
        final boolean waitSearcher = true;
        return indexSolrDocuments(solrDocs, commit, optimize, waitFlush, waitSearcher);
    }

    /**
     * Converts XML document content into Solr input documents, choosing the record processor and
     * document builder from the category/type/format triple.
     * <p>
     * Supported combinations are WORK/BIB with format MARC, DUBLIN_CORE or DUBLIN_UNQUALIFIED.
     *
     * @param docCategory document category.
     * @param docType     document type.
     * @param docFormat   document format.
     * @param docContent  XML content to convert.
     * @return the Solr input documents built from the content.
     * @throws Exception if the combination is not supported or the conversion fails.
     */
    protected List<SolrInputDocument> convertToSolrDocs(String docCategory, String docType, String docFormat,
                                                        String docContent) throws Exception {
        boolean isWorkBib = DocCategory.WORK.isEqualTo(docCategory) && DocType.BIB.isEqualTo(docType);
        List<SolrInputDocument> solrDocs = null;
        if (isWorkBib && DocFormat.MARC.isEqualTo(docFormat)) {
            try {
                WorkBibMarcRecordProcessor recordProcessor = new WorkBibMarcRecordProcessor();
                solrDocs = new WorkBibMarcDocBuilder()
                        .buildSolrInputDocuments(recordProcessor.fromXML(docContent).getRecords());
            }
            catch (Exception e) {
                // Route the diagnostic through the logger instead of printing the stack trace to stderr.
                LOG.error("Exception while converting given XML Document: ", e);
                throw new Exception("Exception while converting given XML Document: ", e);
            }
        }
        else if (isWorkBib && DocFormat.DUBLIN_CORE.isEqualTo(docFormat)) {
            WorkBibDublinRecordProcessor processor = new WorkBibDublinRecordProcessor();
            WorkBibDublinRecord record = processor.fromXML(docContent);
            solrDocs = new ArrayList<SolrInputDocument>();
            solrDocs.add(new WorkBibDublinDocBuilder().buildSolrInputDocument(record));
        }
        else if (isWorkBib && DocFormat.DUBLIN_UNQUALIFIED.isEqualTo(docFormat)) {
            solrDocs = new WorkBibDublinUnQualifiedDocBuilder()
                    .buildSolrInputDocuments(new WorkBibDublinUnQualifiedRecordProcessor().fromXML(docContent));
        }
        else {
            throw new Exception("UnSupported Document Format: " + docCategory + ", " + docType + ", " + docFormat);
        }
        return solrDocs;
    }

    /**
     * Deletes the document with the given id from the Solr server obtained from
     * {@link SolrServerManager}, optionally committing afterwards.
     *
     * @param uuid     id of the document to delete.
     * @param category not used by this method.
     * @param commit   whether to commit after the delete.
     * @return {@code SUCCESS}, or a failure message if any exception occurs (the exception is logged).
     */
    protected String deleteDocumentByUUID(String uuid, String category, boolean commit) {
        try {
            SolrServer solrServer = SolrServerManager.getInstance().getSolrServer();
            solrServer.deleteById(uuid);
            if (commit) {
                solrServer.commit();
            }
            return SUCCESS;
        }
        catch (Exception e) {
            String failure = buildFailureMsg();
            LOG.error(failure, e);
            return failure;
        }
    }

    /**
     * Convenience overload that deletes the document with the given id and commits.
     *
     * @param uuid     id of the document to delete.
     * @param category passed through to the three-argument overload.
     * @return the status string produced by the three-argument overload.
     */
    protected String deleteDocumentByUUID(String uuid, String category) {
        final boolean commitAfterDelete = true;
        return deleteDocumentByUUID(uuid, category, commitAfterDelete);
    }

    /**
     * Deletes the documents with the given ids from the Solr server obtained from
     * {@link SolrServerManager}, skipping {@code null} entries, and optionally commits.
     * The commit is issued (when requested) even if no id was deleted.
     *
     * @param uuidList ids of the documents to delete.
     * @param category not used by this method.
     * @param commit   whether to commit afterwards.
     * @return {@code SUCCESS}, or a failure message if any exception occurs (the exception is logged).
     */
    protected String deleteDocumentsByUUIDList(List<String> uuidList, String category, boolean commit) {
        try {
            SolrServer solrServer = SolrServerManager.getInstance().getSolrServer();
            List<String> idsToDelete = new ArrayList<String>();
            for (String candidate : uuidList) {
                if (null == candidate) {
                    continue;
                }
                idsToDelete.add(candidate);
            }
            if (!idsToDelete.isEmpty()) {
                solrServer.deleteById(idsToDelete);
            }
            if (commit) {
                solrServer.commit();
            }
            return SUCCESS;
        }
        catch (Exception e) {
            String failure = buildFailureMsg();
            LOG.error(failure, e);
            return failure;
        }
    }

    /**
     * Deletes the documents with the given ids and, for every matching document whose doc type is
     * {@code INSTANCE}, also the documents referenced by its holdings and item identifier fields.
     * The delete is committed.
     * <p>
     * Each id is looked up with an {@code id:<uuid>} query; identifier fields may hold a single value
     * or a list of values. Missing ({@code null}) identifier values are ignored.
     *
     * @param uuidsList ids of the documents to delete.
     * @param category  passed through to the three-argument overload.
     * @return the status string produced by the three-argument overload.
     * @throws SolrServerException   if a lookup query fails.
     * @throws MalformedURLException declared for the Solr server lookup.
     */
    protected String deleteDocumentsByUUIDList(List<String> uuidsList, String category)
            throws SolrServerException, MalformedURLException {
        List<String> deleteUuidsList = new ArrayList<String>(uuidsList);
        // Holdings are collected before items for each document.
        String[] linkedIdFields = {HOLDINGS_IDENTIFIER, ITEM_IDENTIFIER};
        SolrServer solr = SolrServerManager.getInstance().getSolrServer();
        SolrQuery query = new SolrQuery();
        for (String uuid : uuidsList) {
            query.setQuery("id:" + uuid);
            QueryResponse response = solr.query(query);
            LOG.debug("query-->" + query);
            for (SolrDocument doc : response.getResults()) {
                LOG.debug("doc" + doc.toString());
                String docType = (String) doc.getFieldValue(DOC_TYPE);
                // Constant-first comparison tolerates documents without a doc type.
                if (!INSTANCE.equalsIgnoreCase(docType)) {
                    continue;
                }
                // Identifiers are read per document: nothing is carried over between documents,
                // and the document's own field lists are never modified.
                for (String linkedIdField : linkedIdFields) {
                    Object value = doc.getFieldValue(linkedIdField);
                    if (value instanceof List) {
                        for (Object linkedId : (List<?>) value) {
                            if (linkedId != null) {
                                deleteUuidsList.add(linkedId.toString());
                            }
                        }
                    }
                    else if (value != null) {
                        deleteUuidsList.add(value.toString());
                    }
                }
            }
        }
        return deleteDocumentsByUUIDList(deleteUuidsList, category, true);
    }

    /**
     * Builds the {@code stream.body} request parameters for a delete: one
     * {@code <query>id:...</query>} element per id inside a single {@code <delete>} element,
     * optionally followed by a second {@code stream.body} parameter carrying {@code <commit/>}.
     *
     * @param uuidList ids to delete.
     * @param commit   whether to append the commit parameter.
     * @return the assembled parameter string.
     */
    protected String buildDeleteQueryParamsForDeleteUrl(List<String> uuidList, boolean commit) {
        StringBuilder params = new StringBuilder("stream.body=<delete>");
        for (String uuid : uuidList) {
            params.append("<query>id:").append(uuid).append("</query>");
        }
        params.append("</delete>");
        return commit ? params.append("&stream.body=<commit/>").toString() : params.toString();
    }

    /**
     * Builds the update URL that deletes the document with the given id: the Solr core URL from
     * {@link SolrServerManager} followed by an {@code /update?stream.body=<delete>...} query,
     * with a {@code <commit/>} stream body appended when requested.
     *
     * @param uuid     id of the document to delete.
     * @param category not used by this method.
     * @param commit   whether to append the commit parameter.
     * @return the assembled URL string.
     */
    protected String buildDeleteQuery(String uuid, String category, boolean commit) {
        StringBuilder url = new StringBuilder();
        url.append(SolrServerManager.getInstance().getSolrCoreURL());
        url.append("/update?stream.body=<delete><query>id:").append(uuid).append("</query></delete>");
        if (commit) {
            url.append("&stream.body=<commit/>");
        }
        return url.toString();
    }

    /**
     * Opens an HTTP connection to the given URL with output enabled, flushes an (empty) output
     * writer, then reads the response line by line, logging each line at debug level.
     * Both streams are closed before returning, whether or not the request succeeds.
     *
     * @param inputURL URL to connect to.
     * @throws Exception if connecting, writing or reading fails.
     */
    protected void openConnection(URL inputURL) throws Exception {
        HttpURLConnection urlConnection = (HttpURLConnection) inputURL.openConnection();
        urlConnection.setDoOutput(true);
        urlConnection.connect();
        OutputStreamWriter streamWriter = null;
        BufferedReader bufferReader = null;
        try {
            streamWriter = new OutputStreamWriter(urlConnection.getOutputStream());
            streamWriter.flush();
            // Get the response from inputURL
            bufferReader = new BufferedReader(new InputStreamReader(urlConnection.getInputStream()));
            String xmlResponse;
            while ((xmlResponse = bufferReader.readLine()) != null) {
                if (LOG.isDebugEnabled()) {
                    LOG.debug("XmlResponse->" + xmlResponse);
                }
            }
        }
        finally {
            // Release the streams; a failure while closing must not mask the original exception.
            if (bufferReader != null) {
                try {
                    bufferReader.close();
                }
                catch (IOException closeError) {
                    LOG.debug("Failed to close response reader: " + closeError.getMessage());
                }
            }
            if (streamWriter != null) {
                try {
                    streamWriter.close();
                }
                catch (IOException closeError) {
                    LOG.debug("Failed to close request writer: " + closeError.getMessage());
                }
            }
        }
    }

     /**
      * Produces an error id from the current time in milliseconds since the epoch.
      *
      * @return the current epoch-millisecond timestamp as a decimal string.
      */
     protected String getErrorID() {
         long nowMillis = System.currentTimeMillis();
         return Long.toString(nowMillis);
     }

     /**
      * Builds a failure message of the form {@code FAILURE-ErrorID:<id>[-ErrorMsg:<msg>]}.
      *
      * @param id  error id to embed; when {@code null}, one is obtained from {@link #getErrorID()}.
      * @param msg error text to embed; when {@code null}, the {@code -ErrorMsg:} part is omitted.
      * @return the assembled failure message.
      */
     protected String buildFailureMsg(String id, String msg) {
         StringBuilder message = new StringBuilder();
         message.append(FAILURE);
         message.append("-ErrorID:");
         message.append((null != id) ? id : getErrorID());
         if (null == msg) {
             return message.toString();
         }
         message.append("-ErrorMsg:");
         message.append(msg);
         return message.toString();
     }

     /**
      * Builds a failure message of the form {@code FAILURE-ErrorID:<id>} using an id
      * obtained from {@link #getErrorID()}.
      *
      * @return the assembled failure message.
      */
     protected String buildFailureMsg() {
         final String errorId = getErrorID();
         return FAILURE + "-ErrorID:" + errorId;
     }

     /**
      * Searches the Solr core at {@code <docSearchURL property> + "bib"} for documents that match the
      * given field value together with the given DocCategory, DocType and DocFormat values.
      * The four clauses are joined with {@code AND}; values are placed into the query as-is.
      *
      * @param docCat     value for the DocCategory clause.
      * @param docType    value for the DocType clause.
      * @param docFormat  value for the DocFormat clause.
      * @param fieldName  name of the field to search.
      * @param fieldValue value to match in that field.
      * @param fieldList  field to add to the query's returned-field list.
      * @return the query response, or {@code null} if any exception occurs (the exception is logged).
      */
     public QueryResponse searchBibRecord(String docCat, String docType, String docFormat, String fieldName,
                                          String fieldValue, String fieldList) {
         try {
             StringBuilder criteria = new StringBuilder();
             criteria.append("(").append(fieldName).append(":").append(fieldValue).append(")");
             criteria.append("AND").append("(DocCategory:").append(docCat).append(")");
             criteria.append("AND").append("(DocType:").append(docType).append(")");
             criteria.append("AND").append("(DocFormat:").append(docFormat).append(")");

             String bibCoreUrl = PropertyUtil.getPropertyUtil().getProperty("docSearchURL") + "bib";
             SolrServer bibServer = new CommonsHttpSolrServer(bibCoreUrl);
             SolrQuery bibQuery = new SolrQuery();
             bibQuery.addField(fieldList);
             bibQuery.setQuery(criteria.toString());
             return bibServer.query(bibQuery);
         }
         catch (Exception e) {
             LOG.error(buildFailureMsg(), e);
             return null;
         }
     }

     /**
      * Deletes every document (query {@code *:*}) from the Solr server obtained from
      * {@link SolrServerManager} and commits the deletion.
      *
      * @throws IOException         if communication with the server fails.
      * @throws SolrServerException if the server cannot be obtained or rejects the request.
      */
     @Override
     public void cleanupDiscoveryData() throws IOException, SolrServerException {
         // Let a failure to obtain the server propagate; swallowing it here only led to a
         // NullPointerException on the next line.
         SolrServer server = SolrServerManager.getInstance().getSolrServer();
         server.deleteByQuery("*:*");
         server.commit();
     }
 }