diff --git a/uce.portal/resources/templates/corpus/corpusInspector.ftl b/uce.portal/resources/templates/corpus/corpusInspector.ftl index 484c6790..c074f490 100644 --- a/uce.portal/resources/templates/corpus/corpusInspector.ftl +++ b/uce.portal/resources/templates/corpus/corpusInspector.ftl @@ -17,6 +17,17 @@ +
+ +
diff --git a/uce.portal/resources/templates/css/document-reader.css b/uce.portal/resources/templates/css/document-reader.css index 1e6c42f5..e8104f16 100644 --- a/uce.portal/resources/templates/css/document-reader.css +++ b/uce.portal/resources/templates/css/document-reader.css @@ -776,7 +776,7 @@ body { outline: none; } -#vp-3, #vp-4, #vp-5, #vp-2, #vp-1 { +#vp-3, #vp-4, #vp-5, #vp-2, #vp-1, #vp-6 { display: flex; align-items: center; justify-content: center; diff --git a/uce.portal/resources/templates/js/documentReader.js b/uce.portal/resources/templates/js/documentReader.js index 8b7dd880..97fc11ba 100644 --- a/uce.portal/resources/templates/js/documentReader.js +++ b/uce.portal/resources/templates/js/documentReader.js @@ -916,6 +916,10 @@ $(document).on('click', '.viz-nav-btn', function () { setTimeout(() => renderSentenceTopicSankey('vp-5'), 500); } + if (target === '#viz-panel-6') { + setTimeout(() => renderTemporalExplorer('vp-6'), 500); + + } }); diff --git a/uce.portal/resources/templates/landing-page.ftl b/uce.portal/resources/templates/landing-page.ftl index 98e75ac8..987da127 100644 --- a/uce.portal/resources/templates/landing-page.ftl +++ b/uce.portal/resources/templates/landing-page.ftl @@ -3,7 +3,8 @@
-
${uceConfig.getMeta().getName()?trim!"-"}
+
${uceConfig.getMeta().getName()?trim!"-"}
@@ -15,8 +16,21 @@
-

${languageResource.get("corpora")}

+
+

${languageResource.get("corpora")}

+ <#if uceConfig.settings.enablePathImport?? && uceConfig.settings.enablePathImport> + + + +
+ +
<#if corpora?size == 0>
@@ -33,7 +47,8 @@ data-id="${corpusVm.getCorpus().getId()}"> ${corpusVm.getCorpus().getName()?trim} -

${corpusVm.getCorpus().getAuthor()}

+

${corpusVm.getCorpus().getAuthor()}

+
+ +<#--Modal for importing files via a path--> + + +<#--Modal for uploading files--> + + + \ No newline at end of file diff --git a/uce.portal/resources/templates/reader/documentReaderView.ftl b/uce.portal/resources/templates/reader/documentReaderView.ftl index 8c18fdf2..58eb198e 100644 --- a/uce.portal/resources/templates/reader/documentReaderView.ftl +++ b/uce.portal/resources/templates/reader/documentReaderView.ftl @@ -315,6 +315,9 @@
+
+
+
@@ -323,6 +326,7 @@ +
diff --git a/uce.portal/resources/templates/wiki/analysisResultFragment.ftl b/uce.portal/resources/templates/wiki/analysisResultFragment.ftl index 7e012f0c..2fce37a3 100644 --- a/uce.portal/resources/templates/wiki/analysisResultFragment.ftl +++ b/uce.portal/resources/templates/wiki/analysisResultFragment.ftl @@ -1,4 +1,23 @@ +<#if analysisId??> +
+ +
+ + <#if DUUI??> <#if DUUI.modelGroups?has_content> <#if DUUI.isTopic> @@ -7,7 +26,10 @@
<#list DUUI.textInformation.topicAVG as model>
-
${model.getModelInfo().getName()}
+
+ ${model.getModelInfo().getName()} + +
<#list model.topics as topic> <#assign opacity = topic.getScore()?string?replace(",", ".")> @@ -16,6 +38,9 @@
+
diff --git a/uce.portal/uce.analysis/src/main/java/org/texttechnologylab/uce/analysis/DUUIPipeline.java b/uce.portal/uce.analysis/src/main/java/org/texttechnologylab/uce/analysis/DUUIPipeline.java index 3cb3d72a..e016d4ae 100644 --- a/uce.portal/uce.analysis/src/main/java/org/texttechnologylab/uce/analysis/DUUIPipeline.java +++ b/uce.portal/uce.analysis/src/main/java/org/texttechnologylab/uce/analysis/DUUIPipeline.java @@ -129,8 +129,8 @@ public JCas getLanguage(String inputText) throws Exception { public JCas getSentences(JCas cas) throws Exception { HashMap spacyUrls = new HashMap<>(); - spacyUrls.put("Spacy", "http://spacy-cohmetrix.service.component.duui.texttechnologylab.org"); -// spacyUrls.put("Spacy", "http://spacy.service.component.duui.texttechnologylab.org"); +// spacyUrls.put("Spacy", "http://spacy-cohmetrix.service.component.duui.texttechnologylab.org"); + spacyUrls.put("Spacy", "http://spacy.service.component.duui.texttechnologylab.org"); spacyUrls.put("Syntok", "http://paragraph-syntok.service.component.duui.texttechnologylab.org/"); DUUIComposer composer = setListComposer(spacyUrls); cas = runPipeline(cas, composer); diff --git a/uce.portal/uce.analysis/src/main/java/org/texttechnologylab/uce/analysis/RunDUUIPipeline.java b/uce.portal/uce.analysis/src/main/java/org/texttechnologylab/uce/analysis/RunDUUIPipeline.java index 02687feb..c34c6f15 100644 --- a/uce.portal/uce.analysis/src/main/java/org/texttechnologylab/uce/analysis/RunDUUIPipeline.java +++ b/uce.portal/uce.analysis/src/main/java/org/texttechnologylab/uce/analysis/RunDUUIPipeline.java @@ -1,6 +1,8 @@ package org.texttechnologylab.uce.analysis; import de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Sentence; +import org.apache.logging.log4j.LogManager; +import org.apache.logging.log4j.Logger; import org.apache.uima.fit.factory.JCasFactory; import org.apache.uima.fit.util.JCasUtil; import org.apache.uima.jcas.JCas; @@ -8,11 +10,41 @@ import org.texttechnologylab.uce.analysis.modules.*; import org.texttechnologylab.uce.analysis.typeClasses.TextClass; + + + +import java.time.Instant; +import java.util.concurrent.ConcurrentHashMap; +import java.util.concurrent.TimeUnit; +import java.io.InputStream; +import java.io.DataOutputStream; +import java.net.HttpURLConnection; +import java.net.URL; +import java.nio.charset.StandardCharsets; + import java.util.*; public class RunDUUIPipeline { + private static final AnalysisCache analysisCache = new AnalysisCache(); + private static final ThreadLocal lastAnalysisIdTL = new ThreadLocal<>(); + private static final Logger logger = LogManager.getLogger(RunDUUIPipeline.class); + private static final ThreadLocal currentUserIdTL = new ThreadLocal<>(); + + + public static AnalysisSession getCachedSession(String analysisId) { + return analysisCache.get(analysisId); + } + public static void setThreadLocalUserId(String userId) { + currentUserIdTL.set(userId); + } + + private static String getCurrentUserId() { + // TODO: replace with your auth/session identity + + return currentUserIdTL.get(); + } public DUUIInformation getModelResources(List modelGroups, String inputText, String claim, String coherenceText, String stanceText, String systemPrompt) throws Exception { ModelResources modelResources = new ModelResources(); @@ -189,10 +221,13 @@ public DUUIInformation getModelResources(List modelGroups, String inputT newCas.setDocumentText(text); cas = newCas; + logger.info("[CAS] Created secondary JCas for special models (fact/coherence/stance/LLM)"); + } // run pipeline DUUIComposer composer = pipeline.setComposer(modelInfosMap); JCas result = pipeline.runPipeline(cas, composer); + logger.info("[CAS] Final result JCas created via pipeline.runPipeline(cas, composer)"); // get results Object[] results = pipeline.getJCasResults(result, modelInfosList, ttlabScorerGroups, cohmetrixScorerGroups); // print results @@ -232,9 +267,29 @@ public DUUIInformation getModelResources(List modelGroups, String inputT if (isCohmetrix) { duuiInformation.setCohMetrixGroups(cohmetrixScorerGroups); } + String analysisId = UUID.randomUUID().toString(); + String userId = getCurrentUserId(); + logger.info("[USER] Running pipeline for User: " + userId); + String title = "Analysis " + Instant.now(); + + byte[] xmiBytes = toXmiBytes(result); + AnalysisSession session = new AnalysisSession( + analysisId, userId, title, /*externalId*/ null, + result, /*xmiBytes*/ xmiBytes + ); + analysisCache.put(session); + lastAnalysisIdTL.set(analysisId); + logger.info("[CACHE] Added analysisId=" + analysisId + " (stored in memory; TTL=45min)"); return duuiInformation; } + public AnalysisResponse getModelResourcesWithHandle(List modelGroups, String inputText, String claim, + String coherenceText, String stanceText, String systemPrompt) throws Exception { + DUUIInformation info = getModelResources(modelGroups, inputText, claim, coherenceText, stanceText, systemPrompt); + String id = lastAnalysisIdTL.get(); + return new AnalysisResponse(id, info); + } + public static void main(String[] args) throws Exception { ModelResources modelResources = new ModelResources(); List modelGroups = modelResources.getGroupedModelObjects(); @@ -256,5 +311,195 @@ public static void main(String[] args) throws Exception { DUUIInformation duuiInformation = new RunDUUIPipeline().getModelResources(modelGroupNames, inputText, claim, coherenceText, stanceText, systemPrompt); } + public static final class AnalysisResponse { + public final String analysisId; + public final DUUIInformation duuiInformation; + + public AnalysisResponse(String analysisId, DUUIInformation duuiInformation) { + this.analysisId = analysisId; + this.duuiInformation = duuiInformation; + } + } + + + //AnalysisSession + public static final class AnalysisSession { + public final String analysisId; + public final String userId; + public final long createdAtMillis; + public final String title; + public final String externalId; + public final JCas jcas; + public final byte[] xmiBytes; + + public AnalysisSession(String analysisId, String userId, String title, String externalId, + JCas jcas, byte[] xmiBytes) { + this.analysisId = analysisId; + this.userId = userId; + this.title = title; + this.externalId = externalId; + this.createdAtMillis = System.currentTimeMillis(); + this.jcas = jcas; + this.xmiBytes = xmiBytes; + } + } + + + // AnalysisCache + public static final class AnalysisCache { + private final Map map = new ConcurrentHashMap<>(); + private final long ttlMillis = 45 * 60 * 1000L; // 45 minutes + + public void put(AnalysisSession s) { map.put(s.analysisId, s); } + + public AnalysisSession get(String id) { // Retrieve a session from the cache + AnalysisSession s = map.get(id); + if (s == null) return null; + + if (System.currentTimeMillis() - s.createdAtMillis > ttlMillis) { // If this session is older than 45 minutes -> expire it + map.remove(id); + return null; + } + return s; + } + +// public void remove(String id) { +// map.remove(id); +// } //Manually remove a session by ID +// +// +// public void cleanupExpired() { // cleanup all expired sessions +// long now = System.currentTimeMillis(); +// for (var entry : map.entrySet()) { +// AnalysisSession s = entry.getValue(); +// if (now - s.createdAtMillis > ttlMillis) { +// map.remove(entry.getKey()); +// logger.info("[CRON] Removed expired session: " + s.analysisId); +// } +// } +// } +// } +// private static final java.util.concurrent.ScheduledExecutorService scheduler = //Cron job for automatic cleanup every 5 minutes +// java.util.concurrent.Executors.newScheduledThreadPool(1); +// +// static { +// scheduler.scheduleAtFixedRate(() -> { +// try { +// analysisCache.cleanupExpired(); +// } catch (Exception e) { +// logger.error("[CACHE] Cache cleanup failed: " + e.getMessage()); +// } +// }, 5, 5, java.util.concurrent.TimeUnit.MINUTES); +// +// scheduler.scheduleAtFixedRate(() -> { +// logger.info("[CACHE] Running cache cleanup task..."); +// analysisCache.cleanupExpired(); // your cleanup method +// }, 1, 5, TimeUnit.MINUTES); +// +// + } + private static byte[] toXmiBytes(org.apache.uima.jcas.JCas jcas) throws Exception { + java.io.ByteArrayOutputStream bos = new java.io.ByteArrayOutputStream(); + org.apache.uima.cas.impl.XmiCasSerializer ser = + new org.apache.uima.cas.impl.XmiCasSerializer(jcas.getTypeSystem()); + org.apache.uima.util.XMLSerializer xmlSer = + new org.apache.uima.util.XMLSerializer(bos, true); + xmlSer.setOutputProperty(javax.xml.transform.OutputKeys.VERSION, "1.1"); + ser.serialize(jcas.getCas(), xmlSer.getContentHandler()); + return bos.toByteArray(); + } + + + // When we send CAS to the importer via HTTP, we want to capture the response. + // This small class acts like a container for the HTTP response details + private static class HttpResult { + final int status; + final String body; + final String locationHeader; + HttpResult(int status, String body, String locationHeader) { + this.status = status; this.body = body; this.locationHeader = locationHeader; + } + } + + + // Send CAS via HTTP + private static HttpResult postMultipart(String urlStr, + Map fields, + String fileField, String filename, + String fileContentType, byte[] fileBytes) throws Exception { + String boundary = "----JAVA-" + UUID.randomUUID(); //Generate a boundary string to separate parts in multipart body + URL url = new URL(urlStr); //Open HTTP connection to the importer endpoint + HttpURLConnection conn = (HttpURLConnection) url.openConnection(); + conn.setDoOutput(true); + conn.setRequestMethod("POST"); + conn.setRequestProperty("Content-Type", "multipart/form-data; boundary=" + boundary); + + try (DataOutputStream out = new DataOutputStream(conn.getOutputStream())) { //Write request body + // text fields + for (var e : fields.entrySet()) { + out.writeBytes("--" + boundary + "\r\n"); + out.writeBytes("Content-Disposition: form-data; name=\"" + e.getKey() + "\"\r\n\r\n"); + out.write(e.getValue().getBytes(StandardCharsets.UTF_8)); + out.writeBytes("\r\n"); + } + // file field + out.writeBytes("--" + boundary + "\r\n"); + out.writeBytes("Content-Disposition: form-data; name=\"" + fileField + "\"; filename=\"" + filename + "\"\r\n"); + out.writeBytes("Content-Type: " + fileContentType + "\r\n\r\n"); + out.write(fileBytes); + out.writeBytes("\r\n"); + out.writeBytes("--" + boundary + "--\r\n"); + out.flush(); + } + + int status = conn.getResponseCode(); //Read the HTTP response from the importer + String location = conn.getHeaderField("Location"); + String body; + + try (InputStream in = (status >= 200 && status < 400) ? conn.getInputStream() : conn.getErrorStream()) { + body = (in != null) ? new String(in.readAllBytes(), StandardCharsets.UTF_8) : ""; + } + conn.disconnect(); + return new HttpResult(status, body, location); + } + + public static HttpResult sendToImporterViaHttp(String importUrl, //Send cached CAS to importer + String analysisId, + long corpusId, + String documentId, + String casView) throws Exception { + AnalysisSession s = getCachedSession(analysisId); + if (s == null) throw new IllegalArgumentException("No cached session for id: " + analysisId); + + byte[] casBytes = toXmiBytes(s.jcas); + + Map fields = new LinkedHashMap<>(); // Form-data fields + fields.put("analysisId", analysisId); + fields.put("corpusId", Long.toString(corpusId)); + if (documentId != null && !documentId.isBlank()) fields.put("documentId", documentId); + if (casView != null && !casView.isBlank()) fields.put("casView", casView); + + + // Send multipart as XMI + String filename = "cas_" + analysisId + ".xmi"; + logger.info("[IMPORT][HTTP] POST " + importUrl + + " corpusId=" + corpusId + " analysisId=" + analysisId + + " documentId=" + documentId + " casView=" + casView + + " file=" + filename + " (" + casBytes.length + " bytes)"); + + HttpResult res = postMultipart( + importUrl, + fields, + "file", + filename, + "application/xml", + casBytes + ); + logger.info("[IMPORT][HTTP] status=" + res.status + + (res.locationHeader != null ? " Location=" + res.locationHeader : "") + + (res.body != null && !res.body.isBlank() ? " body=" + res.body : "")); + return res; + } + } diff --git a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/config/HibernateConf.java b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/config/HibernateConf.java index 03afde97..3469904f 100644 --- a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/config/HibernateConf.java +++ b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/config/HibernateConf.java @@ -11,6 +11,7 @@ import org.texttechnologylab.uce.common.models.corpus.*; import org.texttechnologylab.uce.common.models.corpus.emotion.Emotion; import org.texttechnologylab.uce.common.models.corpus.emotion.Feeling; +import org.texttechnologylab.uce.common.models.corpus.emotion.SentenceEmotion; import org.texttechnologylab.uce.common.models.corpus.links.AnnotationLink; import org.texttechnologylab.uce.common.models.corpus.links.AnnotationToDocumentLink; import org.texttechnologylab.uce.common.models.corpus.links.DocumentLink; @@ -55,6 +56,7 @@ public static SessionFactory buildSessionFactory() { metadataSources.addAnnotatedClass(Sentiment.class); metadataSources.addAnnotatedClass(Emotion.class); metadataSources.addAnnotatedClass(Feeling.class); + metadataSources.addAnnotatedClass(SentenceEmotion.class); metadataSources.addAnnotatedClass(GeoName.class); metadataSources.addAnnotatedClass(Paragraph.class); metadataSources.addAnnotatedClass(Sentence.class); diff --git a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/config/uceConfig/SettingsConfig.java b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/config/uceConfig/SettingsConfig.java index 3d2671f7..1fcfd6d9 100644 --- a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/config/uceConfig/SettingsConfig.java +++ b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/config/uceConfig/SettingsConfig.java @@ -12,4 +12,5 @@ public class SettingsConfig { private EmbeddingsConfig embeddings; private AuthConfig authentication; private MCPConfig mcp = new MCPConfig(); + private boolean enablePathImport = false; } diff --git a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/models/corpus/emotion/Emotion.java b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/models/corpus/emotion/Emotion.java index 45c78768..f649a78f 100644 --- a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/models/corpus/emotion/Emotion.java +++ b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/models/corpus/emotion/Emotion.java @@ -24,6 +24,10 @@ public class Emotion extends UIMAAnnotation implements WikiModel { @JoinColumn(name = "emotion_id") private List feelings; + @OneToMany(mappedBy = "emotion", cascade = CascadeType.ALL, orphanRemoval = true) + private List sentenceEmotions; + + public String generateEmotionMarker() { var tooltip = ""; if (this.feelings != null && !this.feelings.isEmpty()) { diff --git a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/models/corpus/emotion/SentenceEmotion.java b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/models/corpus/emotion/SentenceEmotion.java new file mode 100644 index 00000000..bb579170 --- /dev/null +++ b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/models/corpus/emotion/SentenceEmotion.java @@ -0,0 +1,79 @@ +package org.texttechnologylab.uce.common.models.corpus.emotion; + +import lombok.Getter; +import lombok.Setter; +import org.texttechnologylab.uce.common.models.corpus.Sentence; + +import javax.persistence.*; +import java.io.Serializable; +import java.util.Objects; + +@Getter +@Setter +@Entity +@Table(name = "sentenceemotion") +@IdClass(SentenceEmotion.SentenceEmotionId.class) +public class SentenceEmotion { + + @Id + @ManyToOne(fetch = FetchType.LAZY, optional = false) + @JoinColumn(name = "sentence_id", nullable = false) + private Sentence sentence; + + @Id + @ManyToOne(fetch = FetchType.LAZY, optional = false) + @JoinColumn(name = "emotion_id", nullable = false) + private Emotion emotion; + + @Id + @Column(name = "model", nullable = false, length = 255) + private String model; + + @Id + @Column(name = "feeling", nullable = false, length = 255) + private String feeling; + + @Column(name = "value") + private Double value; + + public SentenceEmotion() {} + + public SentenceEmotion(Sentence sentence, Emotion emotion, String model, String feeling, Double value) { + this.sentence = sentence; + this.emotion = emotion; + this.model = model; + this.feeling = feeling; + this.value = value; + } + + public static class SentenceEmotionId implements Serializable { + private Long sentence; // references Sentence.id + private Long emotion; // references Emotion.id + private String model; + private String feeling; + + public SentenceEmotionId() {} + + public SentenceEmotionId(Long sentence, Long emotion, String model, String feeling) { + this.sentence = sentence; + this.emotion = emotion; + this.model = model; + this.feeling = feeling; + } + + @Override + public boolean equals(Object o) { + if (this == o) return true; + if (!(o instanceof SentenceEmotionId that)) return false; + return Objects.equals(sentence, that.sentence) + && Objects.equals(emotion, that.emotion) + && Objects.equals(model, that.model) + && Objects.equals(feeling, that.feeling); + } + + @Override + public int hashCode() { + return Objects.hash(sentence, emotion, model, feeling); + } + } +} diff --git a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/services/PostgresqlDataInterface_Impl.java b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/services/PostgresqlDataInterface_Impl.java index 170525c0..17dfb943 100644 --- a/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/services/PostgresqlDataInterface_Impl.java +++ b/uce.portal/uce.common/src/main/java/org/texttechnologylab/uce/common/services/PostgresqlDataInterface_Impl.java @@ -2122,7 +2122,10 @@ public List getTopicWordsByDocumentId(long documentId) throws Database public Map getUnifiedTopicToSentenceMap(long documentId) throws DatabaseOperationException { return executeOperationSafely((session) -> { - String sql = "SELECT unifiedtopic_id, sentence_id FROM sentencetopics WHERE document_id = :documentId"; + String sql = "SELECT unifiedtopic_id, sentence_id " + + "FROM sentencetopics " + + "WHERE document_id = :documentId " + + "AND unifiedtopic_id IS NOT NULL"; var query = session.createNativeQuery(sql) .setParameter("documentId", documentId); @@ -2264,4 +2267,74 @@ private String escapeSql(String input) { return input.replace("(", "\\(").replace(")", "\\)").replace(":", "\\:").replace("|", "\\|"); } + /** + * Inserts a sentence-level topic classification into the database. + * This method matches a sentence by its begin and end + * offsets within a given document and inserts a corresponding entry into the sentencetopics table + */ + public int insertSentenceTopicBySpan(long documentId, int begin, int end, String topicLabel, double score) + throws DatabaseOperationException { + + return executeOperationSafely((session) -> { + + String sql = + "INSERT INTO sentencetopics (document_id, sentence_id, topiclabel, thetast) " + + "SELECT :docId, s.id, :label, :score " + + "FROM sentence s " + + "WHERE s.document_id = :docId AND s.beginn = :begin AND s.endd = :end " + + "AND NOT EXISTS ( " + + " SELECT 1 FROM sentencetopics st " + + " WHERE st.sentence_id = s.id AND st.topiclabel = :label " + + ")"; + + var query = session.createNativeQuery(sql); + query.setParameter("docId", documentId); + query.setParameter("begin", begin); + query.setParameter("end", end); + query.setParameter("label", topicLabel); + query.setParameter("score", score); + + return query.executeUpdate(); + }); + } + /** + * Create unifiedtopic rows if missing for sentences that have sentencetopics + * Backfill sentencetopics.unifiedtopic_id + */ + public int ensureUnifiedTopicsForSentenceTopics(long documentId) throws DatabaseOperationException { + return executeOperationSafely(session -> { + + + String insertUnifiedTopics = + "INSERT INTO unifiedtopic (document_id, beginn, endd, coveredtext, islexicalized, page_id) " + + "SELECT DISTINCT s.document_id, s.beginn, s.endd, s.coveredtext, s.islexicalized, s.page_id " + + "FROM sentence s " + + "JOIN sentencetopics st ON st.sentence_id = s.id AND st.document_id = :docId " + + "LEFT JOIN unifiedtopic ut " + + " ON ut.document_id = s.document_id AND ut.beginn = s.beginn AND ut.endd = s.endd " + + "WHERE ut.id IS NULL"; + + session.createNativeQuery(insertUnifiedTopics) + .setParameter("docId", documentId) + .executeUpdate(); + + + String updateSentenceTopics = + "UPDATE sentencetopics st " + + "SET unifiedtopic_id = ut.id " + + "FROM sentence s " + + "JOIN unifiedtopic ut " + + " ON ut.document_id = s.document_id AND ut.beginn = s.beginn AND ut.endd = s.endd " + + "WHERE st.document_id = :docId " + + " AND st.sentence_id = s.id " + + " AND st.unifiedtopic_id IS NULL"; + + int updated = session.createNativeQuery(updateSentenceTopics) + .setParameter("docId", documentId) + .executeUpdate(); + + return updated; + }); + } + } diff --git a/uce.portal/uce.common/src/main/resources/defaultUceConfig.json b/uce.portal/uce.common/src/main/resources/defaultUceConfig.json index 3ccf0a6a..3e5462bc 100644 --- a/uce.portal/uce.common/src/main/resources/defaultUceConfig.json +++ b/uce.portal/uce.common/src/main/resources/defaultUceConfig.json @@ -144,7 +144,7 @@ ] }, "analysis": { - "enableAnalysisEngine": false + "enableAnalysisEngine": true }, "authentication": { "isActivated": false, diff --git a/uce.portal/uce.corpus-importer/logs/uce-corpus-importer-2025-11-27-1.log b/uce.portal/uce.corpus-importer/logs/uce-corpus-importer-2025-11-27-1.log new file mode 100644 index 00000000..e03b5847 --- /dev/null +++ b/uce.portal/uce.corpus-importer/logs/uce-corpus-importer-2025-11-27-1.log @@ -0,0 +1,66 @@ +2025-11-27 20:53:27.127 [main] INFO org.hibernate.Version - HHH000412: Hibernate ORM core version 5.6.15.Final +2025-11-27 20:53:27.228 [main] INFO org.hibernate.spatial.integration.SpatialService - HHH80000001: hibernate-spatial integration enabled : true +2025-11-27 20:53:27.265 [main] INFO org.hibernate.annotations.common.Version - HCANN000001: Hibernate Commons Annotations {5.1.2.Final} +2025-11-27 20:53:27.370 [main] WARN org.hibernate.orm.connections.pooling - HHH10001002: Using Hibernate built-in connection pool (not for production use!) +2025-11-27 20:53:27.370 [main] INFO org.hibernate.orm.connections.pooling - HHH10001005: using driver [null] at URL [jdbc:postgresql://localhost:8002/uce] +2025-11-27 20:53:27.371 [main] INFO org.hibernate.orm.connections.pooling - HHH10001001: Connection properties: {password=****, user=postgres} +2025-11-27 20:53:27.371 [main] INFO org.hibernate.orm.connections.pooling - HHH10001003: Autocommit mode: false +2025-11-27 20:53:27.374 [main] INFO org.hibernate.engine.jdbc.connections.internal.DriverManagerConnectionProviderImpl - HHH000115: Hibernate connection pool size: 20 (min=1) +2025-11-27 20:53:27.532 [main] INFO org.hibernate.dialect.Dialect - HHH000400: Using dialect: org.hibernate.dialect.PostgreSQL10Dialect +2025-11-27 20:53:28.416 [main] INFO org.hibernate.orm.connections.access - HHH10001501: Connection obtained from JdbcConnectionAccess [org.hibernate.engine.jdbc.env.internal.JdbcEnvironmentInitiator$ConnectionProviderJdbcConnectionAccess@1f7557fe] for (non-JTA) DDL execution was not in auto-commit mode; the Connection 'local transaction' will be committed and the Connection will be set into auto-commit mode. +2025-11-27 20:53:29.335 [main] INFO org.texttechnologylab.uce.corpusimporter.App - Executing external database scripts from ../database/ +2025-11-27 20:53:29.337 [main] WARN org.texttechnologylab.uce.corpusimporter.App - Couldn't read the db scripts in the external database scripts folder; path wasn't found or other IO problems. +java.nio.file.NoSuchFileException: ..\database + at java.base/sun.nio.fs.WindowsException.translateToIOException(WindowsException.java:85) ~[?:?] + at java.base/sun.nio.fs.WindowsException.rethrowAsIOException(WindowsException.java:103) ~[?:?] + at java.base/sun.nio.fs.WindowsException.rethrowAsIOException(WindowsException.java:108) ~[?:?] + at java.base/sun.nio.fs.WindowsDirectoryStream.(WindowsDirectoryStream.java:86) ~[?:?] + at java.base/sun.nio.fs.WindowsFileSystemProvider.newDirectoryStream(WindowsFileSystemProvider.java:541) ~[?:?] + at java.base/java.nio.file.Files.newDirectoryStream(Files.java:482) ~[?:?] + at java.base/java.nio.file.Files.list(Files.java:3785) ~[?:?] + at org.texttechnologylab.uce.common.utils.SystemStatus.executeExternalDatabaseScripts(SystemStatus.java:38) ~[classes/:?] + at org.texttechnologylab.uce.corpusimporter.App.lambda$main$0(App.java:44) ~[classes/:?] + at org.texttechnologylab.uce.common.exceptions.ExceptionUtils.tryCatchLog(ExceptionUtils.java:30) [classes/:?] + at org.texttechnologylab.uce.corpusimporter.App.main(App.java:43) [classes/:?] +2025-11-27 20:53:29.341 [main] INFO org.texttechnologylab.uce.corpusimporter.App - Finished with executing external database scripts. +2025-11-27 20:55:05.236 [main] INFO org.hibernate.Version - HHH000412: Hibernate ORM core version 5.6.15.Final +2025-11-27 20:55:05.340 [main] INFO org.hibernate.spatial.integration.SpatialService - HHH80000001: hibernate-spatial integration enabled : true +2025-11-27 20:55:05.373 [main] INFO org.hibernate.annotations.common.Version - HCANN000001: Hibernate Commons Annotations {5.1.2.Final} +2025-11-27 20:55:05.475 [main] WARN org.hibernate.orm.connections.pooling - HHH10001002: Using Hibernate built-in connection pool (not for production use!) +2025-11-27 20:55:05.475 [main] INFO org.hibernate.orm.connections.pooling - HHH10001005: using driver [null] at URL [jdbc:postgresql://localhost:8002/uce] +2025-11-27 20:55:05.475 [main] INFO org.hibernate.orm.connections.pooling - HHH10001001: Connection properties: {password=****, user=postgres} +2025-11-27 20:55:05.475 [main] INFO org.hibernate.orm.connections.pooling - HHH10001003: Autocommit mode: false +2025-11-27 20:55:05.477 [main] INFO org.hibernate.engine.jdbc.connections.internal.DriverManagerConnectionProviderImpl - HHH000115: Hibernate connection pool size: 20 (min=1) +2025-11-27 20:55:05.624 [main] INFO org.hibernate.dialect.Dialect - HHH000400: Using dialect: org.hibernate.dialect.PostgreSQL10Dialect +2025-11-27 20:55:06.528 [main] INFO org.hibernate.orm.connections.access - HHH10001501: Connection obtained from JdbcConnectionAccess [org.hibernate.engine.jdbc.env.internal.JdbcEnvironmentInitiator$ConnectionProviderJdbcConnectionAccess@52963839] for (non-JTA) DDL execution was not in auto-commit mode; the Connection 'local transaction' will be committed and the Connection will be set into auto-commit mode. +2025-11-27 20:55:07.427 [main] INFO org.texttechnologylab.uce.corpusimporter.App - Executing external database scripts from ../database/ +2025-11-27 20:55:07.430 [main] WARN org.texttechnologylab.uce.corpusimporter.App - Couldn't read the db scripts in the external database scripts folder; path wasn't found or other IO problems. +java.nio.file.NoSuchFileException: ..\database + at java.base/sun.nio.fs.WindowsException.translateToIOException(WindowsException.java:85) ~[?:?] + at java.base/sun.nio.fs.WindowsException.rethrowAsIOException(WindowsException.java:103) ~[?:?] + at java.base/sun.nio.fs.WindowsException.rethrowAsIOException(WindowsException.java:108) ~[?:?] + at java.base/sun.nio.fs.WindowsDirectoryStream.(WindowsDirectoryStream.java:86) ~[?:?] + at java.base/sun.nio.fs.WindowsFileSystemProvider.newDirectoryStream(WindowsFileSystemProvider.java:541) ~[?:?] + at java.base/java.nio.file.Files.newDirectoryStream(Files.java:482) ~[?:?] + at java.base/java.nio.file.Files.list(Files.java:3785) ~[?:?] + at org.texttechnologylab.uce.common.utils.SystemStatus.executeExternalDatabaseScripts(SystemStatus.java:38) ~[classes/:?] + at org.texttechnologylab.uce.corpusimporter.App.lambda$main$0(App.java:44) ~[classes/:?] + at org.texttechnologylab.uce.common.exceptions.ExceptionUtils.tryCatchLog(ExceptionUtils.java:30) [classes/:?] + at org.texttechnologylab.uce.corpusimporter.App.main(App.java:43) [classes/:?] +2025-11-27 20:55:07.433 [main] INFO org.texttechnologylab.uce.corpusimporter.App - Finished with executing external database scripts. +2025-11-27 20:55:07.524 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - + _ _ _____ _____ _____ _ +| | | / __ \| ___| |_ _| | | +| | | | / \/| |__ | | _ __ ___ _ __ ___ _ __| |_ +| | | | | | __| | || '_ ` _ \| '_ \ / _ \| '__| __| +| |_| | \__/\| |___ _| || | | | | | |_) | (_) | | | |_ + \___/ \____/\____/ \___/_| |_| |_| .__/ \___/|_| \__| + | | + |_| +2025-11-27 20:55:07.524 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Global Import Id: 07d96ad0-e619-4231-832a-e2202fc86c9d +2025-11-27 20:55:07.525 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Importer Number: 1 +2025-11-27 20:55:07.525 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Used Threads: 1 +2025-11-27 20:55:07.525 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Importing from path: F:\Area51\UCE\corpora\my_first_corpus +2025-11-27 20:55:07.525 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Reading view: null + + diff --git a/uce.portal/uce.corpus-importer/logs/uce-corpus-importer.log b/uce.portal/uce.corpus-importer/logs/uce-corpus-importer.log new file mode 100644 index 00000000..060a6efa --- /dev/null +++ b/uce.portal/uce.corpus-importer/logs/uce-corpus-importer.log @@ -0,0 +1,1650 @@ +2026-01-30 17:38:54.080 [main] INFO org.hibernate.Version - HHH000412: Hibernate ORM core version 5.6.15.Final +2026-01-30 17:38:54.188 [main] INFO org.hibernate.spatial.integration.SpatialService - HHH80000001: hibernate-spatial integration enabled : true +2026-01-30 17:38:54.225 [main] INFO org.hibernate.annotations.common.Version - HCANN000001: Hibernate Commons Annotations {5.1.2.Final} +2026-01-30 17:38:54.329 [main] WARN org.hibernate.orm.connections.pooling - HHH10001002: Using Hibernate built-in connection pool (not for production use!) +2026-01-30 17:38:54.329 [main] INFO org.hibernate.orm.connections.pooling - HHH10001005: using driver [null] at URL [jdbc:postgresql://localhost:8002/uce] +2026-01-30 17:38:54.342 [main] INFO org.hibernate.orm.connections.pooling - HHH10001001: Connection properties: {password=****, user=postgres} +2026-01-30 17:38:54.342 [main] INFO org.hibernate.orm.connections.pooling - HHH10001003: Autocommit mode: false +2026-01-30 17:38:54.345 [main] INFO org.hibernate.engine.jdbc.connections.internal.DriverManagerConnectionProviderImpl - HHH000115: Hibernate connection pool size: 20 (min=1) +2026-01-30 17:38:54.507 [main] INFO org.hibernate.dialect.Dialect - HHH000400: Using dialect: org.hibernate.dialect.PostgreSQL10Dialect +2026-01-30 17:38:55.386 [main] INFO org.hibernate.orm.connections.access - HHH10001501: Connection obtained from JdbcConnectionAccess [org.hibernate.engine.jdbc.env.internal.JdbcEnvironmentInitiator$ConnectionProviderJdbcConnectionAccess@42e4431] for (non-JTA) DDL execution was not in auto-commit mode; the Connection 'local transaction' will be committed and the Connection will be set into auto-commit mode. +2026-01-30 17:38:56.293 [main] INFO org.texttechnologylab.uce.corpusimporter.App - Executing external database scripts from ../database/ +2026-01-30 17:38:56.295 [main] WARN org.texttechnologylab.uce.corpusimporter.App - Couldn't read the db scripts in the external database scripts folder; path wasn't found or other IO problems. +java.nio.file.NoSuchFileException: ..\database + at java.base/sun.nio.fs.WindowsException.translateToIOException(WindowsException.java:85) ~[?:?] + at java.base/sun.nio.fs.WindowsException.rethrowAsIOException(WindowsException.java:103) ~[?:?] + at java.base/sun.nio.fs.WindowsException.rethrowAsIOException(WindowsException.java:108) ~[?:?] + at java.base/sun.nio.fs.WindowsDirectoryStream.(WindowsDirectoryStream.java:86) ~[?:?] + at java.base/sun.nio.fs.WindowsFileSystemProvider.newDirectoryStream(WindowsFileSystemProvider.java:541) ~[?:?] + at java.base/java.nio.file.Files.newDirectoryStream(Files.java:482) ~[?:?] + at java.base/java.nio.file.Files.list(Files.java:3785) ~[?:?] + at org.texttechnologylab.uce.common.utils.SystemStatus.executeExternalDatabaseScripts(SystemStatus.java:38) ~[classes/:?] + at org.texttechnologylab.uce.corpusimporter.App.lambda$main$0(App.java:44) ~[classes/:?] + at org.texttechnologylab.uce.common.exceptions.ExceptionUtils.tryCatchLog(ExceptionUtils.java:30) [classes/:?] + at org.texttechnologylab.uce.corpusimporter.App.main(App.java:43) [classes/:?] +2026-01-30 17:38:56.299 [main] INFO org.texttechnologylab.uce.corpusimporter.App - Finished with executing external database scripts. +2026-01-30 17:38:56.316 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - + _ _ _____ _____ _____ _ +| | | / __ \| ___| |_ _| | | +| | | | / \/| |__ | | _ __ ___ _ __ ___ _ __| |_ +| | | | | | __| | || '_ ` _ \| '_ \ / _ \| '__| __| +| |_| | \__/\| |___ _| || | | | | | |_) | (_) | | | |_ + \___/ \____/\____/ \___/_| |_| |_| .__/ \___/|_| \__| + | | + |_| +2026-01-30 17:38:56.316 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Global Import Id: f3ff8f20-2b53-4dc9-9b09-81964b9a3a8c +2026-01-30 17:38:56.316 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Importer Number: 1 +2026-01-30 17:38:56.316 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Used Threads: 1 +2026-01-30 17:38:56.316 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Importing from path: F:\Area51\UCE\corpora\my_first_corpus +2026-01-30 17:38:56.316 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - ===========> Reading view: null + + +2026-01-30 17:38:56.345 [main] WARN org.hibernate.orm.deprecation - HHH90000022: Hibernate's legacy org.hibernate.Criteria API is deprecated; use the JPA javax.persistence.criteria.CriteriaQuery instead +2026-01-30 17:38:57.584 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:38:57.599 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:38:57.606 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing 23-year-old Ukrainian refugee killed on North Carolina transit system.json +2026-01-30 17:38:57.678 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:38:57.679 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:38:57.680 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:38:57.681 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:38:57.684 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:38:57.710 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:38:57.712 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:38:57.717 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\23-year-old Ukrainian refugee killed on North Carolina transit system.json.xmi.gz.xmi.gz +2026-01-30 17:38:57.717 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:38:57.717 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id 23-year-old Ukrainian refugee killed on North Carolina transit system.json... +2026-01-30 17:38:59.940 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document 23-year-old Ukrainian refugee killed on North Carolina transit system.json.xmi.gz.xmi.gz +2026-01-30 17:38:59.940 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:38:59.946 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\23-year-old Ukrainian refugee killed on North Carolina transit system.json.xmi.gz.xmi.gz +2026-01-30 17:38:59.950 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\23-year-old Ukrainian refugee killed on North Carolina transit system.json.xmi.gz.xmi.gz +2026-01-30 17:39:00.025 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:00.028 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:00.050 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json +2026-01-30 17:39:00.054 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:00.054 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:00.054 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:00.055 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:00.056 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:00.061 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:00.061 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:00.064 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json.xmi.gz.xmi.gz +2026-01-30 17:39:00.064 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:00.064 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json... +2026-01-30 17:39:00.954 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:01.094 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json.xmi.gz.xmi.gz +2026-01-30 17:39:01.094 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:01.098 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json.xmi.gz.xmi.gz +2026-01-30 17:39:01.101 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json.xmi.gz.xmi.gz +2026-01-30 17:39:01.315 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:01.323 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:01.327 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Adams case and other Trump moves threaten to open corruption floodgates, experts say.json +2026-01-30 17:39:01.331 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:01.331 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:01.331 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:01.331 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:01.332 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:01.362 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:01.363 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:01.367 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Adams case and other Trump moves threaten to open corruption floodgates, experts say.json.xmi.gz.xmi.gz +2026-01-30 17:39:01.367 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:01.367 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Adams case and other Trump moves threaten to open corruption floodgates, experts say.json... +2026-01-30 17:39:01.673 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:05.728 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Adams case and other Trump moves threaten to open corruption floodgates, experts say.json.xmi.gz.xmi.gz +2026-01-30 17:39:05.728 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:05.732 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Adams case and other Trump moves threaten to open corruption floodgates, experts say.json.xmi.gz.xmi.gz +2026-01-30 17:39:05.737 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Adams case and other Trump moves threaten to open corruption floodgates, experts say.json.xmi.gz.xmi.gz +2026-01-30 17:39:05.781 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:05.785 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:05.788 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json +2026-01-30 17:39:05.791 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:05.791 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:05.791 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:05.792 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:05.793 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:05.797 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:05.798 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:05.802 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json.xmi.gz.xmi.gz +2026-01-30 17:39:05.802 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:05.802 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json... +2026-01-30 17:39:07.020 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json.xmi.gz.xmi.gz +2026-01-30 17:39:07.020 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:07.024 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json.xmi.gz.xmi.gz +2026-01-30 17:39:07.028 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json.xmi.gz.xmi.gz +2026-01-30 17:39:07.095 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:07.099 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:07.124 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Agency that handles green cards and citizenship to hire armed agents who can make arrests.json +2026-01-30 17:39:07.128 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:07.129 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:07.129 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:07.129 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:07.130 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:07.148 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:07.149 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:07.155 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Agency that handles green cards and citizenship to hire armed agents who can make arrests.json.xmi.gz.xmi.gz +2026-01-30 17:39:07.155 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:07.155 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Agency that handles green cards and citizenship to hire armed agents who can make arrests.json... +2026-01-30 17:39:07.614 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:07.670 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:09.302 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Agency that handles green cards and citizenship to hire armed agents who can make arrests.json.xmi.gz.xmi.gz +2026-01-30 17:39:09.302 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:09.306 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Agency that handles green cards and citizenship to hire armed agents who can make arrests.json.xmi.gz.xmi.gz +2026-01-30 17:39:09.311 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Agency that handles green cards and citizenship to hire armed agents who can make arrests.json.xmi.gz.xmi.gz +2026-01-30 17:39:09.342 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:09.345 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:09.349 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json +2026-01-30 17:39:09.352 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:09.352 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:09.352 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:09.353 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:09.354 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:09.361 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:09.361 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:09.365 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json.xmi.gz.xmi.gz +2026-01-30 17:39:09.365 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:09.366 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json... +2026-01-30 17:39:10.270 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:10.623 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json.xmi.gz.xmi.gz +2026-01-30 17:39:10.624 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:10.628 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json.xmi.gz.xmi.gz +2026-01-30 17:39:10.632 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json.xmi.gz.xmi.gz +2026-01-30 17:39:10.668 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:10.670 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:10.672 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json +2026-01-30 17:39:10.674 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:10.675 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:10.675 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:10.675 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:10.675 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:10.681 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:10.681 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:10.684 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json.xmi.gz.xmi.gz +2026-01-30 17:39:10.684 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:10.684 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json... +2026-01-30 17:39:11.151 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:12.346 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json.xmi.gz.xmi.gz +2026-01-30 17:39:12.346 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:12.348 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json.xmi.gz.xmi.gz +2026-01-30 17:39:12.352 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json.xmi.gz.xmi.gz +2026-01-30 17:39:12.368 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:12.370 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:12.372 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json +2026-01-30 17:39:12.374 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:12.374 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:12.374 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:12.374 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:12.374 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:12.377 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:12.378 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:12.380 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json.xmi.gz.xmi.gz +2026-01-30 17:39:12.380 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:12.381 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json... +2026-01-30 17:39:12.982 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:13.154 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json.xmi.gz.xmi.gz +2026-01-30 17:39:13.155 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:13.156 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json.xmi.gz.xmi.gz +2026-01-30 17:39:13.162 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json.xmi.gz.xmi.gz +2026-01-30 17:39:13.204 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:13.206 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:13.209 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Biden administration has no plans to fine companies if TikTok ban goes into effect.json +2026-01-30 17:39:13.211 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:13.212 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:13.212 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:13.212 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:13.212 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:13.217 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:13.217 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:13.220 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Biden administration has no plans to fine companies if TikTok ban goes into effect.json.xmi.gz.xmi.gz +2026-01-30 17:39:13.221 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:13.221 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Biden administration has no plans to fine companies if TikTok ban goes into effect.json... +2026-01-30 17:39:13.467 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:15.004 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Biden administration has no plans to fine companies if TikTok ban goes into effect.json.xmi.gz.xmi.gz +2026-01-30 17:39:15.004 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:15.006 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Biden administration has no plans to fine companies if TikTok ban goes into effect.json.xmi.gz.xmi.gz +2026-01-30 17:39:15.009 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Biden administration has no plans to fine companies if TikTok ban goes into effect.json.xmi.gz.xmi.gz +2026-01-30 17:39:15.032 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:15.033 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:15.036 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json +2026-01-30 17:39:15.038 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:15.038 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:15.038 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:15.038 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:15.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:15.041 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:15.041 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:15.044 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json.xmi.gz.xmi.gz +2026-01-30 17:39:15.044 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:15.044 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json... +2026-01-30 17:39:15.745 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:16.236 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json.xmi.gz.xmi.gz +2026-01-30 17:39:16.236 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:16.238 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json.xmi.gz.xmi.gz +2026-01-30 17:39:16.241 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json.xmi.gz.xmi.gz +2026-01-30 17:39:16.271 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:16.272 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:16.276 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json +2026-01-30 17:39:16.278 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:16.278 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:16.278 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:16.278 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:16.278 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:16.280 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:16.280 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:16.283 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json.xmi.gz.xmi.gz +2026-01-30 17:39:16.283 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:16.283 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json... +2026-01-30 17:39:16.745 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:17.126 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json.xmi.gz.xmi.gz +2026-01-30 17:39:17.126 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:17.130 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json.xmi.gz.xmi.gz +2026-01-30 17:39:17.132 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json.xmi.gz.xmi.gz +2026-01-30 17:39:17.157 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:17.159 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:17.161 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Civil rights agency sued over handling of trans worker discrimination complaints.json +2026-01-30 17:39:17.163 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:17.163 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:17.163 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:17.163 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:17.163 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:17.165 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:17.166 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:17.168 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Civil rights agency sued over handling of trans worker discrimination complaints.json.xmi.gz.xmi.gz +2026-01-30 17:39:17.168 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:17.168 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Civil rights agency sued over handling of trans worker discrimination complaints.json... +2026-01-30 17:39:17.507 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:18.438 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Civil rights agency sued over handling of trans worker discrimination complaints.json.xmi.gz.xmi.gz +2026-01-30 17:39:18.438 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:18.441 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Civil rights agency sued over handling of trans worker discrimination complaints.json.xmi.gz.xmi.gz +2026-01-30 17:39:18.444 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Civil rights agency sued over handling of trans worker discrimination complaints.json.xmi.gz.xmi.gz +2026-01-30 17:39:18.465 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:18.466 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:18.470 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing DHS has begun performing polygraph tests on employees to find leakers.json +2026-01-30 17:39:18.472 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:18.472 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:18.472 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:18.472 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:18.472 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:18.474 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:18.474 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:18.478 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\DHS has begun performing polygraph tests on employees to find leakers.json.xmi.gz.xmi.gz +2026-01-30 17:39:18.478 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:18.478 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id DHS has begun performing polygraph tests on employees to find leakers.json... +2026-01-30 17:39:19.007 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:19.246 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document DHS has begun performing polygraph tests on employees to find leakers.json.xmi.gz.xmi.gz +2026-01-30 17:39:19.246 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:19.248 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\DHS has begun performing polygraph tests on employees to find leakers.json.xmi.gz.xmi.gz +2026-01-30 17:39:19.251 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\DHS has begun performing polygraph tests on employees to find leakers.json.xmi.gz.xmi.gz +2026-01-30 17:39:19.274 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:19.276 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:19.278 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json +2026-01-30 17:39:19.280 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:19.281 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:19.281 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:19.281 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:19.281 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:19.283 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:19.283 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:19.285 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json.xmi.gz.xmi.gz +2026-01-30 17:39:19.285 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:19.285 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json... +2026-01-30 17:39:19.571 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:20.504 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json.xmi.gz.xmi.gz +2026-01-30 17:39:20.504 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:20.506 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json.xmi.gz.xmi.gz +2026-01-30 17:39:20.509 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json.xmi.gz.xmi.gz +2026-01-30 17:39:20.560 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:20.562 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:20.564 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing How much money you should save for a comfortable retirement.json +2026-01-30 17:39:20.566 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:20.566 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:20.566 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:20.566 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:20.566 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:20.568 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:20.568 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:20.571 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\How much money you should save for a comfortable retirement.json.xmi.gz.xmi.gz +2026-01-30 17:39:20.571 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:20.571 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id How much money you should save for a comfortable retirement.json... +2026-01-30 17:39:20.952 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:23.767 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document How much money you should save for a comfortable retirement.json.xmi.gz.xmi.gz +2026-01-30 17:39:23.767 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:23.771 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\How much money you should save for a comfortable retirement.json.xmi.gz.xmi.gz +2026-01-30 17:39:23.774 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\How much money you should save for a comfortable retirement.json.xmi.gz.xmi.gz +2026-01-30 17:39:23.796 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:23.797 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:23.800 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json +2026-01-30 17:39:23.802 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:23.802 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:23.802 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:23.802 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:23.802 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:23.804 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:23.804 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:23.807 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json.xmi.gz.xmi.gz +2026-01-30 17:39:23.807 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:23.807 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json... +2026-01-30 17:39:24.940 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:24.953 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json.xmi.gz.xmi.gz +2026-01-30 17:39:24.954 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:24.956 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json.xmi.gz.xmi.gz +2026-01-30 17:39:24.959 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json.xmi.gz.xmi.gz +2026-01-30 17:39:24.989 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:24.991 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:24.993 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Lakers star Luka Dončić says he took a month off from basketball to transform his body.json +2026-01-30 17:39:24.995 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:24.996 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:24.996 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:24.996 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:24.996 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:24.998 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:24.998 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:25.001 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Lakers star Luka Dončić says he took a month off from basketball to transform his body.json.xmi.gz.xmi.gz +2026-01-30 17:39:25.001 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:25.001 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Lakers star Luka Dončić says he took a month off from basketball to transform his body.json... +2026-01-30 17:39:25.347 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:26.238 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Lakers star Luka Dončić says he took a month off from basketball to transform his body.json.xmi.gz.xmi.gz +2026-01-30 17:39:26.238 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:26.241 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Lakers star Luka Dončić says he took a month off from basketball to transform his body.json.xmi.gz.xmi.gz +2026-01-30 17:39:26.243 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Lakers star Luka Dončić says he took a month off from basketball to transform his body.json.xmi.gz.xmi.gz +2026-01-30 17:39:26.251 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:26.252 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:26.255 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Musk's brain implant company filed as a 'disadvantaged business'.json +2026-01-30 17:39:26.256 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:26.256 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:26.256 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:26.257 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:26.257 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:26.258 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:26.258 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:26.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Musk's brain implant company filed as a 'disadvantaged business'.json.xmi.gz.xmi.gz +2026-01-30 17:39:26.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:26.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Musk's brain implant company filed as a 'disadvantaged business'.json... +2026-01-30 17:39:26.817 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:27.492 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Musk's brain implant company filed as a 'disadvantaged business'.json.xmi.gz.xmi.gz +2026-01-30 17:39:27.492 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:27.495 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Musk's brain implant company filed as a 'disadvantaged business'.json.xmi.gz.xmi.gz +2026-01-30 17:39:27.497 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Musk's brain implant company filed as a 'disadvantaged business'.json.xmi.gz.xmi.gz +2026-01-30 17:39:27.522 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:27.524 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:27.527 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json +2026-01-30 17:39:27.529 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:27.529 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:27.529 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:27.529 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:27.529 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:27.531 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:27.531 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:27.533 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json.xmi.gz.xmi.gz +2026-01-30 17:39:27.534 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:27.534 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json... +2026-01-30 17:39:28.206 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:29.243 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json.xmi.gz.xmi.gz +2026-01-30 17:39:29.243 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:29.246 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json.xmi.gz.xmi.gz +2026-01-30 17:39:29.249 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json.xmi.gz.xmi.gz +2026-01-30 17:39:29.257 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:29.257 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:29.260 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing New York Jets to sign QB Justin Fields, according to reports.json +2026-01-30 17:39:29.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:29.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:29.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:29.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:29.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:29.262 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:29.263 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:29.265 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\New York Jets to sign QB Justin Fields, according to reports.json.xmi.gz.xmi.gz +2026-01-30 17:39:29.265 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:29.265 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id New York Jets to sign QB Justin Fields, according to reports.json... +2026-01-30 17:39:29.789 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:29.825 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document New York Jets to sign QB Justin Fields, according to reports.json.xmi.gz.xmi.gz +2026-01-30 17:39:29.826 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:29.829 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\New York Jets to sign QB Justin Fields, according to reports.json.xmi.gz.xmi.gz +2026-01-30 17:39:29.832 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\New York Jets to sign QB Justin Fields, according to reports.json.xmi.gz.xmi.gz +2026-01-30 17:39:29.848 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:29.849 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:29.852 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json +2026-01-30 17:39:29.853 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:29.853 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:29.853 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:29.854 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:29.854 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:29.855 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:29.855 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:29.858 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json.xmi.gz.xmi.gz +2026-01-30 17:39:29.858 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:29.858 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json... +2026-01-30 17:39:30.039 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:30.867 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json.xmi.gz.xmi.gz +2026-01-30 17:39:30.867 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:30.869 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json.xmi.gz.xmi.gz +2026-01-30 17:39:30.872 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json.xmi.gz.xmi.gz +2026-01-30 17:39:30.892 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:30.893 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:30.895 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json +2026-01-30 17:39:30.897 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:30.897 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:30.897 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:30.897 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:30.897 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:30.899 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:30.899 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:30.901 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json.xmi.gz.xmi.gz +2026-01-30 17:39:30.901 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:30.901 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json... +2026-01-30 17:39:31.310 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:31.988 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json.xmi.gz.xmi.gz +2026-01-30 17:39:31.988 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:31.990 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json.xmi.gz.xmi.gz +2026-01-30 17:39:31.992 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json.xmi.gz.xmi.gz +2026-01-30 17:39:32.022 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:32.023 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:32.026 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Sen. Michael Bennet will run for governor of Colorado in 2026.json +2026-01-30 17:39:32.028 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:32.028 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:32.028 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:32.028 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:32.028 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:32.029 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:32.029 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:32.032 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Sen. Michael Bennet will run for governor of Colorado in 2026.json.xmi.gz.xmi.gz +2026-01-30 17:39:32.032 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:32.032 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Sen. Michael Bennet will run for governor of Colorado in 2026.json... +2026-01-30 17:39:32.455 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:33.698 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Sen. Michael Bennet will run for governor of Colorado in 2026.json.xmi.gz.xmi.gz +2026-01-30 17:39:33.698 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:33.700 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Sen. Michael Bennet will run for governor of Colorado in 2026.json.xmi.gz.xmi.gz +2026-01-30 17:39:33.703 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Sen. Michael Bennet will run for governor of Colorado in 2026.json.xmi.gz.xmi.gz +2026-01-30 17:39:33.755 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:33.757 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:33.760 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json +2026-01-30 17:39:33.762 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:33.762 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:33.762 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:33.762 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:33.763 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:33.765 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:33.766 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:33.769 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json.xmi.gz.xmi.gz +2026-01-30 17:39:33.769 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:33.769 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json... +2026-01-30 17:39:34.440 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:36.454 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json.xmi.gz.xmi.gz +2026-01-30 17:39:36.454 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:36.457 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json.xmi.gz.xmi.gz +2026-01-30 17:39:36.460 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json.xmi.gz.xmi.gz +2026-01-30 17:39:36.525 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:36.527 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:36.530 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Target says its holiday sales were better than expected — but its profits weren't.json +2026-01-30 17:39:36.532 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:36.532 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:36.532 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:36.532 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:36.533 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:36.535 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:36.535 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:36.538 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Target says its holiday sales were better than expected — but its profits weren't.json.xmi.gz.xmi.gz +2026-01-30 17:39:36.538 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:36.538 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Target says its holiday sales were better than expected — but its profits weren't.json... +2026-01-30 17:39:37.556 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:39.092 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Target says its holiday sales were better than expected — but its profits weren't.json.xmi.gz.xmi.gz +2026-01-30 17:39:39.093 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:39.095 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Target says its holiday sales were better than expected — but its profits weren't.json.xmi.gz.xmi.gz +2026-01-30 17:39:39.098 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Target says its holiday sales were better than expected — but its profits weren't.json.xmi.gz.xmi.gz +2026-01-30 17:39:39.155 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:39.157 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:39.159 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing The 14 best toothpastes for clean, healthy teeth in 2025.json +2026-01-30 17:39:39.162 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:39.162 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:39.162 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:39.162 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:39.162 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:39.164 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:39.164 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:39.166 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\The 14 best toothpastes for clean, healthy teeth in 2025.json.xmi.gz.xmi.gz +2026-01-30 17:39:39.166 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:39.166 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id The 14 best toothpastes for clean, healthy teeth in 2025.json... +2026-01-30 17:39:40.127 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:41.418 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document The 14 best toothpastes for clean, healthy teeth in 2025.json.xmi.gz.xmi.gz +2026-01-30 17:39:41.418 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:41.420 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\The 14 best toothpastes for clean, healthy teeth in 2025.json.xmi.gz.xmi.gz +2026-01-30 17:39:41.423 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\The 14 best toothpastes for clean, healthy teeth in 2025.json.xmi.gz.xmi.gz +2026-01-30 17:39:41.528 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:41.532 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:41.534 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing The 50+ best white t-shirts tested and ranked, according to NBC Select editors.json +2026-01-30 17:39:41.536 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:41.536 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:41.536 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:41.536 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:41.537 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:41.540 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:41.541 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:41.544 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\The 50 best white t-shirts tested and ranked, according to NBC Select editors.json.xmi.gz.xmi.gz +2026-01-30 17:39:41.544 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:41.544 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id The 50+ best white t-shirts tested and ranked, according to NBC Select editors.json... +2026-01-30 17:39:42.345 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:46.996 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document The 50 best white t-shirts tested and ranked, according to NBC Select editors.json.xmi.gz.xmi.gz +2026-01-30 17:39:46.996 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:46.999 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\The 50 best white t-shirts tested and ranked, according to NBC Select editors.json.xmi.gz.xmi.gz +2026-01-30 17:39:47.002 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\The 50 best white t-shirts tested and ranked, according to NBC Select editors.json.xmi.gz.xmi.gz +2026-01-30 17:39:47.034 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:47.035 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:47.037 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing These three LGBTQ women just made congressional 'herstory'.json +2026-01-30 17:39:47.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:47.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:47.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:47.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:47.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:47.041 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:47.041 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:47.044 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\These three LGBTQ women just made congressional 'herstory'.json.xmi.gz.xmi.gz +2026-01-30 17:39:47.044 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:47.044 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id These three LGBTQ women just made congressional 'herstory'.json... +2026-01-30 17:39:48.227 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document These three LGBTQ women just made congressional 'herstory'.json.xmi.gz.xmi.gz +2026-01-30 17:39:48.227 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:48.229 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\These three LGBTQ women just made congressional 'herstory'.json.xmi.gz.xmi.gz +2026-01-30 17:39:48.232 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\These three LGBTQ women just made congressional 'herstory'.json.xmi.gz.xmi.gz +2026-01-30 17:39:48.248 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:48.248 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:48.254 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Thousands of U.S. seniors deal with the harsh realities of homelessness.json +2026-01-30 17:39:48.255 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:48.256 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:48.256 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:48.256 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:48.256 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:48.258 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:48.258 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:48.260 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Thousands of U.S. seniors deal with the harsh realities of homelessness.json.xmi.gz.xmi.gz +2026-01-30 17:39:48.261 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:48.261 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Thousands of U.S. seniors deal with the harsh realities of homelessness.json... +2026-01-30 17:39:48.748 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:49.048 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Thousands of U.S. seniors deal with the harsh realities of homelessness.json.xmi.gz.xmi.gz +2026-01-30 17:39:49.048 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:49.050 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Thousands of U.S. seniors deal with the harsh realities of homelessness.json.xmi.gz.xmi.gz +2026-01-30 17:39:49.052 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Thousands of U.S. seniors deal with the harsh realities of homelessness.json.xmi.gz.xmi.gz +2026-01-30 17:39:49.100 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:49.102 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:49.104 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json +2026-01-30 17:39:49.105 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:49.106 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:49.106 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:49.106 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:49.106 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:49.108 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:49.108 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:49.110 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json.xmi.gz.xmi.gz +2026-01-30 17:39:49.110 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:49.110 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json... +2026-01-30 17:39:49.195 [ForkJoinPool.commonPool-worker-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:49.358 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:51.251 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json.xmi.gz.xmi.gz +2026-01-30 17:39:51.251 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:51.255 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json.xmi.gz.xmi.gz +2026-01-30 17:39:51.257 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json.xmi.gz.xmi.gz +2026-01-30 17:39:51.328 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:51.329 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:51.331 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump wants automakers to move vehicle production to the U.S. It's not that simple..json +2026-01-30 17:39:51.333 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:51.333 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:51.334 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:51.334 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:51.334 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:51.336 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:51.337 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:51.339 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump wants automakers to move vehicle production to the U.S. It's not that simple..json.xmi.gz.xmi.gz +2026-01-30 17:39:51.339 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:51.339 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Trump wants automakers to move vehicle production to the U.S. It's not that simple..json... +2026-01-30 17:39:52.155 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:54.184 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Trump wants automakers to move vehicle production to the U.S. It's not that simple..json.xmi.gz.xmi.gz +2026-01-30 17:39:54.184 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:54.186 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump wants automakers to move vehicle production to the U.S. It's not that simple..json.xmi.gz.xmi.gz +2026-01-30 17:39:54.190 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump wants automakers to move vehicle production to the U.S. It's not that simple..json.xmi.gz.xmi.gz +2026-01-30 17:39:54.229 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:54.230 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:54.233 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json +2026-01-30 17:39:54.235 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:54.235 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:54.235 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:54.236 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:54.236 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:54.237 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:54.237 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:54.239 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json.xmi.gz.xmi.gz +2026-01-30 17:39:54.239 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:54.239 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json... +2026-01-30 17:39:55.349 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:55.742 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json.xmi.gz.xmi.gz +2026-01-30 17:39:55.742 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:55.745 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json.xmi.gz.xmi.gz +2026-01-30 17:39:55.748 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json.xmi.gz.xmi.gz +2026-01-30 17:39:55.774 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:55.775 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:55.777 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json +2026-01-30 17:39:55.779 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:55.779 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:55.779 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:55.779 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:55.779 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:55.780 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:55.780 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:55.782 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json.xmi.gz.xmi.gz +2026-01-30 17:39:55.782 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:55.782 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json... +2026-01-30 17:39:56.331 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:57.112 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json.xmi.gz.xmi.gz +2026-01-30 17:39:57.112 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:57.114 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json.xmi.gz.xmi.gz +2026-01-30 17:39:57.117 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json.xmi.gz.xmi.gz +2026-01-30 17:39:57.130 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:57.130 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:57.132 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json +2026-01-30 17:39:57.134 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:57.134 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:57.134 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:57.134 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:57.134 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:57.135 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:57.135 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:57.137 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json.xmi.gz.xmi.gz +2026-01-30 17:39:57.137 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:57.137 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json... +2026-01-30 17:39:57.664 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:57.833 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json.xmi.gz.xmi.gz +2026-01-30 17:39:57.833 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:57.835 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json.xmi.gz.xmi.gz +2026-01-30 17:39:57.837 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json.xmi.gz.xmi.gz +2026-01-30 17:39:57.871 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:57.872 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:57.875 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json +2026-01-30 17:39:57.877 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:57.877 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:57.878 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:57.878 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:57.878 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:57.879 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:57.880 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:57.882 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json.xmi.gz.xmi.gz +2026-01-30 17:39:57.883 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:57.883 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json... +2026-01-30 17:39:58.114 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:39:59.606 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json.xmi.gz.xmi.gz +2026-01-30 17:39:59.606 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:39:59.608 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json.xmi.gz.xmi.gz +2026-01-30 17:39:59.610 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json.xmi.gz.xmi.gz +2026-01-30 17:39:59.630 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:39:59.631 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:39:59.634 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Waymo's robotaxis to start carrying passengers in Atlanta.json +2026-01-30 17:39:59.635 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:39:59.635 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:39:59.636 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:39:59.636 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:39:59.636 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:39:59.637 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:39:59.637 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:39:59.638 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Waymo's robotaxis to start carrying passengers in Atlanta.json.xmi.gz.xmi.gz +2026-01-30 17:39:59.638 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:39:59.638 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id Waymo's robotaxis to start carrying passengers in Atlanta.json... +2026-01-30 17:40:00.332 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:40:00.675 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document Waymo's robotaxis to start carrying passengers in Atlanta.json.xmi.gz.xmi.gz +2026-01-30 17:40:00.675 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:40:00.678 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Waymo's robotaxis to start carrying passengers in Atlanta.json.xmi.gz.xmi.gz +2026-01-30 17:40:00.680 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\Waymo's robotaxis to start carrying passengers in Atlanta.json.xmi.gz.xmi.gz +2026-01-30 17:40:00.719 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:00.721 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:00.723 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing ‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json +2026-01-30 17:40:00.724 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting full text done. +2026-01-30 17:40:00.724 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - No DocumentAnnotation found. Skipping this annotation then. +2026-01-30 17:40:00.724 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting sentences done. +2026-01-30 17:40:00.724 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Named-Entities done. +2026-01-30 17:40:00.724 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Emotions done. +2026-01-30 17:40:00.726 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Lemmas done. +2026-01-30 17:40:00.726 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting synthetic pages done. +2026-01-30 17:40:00.729 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully extracted all annotations from F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json.xmi.gz.xmi.gz +2026-01-30 17:40:00.729 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:00.729 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Trying to store document with document id ‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json... +2026-01-30 17:40:01.094 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:40:02.532 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Stored document ‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json.xmi.gz.xmi.gz +2026-01-30 17:40:02.532 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with the UIMA annotations - postprocessing the doc now. +2026-01-30 17:40:02.534 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json.xmi.gz.xmi.gz +2026-01-30 17:40:02.537 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Successfully post processed document F:\Area51\UCE\corpora\my_first_corpus\input\emotion\bert-emotion\‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json.xmi.gz.xmi.gz +2026-01-30 17:40:02.570 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:02.570 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:02.572 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing 23-year-old Ukrainian refugee killed on North Carolina transit system.json +2026-01-30 17:40:02.576 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id 23-year-old Ukrainian refugee killed on North Carolina transit system.json already exists in the corpus 8. +2026-01-30 17:40:02.576 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:02.615 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:02.615 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:02.615 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:02.637 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:02.637 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:02.641 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json +2026-01-30 17:40:02.643 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json already exists in the corpus 8. +2026-01-30 17:40:02.643 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:02.657 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:02.657 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:02.657 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:02.754 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:02.758 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:02.762 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Adams case and other Trump moves threaten to open corruption floodgates, experts say.json +2026-01-30 17:40:02.764 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Adams case and other Trump moves threaten to open corruption floodgates, experts say.json already exists in the corpus 8. +2026-01-30 17:40:02.764 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:02.783 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:02.783 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:02.783 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:02.812 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:02.813 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:02.817 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json +2026-01-30 17:40:02.819 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json already exists in the corpus 8. +2026-01-30 17:40:02.819 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:02.837 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:02.837 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:02.837 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:02.878 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:02.879 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:02.882 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Agency that handles green cards and citizenship to hire armed agents who can make arrests.json +2026-01-30 17:40:02.884 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Agency that handles green cards and citizenship to hire armed agents who can make arrests.json already exists in the corpus 8. +2026-01-30 17:40:02.884 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:02.899 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:02.899 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:02.899 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:02.927 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:02.928 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:02.930 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json +2026-01-30 17:40:02.931 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json already exists in the corpus 8. +2026-01-30 17:40:02.931 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:02.942 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:02.942 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:02.942 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:02.976 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:02.976 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:02.980 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json +2026-01-30 17:40:02.982 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json already exists in the corpus 8. +2026-01-30 17:40:02.982 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:02.996 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:02.996 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:02.996 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.018 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.019 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.022 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json +2026-01-30 17:40:03.024 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json already exists in the corpus 8. +2026-01-30 17:40:03.024 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.039 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.085 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.086 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.088 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Biden administration has no plans to fine companies if TikTok ban goes into effect.json +2026-01-30 17:40:03.089 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Biden administration has no plans to fine companies if TikTok ban goes into effect.json already exists in the corpus 8. +2026-01-30 17:40:03.089 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.100 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.101 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.101 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.130 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.131 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.133 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json +2026-01-30 17:40:03.134 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json already exists in the corpus 8. +2026-01-30 17:40:03.135 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.147 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.147 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.147 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.170 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.170 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.172 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json +2026-01-30 17:40:03.174 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json already exists in the corpus 8. +2026-01-30 17:40:03.174 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.186 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.186 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.186 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.228 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.231 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.233 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Civil rights agency sued over handling of trans worker discrimination complaints.json +2026-01-30 17:40:03.235 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Civil rights agency sued over handling of trans worker discrimination complaints.json already exists in the corpus 8. +2026-01-30 17:40:03.235 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.249 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.249 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.249 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.269 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.269 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.272 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing DHS has begun performing polygraph tests on employees to find leakers.json +2026-01-30 17:40:03.274 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id DHS has begun performing polygraph tests on employees to find leakers.json already exists in the corpus 8. +2026-01-30 17:40:03.274 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.286 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.286 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.286 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.314 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.315 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.317 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json +2026-01-30 17:40:03.319 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json already exists in the corpus 8. +2026-01-30 17:40:03.319 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.330 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.330 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.330 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.375 [ForkJoinPool.commonPool-worker-2] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with import. +2026-01-30 17:40:03.386 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.387 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.390 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing How much money you should save for a comfortable retirement.json +2026-01-30 17:40:03.393 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id How much money you should save for a comfortable retirement.json already exists in the corpus 8. +2026-01-30 17:40:03.394 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.410 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.410 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.410 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.448 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.449 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.453 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json +2026-01-30 17:40:03.456 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json already exists in the corpus 8. +2026-01-30 17:40:03.456 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.472 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.472 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.472 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.498 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.499 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.501 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Lakers star Luka Dončić says he took a month off from basketball to transform his body.json +2026-01-30 17:40:03.503 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Lakers star Luka Dončić says he took a month off from basketball to transform his body.json already exists in the corpus 8. +2026-01-30 17:40:03.503 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.513 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.513 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.513 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.536 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.537 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.540 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Musk's brain implant company filed as a 'disadvantaged business'.json +2026-01-30 17:40:03.541 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Musk's brain implant company filed as a 'disadvantaged business'.json already exists in the corpus 8. +2026-01-30 17:40:03.541 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.549 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.549 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.549 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.576 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.577 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.580 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json +2026-01-30 17:40:03.582 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json already exists in the corpus 8. +2026-01-30 17:40:03.582 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.589 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.589 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.589 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.605 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.606 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.609 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing New York Jets to sign QB Justin Fields, according to reports.json +2026-01-30 17:40:03.611 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id New York Jets to sign QB Justin Fields, according to reports.json already exists in the corpus 8. +2026-01-30 17:40:03.611 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.621 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.622 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.622 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.645 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.646 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.650 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json +2026-01-30 17:40:03.652 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json already exists in the corpus 8. +2026-01-30 17:40:03.652 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.662 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.662 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.662 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.690 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.691 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.694 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json +2026-01-30 17:40:03.697 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json already exists in the corpus 8. +2026-01-30 17:40:03.697 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.705 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.705 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.705 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.739 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.740 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.744 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Sen. Michael Bennet will run for governor of Colorado in 2026.json +2026-01-30 17:40:03.745 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Sen. Michael Bennet will run for governor of Colorado in 2026.json already exists in the corpus 8. +2026-01-30 17:40:03.745 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.753 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.753 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.753 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.804 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.805 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.808 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json +2026-01-30 17:40:03.810 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json already exists in the corpus 8. +2026-01-30 17:40:03.810 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.820 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.821 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.821 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.885 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.887 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.890 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Target says its holiday sales were better than expected — but its profits weren't.json +2026-01-30 17:40:03.892 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Target says its holiday sales were better than expected — but its profits weren't.json already exists in the corpus 8. +2026-01-30 17:40:03.892 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.903 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.903 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.903 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:03.952 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:03.953 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:03.956 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing The 14 best toothpastes for clean, healthy teeth in 2025.json +2026-01-30 17:40:03.957 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id The 14 best toothpastes for clean, healthy teeth in 2025.json already exists in the corpus 8. +2026-01-30 17:40:03.957 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:03.965 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:03.965 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:03.965 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.080 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.083 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.087 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing The 50+ best white t-shirts tested and ranked, according to NBC Select editors.json +2026-01-30 17:40:04.090 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id The 50+ best white t-shirts tested and ranked, according to NBC Select editors.json already exists in the corpus 8. +2026-01-30 17:40:04.090 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.101 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.101 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.101 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.129 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.130 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.132 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing These three LGBTQ women just made congressional 'herstory'.json +2026-01-30 17:40:04.135 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id These three LGBTQ women just made congressional 'herstory'.json already exists in the corpus 8. +2026-01-30 17:40:04.135 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.142 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.142 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.143 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.160 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.161 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.164 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Thousands of U.S. seniors deal with the harsh realities of homelessness.json +2026-01-30 17:40:04.165 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Thousands of U.S. seniors deal with the harsh realities of homelessness.json already exists in the corpus 8. +2026-01-30 17:40:04.165 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.173 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.173 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.173 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.225 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.226 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.229 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json +2026-01-30 17:40:04.230 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json already exists in the corpus 8. +2026-01-30 17:40:04.230 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.238 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.238 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.238 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.302 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.304 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.309 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump wants automakers to move vehicle production to the U.S. It's not that simple..json +2026-01-30 17:40:04.310 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Trump wants automakers to move vehicle production to the U.S. It's not that simple..json already exists in the corpus 8. +2026-01-30 17:40:04.310 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.322 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.322 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.322 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.366 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.367 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.370 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json +2026-01-30 17:40:04.372 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json already exists in the corpus 8. +2026-01-30 17:40:04.372 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.382 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.382 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.382 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.413 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.413 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.416 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json +2026-01-30 17:40:04.417 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json already exists in the corpus 8. +2026-01-30 17:40:04.417 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.424 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.424 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.424 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.442 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.442 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.445 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json +2026-01-30 17:40:04.447 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json already exists in the corpus 8. +2026-01-30 17:40:04.447 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.455 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.455 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.455 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.492 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.493 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.497 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json +2026-01-30 17:40:04.498 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json already exists in the corpus 8. +2026-01-30 17:40:04.498 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.506 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.506 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.506 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.539 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.540 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.544 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Waymo's robotaxis to start carrying passengers in Atlanta.json +2026-01-30 17:40:04.545 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Waymo's robotaxis to start carrying passengers in Atlanta.json already exists in the corpus 8. +2026-01-30 17:40:04.545 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.556 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.556 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.556 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.598 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.599 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.602 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing ‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json +2026-01-30 17:40:04.604 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id ‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json already exists in the corpus 8. +2026-01-30 17:40:04.604 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.614 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.614 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.614 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.651 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.652 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.655 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing 23-year-old Ukrainian refugee killed on North Carolina transit system.json +2026-01-30 17:40:04.657 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id 23-year-old Ukrainian refugee killed on North Carolina transit system.json already exists in the corpus 8. +2026-01-30 17:40:04.657 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.665 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.665 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.665 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.706 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.707 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.711 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing 23-year-old Ukrainian refugee killed on North Carolina transit system.json +2026-01-30 17:40:04.712 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id 23-year-old Ukrainian refugee killed on North Carolina transit system.json already exists in the corpus 8. +2026-01-30 17:40:04.712 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.721 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.722 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.722 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.740 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.740 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.744 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json +2026-01-30 17:40:04.746 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id A 10-year-old boy in Tokyo ended up with Shohei Ohtani's first home run of the season.json already exists in the corpus 8. +2026-01-30 17:40:04.746 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.756 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.756 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.756 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.835 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.836 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.840 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Adams case and other Trump moves threaten to open corruption floodgates, experts say.json +2026-01-30 17:40:04.841 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Adams case and other Trump moves threaten to open corruption floodgates, experts say.json already exists in the corpus 8. +2026-01-30 17:40:04.841 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.849 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.849 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.849 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.876 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.876 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.879 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json +2026-01-30 17:40:04.880 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id After a couple struck a deer in Alabama, a fire chief who stopped to help was fatally shot.json already exists in the corpus 8. +2026-01-30 17:40:04.880 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.888 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.888 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.888 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.926 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.927 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.931 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Agency that handles green cards and citizenship to hire armed agents who can make arrests.json +2026-01-30 17:40:04.933 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Agency that handles green cards and citizenship to hire armed agents who can make arrests.json already exists in the corpus 8. +2026-01-30 17:40:04.933 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.943 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.943 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.943 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:04.971 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:04.972 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:04.976 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json +2026-01-30 17:40:04.977 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Amazon apologizes to Mandy Moore after package is delivered to ruins of in-laws' California home.json already exists in the corpus 8. +2026-01-30 17:40:04.977 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:04.989 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:04.989 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:04.989 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.026 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.027 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.029 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json +2026-01-30 17:40:05.030 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id As Trump considers ways to dismantle the Education Deparment, here's what to know about your student loans.json already exists in the corpus 8. +2026-01-30 17:40:05.030 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.038 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.038 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.038 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.059 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.060 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.063 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json +2026-01-30 17:40:05.065 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Belgium's future queen caught up in Trump administration's Harvard foreign student ban effort.json already exists in the corpus 8. +2026-01-30 17:40:05.065 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.071 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.071 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.071 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.115 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.115 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.119 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Biden administration has no plans to fine companies if TikTok ban goes into effect.json +2026-01-30 17:40:05.120 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Biden administration has no plans to fine companies if TikTok ban goes into effect.json already exists in the corpus 8. +2026-01-30 17:40:05.120 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.128 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.128 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.128 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.157 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.158 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.161 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json +2026-01-30 17:40:05.164 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Bruce Springsteen opens U.K. tour by calling Trump 'unfit' for office.json already exists in the corpus 8. +2026-01-30 17:40:05.164 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.174 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.174 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.174 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.195 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.196 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.199 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json +2026-01-30 17:40:05.201 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Charlie Javice, college financial aid startup founder, found guilty of defrauding JPMorgan.json already exists in the corpus 8. +2026-01-30 17:40:05.201 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.210 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.210 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.210 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.242 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.242 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.245 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Civil rights agency sued over handling of trans worker discrimination complaints.json +2026-01-30 17:40:05.247 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Civil rights agency sued over handling of trans worker discrimination complaints.json already exists in the corpus 8. +2026-01-30 17:40:05.247 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.254 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.254 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.254 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.271 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.271 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.274 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing DHS has begun performing polygraph tests on employees to find leakers.json +2026-01-30 17:40:05.276 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id DHS has begun performing polygraph tests on employees to find leakers.json already exists in the corpus 8. +2026-01-30 17:40:05.276 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.282 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.282 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.282 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.309 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.310 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.314 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json +2026-01-30 17:40:05.315 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Elon Musk turns on Nigel Farage, calls on him to step down as U.K. party leader.json already exists in the corpus 8. +2026-01-30 17:40:05.315 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.322 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.322 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.322 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.371 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.374 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.378 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing How much money you should save for a comfortable retirement.json +2026-01-30 17:40:05.380 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id How much money you should save for a comfortable retirement.json already exists in the corpus 8. +2026-01-30 17:40:05.380 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.389 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.389 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.389 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.411 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.413 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.416 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json +2026-01-30 17:40:05.418 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Israeli strikes kill 14 in Gaza in one day as negotiators work to uphold fragile ceasefire.json already exists in the corpus 8. +2026-01-30 17:40:05.418 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.428 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.428 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.428 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.453 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.453 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.457 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Lakers star Luka Dončić says he took a month off from basketball to transform his body.json +2026-01-30 17:40:05.458 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Lakers star Luka Dončić says he took a month off from basketball to transform his body.json already exists in the corpus 8. +2026-01-30 17:40:05.458 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.468 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.468 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.468 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.490 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.490 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.493 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Musk's brain implant company filed as a 'disadvantaged business'.json +2026-01-30 17:40:05.495 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Musk's brain implant company filed as a 'disadvantaged business'.json already exists in the corpus 8. +2026-01-30 17:40:05.495 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.502 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.502 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.502 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.529 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.530 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.533 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json +2026-01-30 17:40:05.534 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Naomi Osaka tears up after first-round French Open loss to Paula Badosa.json already exists in the corpus 8. +2026-01-30 17:40:05.534 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.541 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.542 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.542 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.556 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.556 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.560 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing New York Jets to sign QB Justin Fields, according to reports.json +2026-01-30 17:40:05.561 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id New York Jets to sign QB Justin Fields, according to reports.json already exists in the corpus 8. +2026-01-30 17:40:05.561 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.570 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.570 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.570 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.592 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.593 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.597 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json +2026-01-30 17:40:05.599 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Phillies star Bryce Harper uses a blue bat in gender reveal for his child.json already exists in the corpus 8. +2026-01-30 17:40:05.599 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.609 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.609 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.609 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.638 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.638 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.641 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json +2026-01-30 17:40:05.644 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Russian strikes batter Ukraine as Zelenskyy accuses Putin of stalling peace talks.json already exists in the corpus 8. +2026-01-30 17:40:05.644 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.655 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.655 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.655 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.691 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.691 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.695 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Sen. Michael Bennet will run for governor of Colorado in 2026.json +2026-01-30 17:40:05.697 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Sen. Michael Bennet will run for governor of Colorado in 2026.json already exists in the corpus 8. +2026-01-30 17:40:05.697 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.704 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.704 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.704 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.754 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.755 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.758 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json +2026-01-30 17:40:05.759 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Suspect pleads guilty in Highland Park mass shooting at July Fourth parade.json already exists in the corpus 8. +2026-01-30 17:40:05.760 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.767 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.767 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.767 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.818 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.819 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.822 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Target says its holiday sales were better than expected — but its profits weren't.json +2026-01-30 17:40:05.824 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Target says its holiday sales were better than expected — but its profits weren't.json already exists in the corpus 8. +2026-01-30 17:40:05.824 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.833 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.833 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.833 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:05.881 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:05.882 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:05.886 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing The 14 best toothpastes for clean, healthy teeth in 2025.json +2026-01-30 17:40:05.888 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id The 14 best toothpastes for clean, healthy teeth in 2025.json already exists in the corpus 8. +2026-01-30 17:40:05.888 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:05.900 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:05.900 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:05.900 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.002 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.005 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.009 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing The 50+ best white t-shirts tested and ranked, according to NBC Select editors.json +2026-01-30 17:40:06.010 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id The 50+ best white t-shirts tested and ranked, according to NBC Select editors.json already exists in the corpus 8. +2026-01-30 17:40:06.010 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.018 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.018 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.018 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.047 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.048 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.051 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing These three LGBTQ women just made congressional 'herstory'.json +2026-01-30 17:40:06.052 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id These three LGBTQ women just made congressional 'herstory'.json already exists in the corpus 8. +2026-01-30 17:40:06.052 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.062 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.062 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.062 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.080 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.081 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.084 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Thousands of U.S. seniors deal with the harsh realities of homelessness.json +2026-01-30 17:40:06.087 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Thousands of U.S. seniors deal with the harsh realities of homelessness.json already exists in the corpus 8. +2026-01-30 17:40:06.087 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.096 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.096 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.096 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.148 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.149 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.152 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json +2026-01-30 17:40:06.153 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Trump administration uses King's 'Dream' speech to introduce executive orders cutting DEI.json already exists in the corpus 8. +2026-01-30 17:40:06.153 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.160 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.160 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.160 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.217 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.218 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.223 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump wants automakers to move vehicle production to the U.S. It's not that simple..json +2026-01-30 17:40:06.224 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Trump wants automakers to move vehicle production to the U.S. It's not that simple..json already exists in the corpus 8. +2026-01-30 17:40:06.224 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.234 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.234 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.234 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.267 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.268 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.271 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json +2026-01-30 17:40:06.273 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Trump's 'big, beautiful bill' includes these key tax changes for 2025 — what they mean for you.json already exists in the corpus 8. +2026-01-30 17:40:06.273 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.285 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.285 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.285 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.318 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.319 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.322 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json +2026-01-30 17:40:06.324 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id U.S. envoy Steve Witkoff will travel to Israel to address humanitarian crisis in Gaza.json already exists in the corpus 8. +2026-01-30 17:40:06.324 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.332 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.332 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.332 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.352 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.353 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.355 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json +2026-01-30 17:40:06.357 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Ukraine and allies discuss ways to pressure Russia into 30-day ceasefire.json already exists in the corpus 8. +2026-01-30 17:40:06.357 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.365 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.365 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.365 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.401 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.402 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.406 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json +2026-01-30 17:40:06.408 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Utah lawmakers said gender-affirming care is harmful to kids. Their own study contradicts that claim..json already exists in the corpus 8. +2026-01-30 17:40:06.408 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.415 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.415 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.415 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.441 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.442 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.445 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing Waymo's robotaxis to start carrying passengers in Atlanta.json +2026-01-30 17:40:06.447 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id Waymo's robotaxis to start carrying passengers in Atlanta.json already exists in the corpus 8. +2026-01-30 17:40:06.447 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.456 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.456 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.456 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.498 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - =============================== Importing a new CAS as a Document. =============================== +2026-01-30 17:40:06.500 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Setting Metadata done. +2026-01-30 17:40:06.503 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Importing ‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json +2026-01-30 17:40:06.505 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document with id ‘Call Her Daddy’ host Alex Cooper claims college soccer coach sexually harassed her.json already exists in the corpus 8. +2026-01-30 17:40:06.505 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Checking if that document was also post-processed yet... +2026-01-30 17:40:06.517 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Document was already post-processed. +2026-01-30 17:40:06.517 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done. +2026-01-30 17:40:06.517 [pool-2-thread-1] INFO org.texttechnologylab.uce.corpusimporter.Importer - Finished with importing that CAS. + + + +2026-01-30 17:40:06.890 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - Postprocessing the Corpus GerParCor_Reichstag +2026-01-30 17:40:06.890 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - Done with the corpus postprocessing. +2026-01-30 17:40:06.890 [main] INFO org.texttechnologylab.uce.corpusimporter.Importer - + +================================= + Done with the corpus import. diff --git a/uce.portal/uce.corpus-importer/src/main/java/org/texttechnologylab/uce/corpusimporter/Importer.java b/uce.portal/uce.corpus-importer/src/main/java/org/texttechnologylab/uce/corpusimporter/Importer.java index bba58c2d..4d98c653 100644 --- a/uce.portal/uce.corpus-importer/src/main/java/org/texttechnologylab/uce/corpusimporter/Importer.java +++ b/uce.portal/uce.corpus-importer/src/main/java/org/texttechnologylab/uce/corpusimporter/Importer.java @@ -41,6 +41,7 @@ import org.texttechnologylab.uce.common.models.biofid.GnFinderTaxon; import org.texttechnologylab.uce.common.models.corpus.*; import org.texttechnologylab.uce.common.models.corpus.emotion.Feeling; +import org.texttechnologylab.uce.common.models.corpus.emotion.SentenceEmotion; import org.texttechnologylab.uce.common.models.corpus.links.AnnotationLink; import org.texttechnologylab.uce.common.models.corpus.links.AnnotationToDocumentLink; import org.texttechnologylab.uce.common.models.corpus.links.DocumentLink; @@ -481,6 +482,34 @@ public Document XMIToDocument(JCas jCas, Corpus corpus, String filePath) { return XMIToDocument(jCas, corpus, filePath, null); } + private void linkSentenceEmotions(Document document) { + if (document.getSentences() == null || document.getEmotions() == null) return; + + var sentenceBySpan = new java.util.HashMap(); + for (var s : document.getSentences()) { + sentenceBySpan.put(s.getBegin() + ":" + s.getEnd(), s); + } + + for (var e : document.getEmotions()) { + var s = sentenceBySpan.get(e.getBegin() + ":" + e.getEnd()); + if (s == null) continue; + + if (e.getSentenceEmotions() == null) { + e.setSentenceEmotions(new java.util.ArrayList<>()); + } + + var model = (e.getModel() != null) ? e.getModel() : "unknown"; + + if (e.getFeelings() == null) continue; + + for (var f : e.getFeelings()) { + e.getSentenceEmotions().add( + new SentenceEmotion(s, e, model, f.getFeeling(), f.getValue()) + ); + } + } + } + /** * Convert a UIMA jCas to an OCRDocument * @@ -605,7 +634,10 @@ public Document XMIToDocument(JCas jCas, Corpus corpus, String filePath, String if (corpusConfig.getAnnotations().isEmotion()) ExceptionUtils.tryCatchLog( - () -> setEmotions(document, jCas), + () -> { + setEmotions(document, jCas); + linkSentenceEmotions(document); + }, (ex) -> logImportWarn("This file should have contained Emotion annotations, but selecting them caused an error.", ex, filePath)); if (corpusConfig.getAnnotations().isLemma()) @@ -1817,6 +1849,67 @@ private void postProccessCorpus(Corpus corpus, CorpusConfig corpusConfig) { logger.info("Done with the corpus postprocessing."); } + /** + * Each topic annotation is matched to an existing sentence using + * its begin and end offsets. For every (label, score) pair found, + * a corresponding entry is inserted into the + * table, linking the topic classification to the sentence. + * The method only performs sentence-level imports and does not + * create unified or aggregated topic representations + */ + private void importSentenceTopicsFromXmiIntoDb(Document document, String xmiFilePath) { + try { + var jCas = JCasFactory.createJCas(); + + try (InputStream raw = Files.newInputStream(Paths.get(xmiFilePath)); + InputStream in = xmiFilePath.endsWith(".gz") ? new GZIPInputStream(raw) : raw) { + + CasIOUtils.load(in, jCas.getCas()); + } + + if (casView != null) { + jCas = jCas.getView(casView); + } + + var topicAnnos = JCasUtil.select(jCas, org.texttechnologylab.annotation.Topic.class); + if (topicAnnos.isEmpty()) { + logger.info("No Topic annotations found in XMI: {}", xmiFilePath); + return; + } + + int inserted = 0; + + for (var topicSpan : topicAnnos) { + int begin = topicSpan.getBegin(); + int end = topicSpan.getEnd(); + + var topicsArr = topicSpan.getTopics(); + if (topicsArr == null || topicsArr.size() == 0) continue; + + for (int i = 0; i < topicsArr.size(); i++) { + var fs = topicsArr.get(i); + if (!(fs instanceof AnnotationComment comment)) continue; + + String label = comment.getKey(); + String valueStr = comment.getValue(); + if (label == null || label.isBlank() || valueStr == null || valueStr.isBlank()) continue; + + double score; + try { score = Double.parseDouble(valueStr); } + catch (NumberFormatException nfe) { continue; } + + inserted += db.insertSentenceTopicBySpan(document.getId(), begin, end, label, score); + } + } + + logger.info("Imported sentence topic annotations into sentencetopics: documentId={}, insertedRows={}", + document.getId(), inserted); + + } catch (Exception ex) { + logger.error("Error importing sentence topics from XMI into DB. xmi={}", xmiFilePath, ex); + } + } + /** * Here we apply any postprocessing of a document that isn't DUUI and needs the document to be stored once like * the rag vector embeddings. @@ -1825,6 +1918,15 @@ private void postProccessDocument(Document document, Corpus corpus, String fileP logImportInfo("Postprocessing " + filePath, LogStatus.POST_PROCESSING, filePath, 0); var start = System.currentTimeMillis(); var corpusConfig = corpus.getViewModel().getCorpusConfig(); + // Import sentence-level topic annotations (News XMI: annotation2:Topic + AnnotationComment) + importSentenceTopicsFromXmiIntoDb(document, filePath); + + // build unifiedtopic + link sentencetopics.unifiedtopic_id + ExceptionUtils.tryCatchLog( + () -> db.ensureUnifiedTopicsForSentenceTopics(document.getId()), + (ex) -> logImportError("Error creating/linking unifiedtopic rows for sentence topics.", ex, filePath) + ); + // Store simple connections between Time, Geonames and Annotation to approximate the question: // This annotation occurred in context with this location at this time. @@ -1989,13 +2091,14 @@ private void postProccessDocument(Document document, Corpus corpus, String fileP logger.info("Inserting Sentence and Document Topics..."); try { - Path insertSentenceTopicsFilePath = Paths.get(commonConfig.getDatabaseScriptsLocation(), "topic/1_updateSentenceTopics.sql"); + /**Path insertSentenceTopicsFilePath = Paths.get(commonConfig.getDatabaseScriptsLocation(), "topic/1_updateSentenceTopics.sql"); var insertSentenceTopicsScript = Files.readString(insertSentenceTopicsFilePath); ExceptionUtils.tryCatchLog( () -> db.executeSqlWithoutReturn(insertSentenceTopicsScript), (ex) -> logImportError("Error executing SQL script to populate sentencetopics table", ex, filePath) ); + */ Path insertDocumentTopicsFilePath = Paths.get(commonConfig.getDatabaseScriptsLocation(), "topic/2_updateDocumentTopics.sql"); var insertDocumentTopicsScript = Files.readString(insertDocumentTopicsFilePath); diff --git a/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/App.java b/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/App.java index 97534c64..6037916a 100644 --- a/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/App.java +++ b/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/App.java @@ -93,7 +93,7 @@ public static void main(String[] args) throws IOException { () -> new AnnotationConfigApplicationContext(SpringConfig.class), (ex) -> logger.fatal("========== [ABORT] ==========\nThe Application context couldn't be established. " + "This is very likely due to a missing/invalid database connection. UCE will have to shutdown.")); - if(context == null) return; + if (context == null) return; logger.info("Loaded application context and services."); // Execute the external database scripts @@ -115,7 +115,7 @@ public static void main(String[] args) throws IOException { logger.info(languageResource.get("search")); // Load in and test the model resources for the Analysis Engine - if(SystemStatus.UceConfig.getSettings().getAnalysis().isEnableAnalysisEngine()){ + if (SystemStatus.UceConfig.getSettings().getAnalysis().isEnableAnalysisEngine()) { var modelResources = new ModelResources(); var ttlabScorer = new TTLabScorerInfo(); var cohMetrixInfo = new CohMetrixInfo(); @@ -134,7 +134,7 @@ public static void main(String[] args) throws IOException { SystemStatus.LexiconIsCalculating = true; var lexiconService = context.getBean(LexiconService.class); var addedLexiconEntries = 0; - if(forceLexicalization) addedLexiconEntries = lexiconService.updateLexicon(true); + if (forceLexicalization) addedLexiconEntries = lexiconService.updateLexicon(true); else addedLexiconEntries = lexiconService.checkForUpdates(); logger.info("Finished updating the lexicon. Added new entries: " + addedLexiconEntries); SystemStatus.LexiconIsCalculating = false; @@ -142,23 +142,23 @@ public static void main(String[] args) throws IOException { logger.info("Checking if we can or should update any linkables... (this may take a moment depending on the time of the last update. Runs asynchronous.)"); CompletableFuture.runAsync(() -> { - try{ + try { var result = context.getBean(PostgresqlDataInterface_Impl.class).callLogicalLinksRefresh(); logger.info("Finished updating the linkables. Updated linkables: " + result); - } catch (Exception ex){ + } catch (Exception ex) { logger.error("There was an error trying to refresh linkables in the startup of the web app. App starts normally though."); } }); logger.info("Checking if we can or should update any geoname locations... (this may take a moment depending on the time of the last update. Runs asynchronous.)"); CompletableFuture.runAsync(() -> { - try{ + try { var result = context.getBean(PostgresqlDataInterface_Impl.class).callGeonameLocationRefresh(); logger.info("Finished updating the geoname locations. Updated locations: " + result); logger.info("Trying to refresh the timeline map cache..."); context.getBean(MapService.class).refreshCachedTimelineMap(false); logger.info("Finished refreshing the timeline map."); - } catch (Exception ex){ + } catch (Exception ex) { logger.error("There was an error trying to refresh geoname locations in the startup of the web app. App starts normally though."); } }); @@ -176,8 +176,7 @@ public static void main(String[] args) throws IOException { // We use the externalLocation method so that the files in the public folder are hot reloaded if (commonConfig.useExternalPublicLocation()) { config.staticFiles.add(commonConfig.getPublicLocation(), Location.EXTERNAL); - } - else { + } else { config.staticFiles.add("/public", Location.CLASSPATH); } logger.info("Setup FreeMarker templates and public folders."); @@ -200,8 +199,7 @@ public static void main(String[] args) throws IOException { ExceptionUtils.tryCatchLog(() -> initMCP(registry, config), (ex) -> logger.error("There was a problem initializing the MCP server, web service will be shut down.", ex)); logger.info("MCP server initialized."); - } - else { + } else { logger.info("MCP server is disabled and will not be initialized."); } config.jsonMapper(mapper); @@ -350,174 +348,177 @@ private static void initSparkRoutes(ApplicationContext context, ApiRegistry regi List groups = modelResources.getGroupedModelObjects(); config.router.apiBuilder(() -> { - before(ctx -> { - ctx.res().setCharacterEncoding("UTF-8"); - // Setup and log all API calls with some information. We don't want to log file uploads, since it would - // destroy the file body stream. - if (!(ctx.contentType() != null && ctx.contentType().contains("multipart/form-data"))) { - ctx.attribute("id", UUID.randomUUID().toString()); - logger.info("Received API call: ID={}, IP={}, Method={}, URI={}, QUERY={}, BODY={}", - ctx.attribute("id"), ctx.ip(), ctx.method().name(), ctx.url(), ctx.queryString(), ctx.body()); - - // Should we log to db as well? - if (commonConfig.getLogToDb() && SystemStatus.PostgresqlDbStatus.isAlive()) { - var uceLog = new UCELog(ctx.ip(), ctx.method().name(), ctx.url(), ctx.body(), ctx.queryString()); - ExceptionUtils.tryCatchLog( - () -> context.getBean(PostgresqlDataInterface_Impl.class).saveUceLog(uceLog), - (ex) -> logger.error("Error storing a log to the database: ", ex)); - logger.info("Last log was also logged to the db with id " + uceLog.getId()); - } - } else { - // Else we have a form-data upload. We handle those explicitly. - // Set the multipart data configs for uploads - ctx.req().setAttribute("org.eclipse.jetty.multipartConfig", new MultipartConfigElement("/tmp")); - } - - // Always inject the current system config into all UI templates - RequestContextHolder.setUceConfigHolder(SystemStatus.UceConfig); - - // Check if the request contains a language parameter - var languageResources = LanguageResources.fromRequest(ctx); - ctx.header("Content-Language", languageResources.getDefaultLanguage()); - RequestContextHolder.setLanguageResources(languageResources); - - // Check if we have an authenticated user in the session and inject it into the template - if (SystemStatus.UceConfig.getSettings().getAuthentication().isActivated()) { - var user = SessionManager.getUserFromRequest(ctx); - RequestContextHolder.setAuthenticatedUceUser(user); - } - }); + before(ctx -> { + ctx.res().setCharacterEncoding("UTF-8"); + // Setup and log all API calls with some information. We don't want to log file uploads, since it would + // destroy the file body stream. + if (!(ctx.contentType() != null && ctx.contentType().contains("multipart/form-data"))) { + ctx.attribute("id", UUID.randomUUID().toString()); + logger.info("Received API call: ID={}, IP={}, Method={}, URI={}, QUERY={}, BODY={}", + ctx.attribute("id"), ctx.ip(), ctx.method().name(), ctx.url(), ctx.queryString(), ctx.body()); + + // Should we log to db as well? + if (commonConfig.getLogToDb() && SystemStatus.PostgresqlDbStatus.isAlive()) { + var uceLog = new UCELog(ctx.ip(), ctx.method().name(), ctx.url(), ctx.body(), ctx.queryString()); + ExceptionUtils.tryCatchLog( + () -> context.getBean(PostgresqlDataInterface_Impl.class).saveUceLog(uceLog), + (ex) -> logger.error("Error storing a log to the database: ", ex)); + logger.info("Last log was also logged to the db with id " + uceLog.getId()); + } + } else { + // Else we have a form-data upload. We handle those explicitly. + // Set the multipart data configs for uploads + ctx.req().setAttribute("org.eclipse.jetty.multipartConfig", new MultipartConfigElement("/tmp")); + } + + // Always inject the current system config into all UI templates + RequestContextHolder.setUceConfigHolder(SystemStatus.UceConfig); + + // Check if the request contains a language parameter + var languageResources = LanguageResources.fromRequest(ctx); + ctx.header("Content-Language", languageResources.getDefaultLanguage()); + RequestContextHolder.setLanguageResources(languageResources); + + // Check if we have an authenticated user in the session and inject it into the template + if (SystemStatus.UceConfig.getSettings().getAuthentication().isActivated()) { + var user = SessionManager.getUserFromRequest(ctx); + RequestContextHolder.setAuthenticatedUceUser(user); + } + }); + + // Landing page + get("/", ctx -> { + var model = new HashMap(); + model.put("title", SystemStatus.UceConfig.getMeta().getName()); + model.put("corpora", context.getBean(PostgresqlDataInterface_Impl.class) + .getAllCorpora() + .stream().map(Corpus::getViewModel) + .toList()); + model.put("commonConf", commonConfig); + model.put("isSparqlAlive", SystemStatus.JenaSparqlStatus.isAlive()); + model.put("isAuthAlive", SystemStatus.AuthenticationService.isAlive()); + model.put("isDbAlive", SystemStatus.PostgresqlDbStatus.isAlive()); + model.put("isRagAlive", SystemStatus.RagServiceStatus.isAlive()); + model.put("isS3StorageAlive", SystemStatus.S3StorageStatus.isAlive()); + model.put("isLexiconCalculating", SystemStatus.LexiconIsCalculating); + model.put("alphabetList", StringUtils.getAlphabetAsList()); + model.put("lexiconEntriesCount", context.getBean(LexiconService.class).countLexiconEntries()); + model.put("lexiconizableAnnotations", LexiconService.lexiconizableAnnotations); + model.put("uceVersion", commonConfig.getUceVersion()); + model.put("modelGroups", groups); + model.put("ttlabScorer", taInputMap); + model.put("cohMetrix", cohMetrixMap); + + // The vm files are located under the resources directory + ctx.render("index.ftl", model); + }); + + // Potential imprint + get("/imprint", ctx -> { + var model = new HashMap(); + model.put("imprint", SystemStatus.UceConfig.getCorporate().getImprint()); + ctx.render("imprint.ftl", model); + }); + + // A document reader view + get("/documentReader", (ctx) -> (registry.get(DocumentApi.class)).getSingleDocumentReadView(ctx)); + + // A corpus World View + get("/globe", (ctx) -> (registry.get(DocumentApi.class)).get3dGlobe(ctx)); + + + path("/auth", () -> { + get("/login", (ctx) -> (registry.get(AuthenticationApi.class)).loginCallback(ctx)); + get("/logout", (ctx) -> (registry.get(AuthenticationApi.class)).logoutCallback(ctx)); + }); + + // API routes + path("/api", () -> { + before("/*", (ctx) -> { + }); - // Landing page - get("/", ctx -> { - var model = new HashMap(); - model.put("title", SystemStatus.UceConfig.getMeta().getName()); - model.put("corpora", context.getBean(PostgresqlDataInterface_Impl.class) - .getAllCorpora() - .stream().map(Corpus::getViewModel) - .toList()); - model.put("commonConf", commonConfig); - model.put("isSparqlAlive", SystemStatus.JenaSparqlStatus.isAlive()); - model.put("isAuthAlive", SystemStatus.AuthenticationService.isAlive()); - model.put("isDbAlive", SystemStatus.PostgresqlDbStatus.isAlive()); - model.put("isRagAlive", SystemStatus.RagServiceStatus.isAlive()); - model.put("isS3StorageAlive", SystemStatus.S3StorageStatus.isAlive()); - model.put("isLexiconCalculating", SystemStatus.LexiconIsCalculating); - model.put("alphabetList", StringUtils.getAlphabetAsList()); - model.put("lexiconEntriesCount", context.getBean(LexiconService.class).countLexiconEntries()); - model.put("lexiconizableAnnotations", LexiconService.lexiconizableAnnotations); - model.put("uceVersion", commonConfig.getUceVersion()); - model.put("modelGroups", groups); - model.put("ttlabScorer", taInputMap); - model.put("cohMetrix", cohMetrixMap); - - // The vm files are located under the resources directory - ctx.render("index.ftl", model); + path("/ie", () -> { + post("/upload/uima", (ctx) -> (registry.get(ImportExportApi.class)).uploadUIMA(ctx)); + get("/download/uima", (ctx) -> (registry.get(ImportExportApi.class)).downloadUIMA(ctx)); + post("/import/path", (ctx) -> (registry.get(ImportExportApi.class)).importCorpusFromPath(ctx)); + post("/import/upload",(ctx) -> (registry.get(ImportExportApi.class)).importCorpusFromUpload(ctx)); + }); + + path("/wiki", () -> { + get("/page", (ctx) -> (registry.get(WikiApi.class)).getPage(ctx)); + get("/annotation", (ctx) -> (registry.get(WikiApi.class)).getAnnotation(ctx)); + path("/linkable", () -> { + post("/node", (ctx) -> (registry.get(WikiApi.class)).getLinkableNode(ctx)); + }); + path("/lexicon", () -> { + post("/entries", (ctx) -> (registry.get(WikiApi.class)).getLexicon(ctx)); + post("/occurrences", (ctx) -> (registry.get(WikiApi.class)).getOccurrencesOfLexiconEntry(ctx)); }); + post("/queryOntology", (ctx) -> (registry.get(WikiApi.class)).queryOntology(ctx)); + }); - // Potential imprint - get("/imprint", ctx -> { - var model = new HashMap(); - model.put("imprint", SystemStatus.UceConfig.getCorporate().getImprint()); - ctx.render("imprint.ftl", model); + path("/corpus", () -> { + get("/inspector", (ctx) -> (registry.get(DocumentApi.class)).getCorpusInspectorView(ctx)); + get("/documentsList", (ctx) -> (registry.get(DocumentApi.class)).getDocumentListOfCorpus(ctx)); + path("/map", () -> { + post("/linkedOccurrences", (ctx) -> (registry.get(MapApi.class)).getLinkedOccurrences(ctx)); + post("/linkedOccurrenceClusters", (ctx) -> (registry.get(MapApi.class)).getLinkedOccurrenceClusters(ctx)); }); + }); - // A document reader view - get("/documentReader", (ctx) -> (registry.get(DocumentApi.class)).getSingleDocumentReadView(ctx)); + path("/search", () -> { + post("/default", (ctx) -> (registry.get(SearchApi.class)).search(ctx)); + post("/semanticRole", (ctx) -> (registry.get(SearchApi.class)).semanticRoleSearch(ctx)); + post("/layered", (ctx) -> (registry.get(SearchApi.class)).layeredSearch(ctx)); + get("/active/page", (ctx) -> (registry.get(SearchApi.class)).activeSearchPage(ctx)); + get("/active/sort", (ctx) -> (registry.get(SearchApi.class)).activeSearchSort(ctx)); + get("/semanticRole/builder", (ctx) -> (registry.get(SearchApi.class)).getSemanticRoleBuilderView(ctx)); + }); - // A corpus World View - get("/globe", (ctx) -> (registry.get(DocumentApi.class)).get3dGlobe(ctx)); + path("/analysis", () -> { + post("/runPipeline", (ctx) -> (registry.get(AnalysisApi.class)).runPipeline(ctx)); + get("/setHistory", (ctx) -> (registry.get(AnalysisApi.class)).setHistory(ctx)); + post("/callHistory", (ctx) -> (registry.get(AnalysisApi.class)).callHistory(ctx)); + post("/callHistoryText", (ctx) -> (registry.get(AnalysisApi.class)).callHistoryText(ctx)); + post("/importCas", (registry.get(AnalysisApi.class)).importCas); //added the importCas path + }); + path("/corpusUniverse", () -> { + // Gets a corpus universe view + get("/new", (ctx) -> (registry.get(CorpusUniverseApi.class)).getCorpusUniverseView(ctx)); + post("/fromSearch", (ctx) -> (registry.get(CorpusUniverseApi.class)).fromSearch(ctx)); + post("/fromCorpus", (ctx) -> (registry.get(CorpusUniverseApi.class)).fromCorpus(ctx)); + get("/nodeInspectorContent", (ctx) -> (registry.get(CorpusUniverseApi.class)).getNodeInspectorContentView(ctx)); + }); - path("/auth", () -> { - get("/login", (ctx) -> (registry.get(AuthenticationApi.class)).loginCallback(ctx)); - get("/logout", (ctx) -> (registry.get(AuthenticationApi.class)).logoutCallback(ctx)); - }); + path("/document", () -> { + get("/reader/pagesList", (ctx) -> (registry.get(DocumentApi.class)).getPagesListView(ctx)); + get("/uceMetadata", (ctx) -> (registry.get(DocumentApi.class)).getUceMetadataOfDocument(ctx)); + get("/topics", (ctx) -> (registry.get(DocumentApi.class)).getDocumentTopics(ctx)); + get("/page/taxon", (ctx) -> (registry.get(DocumentApi.class)).getTaxonCountByPage(ctx)); + get("/page/topics", (ctx) -> (registry.get(DocumentApi.class)).getDocumentTopicDistributionByPage(ctx)); + get("/page/topicEntityRelation", (ctx) -> (registry.get(DocumentApi.class)).getSentenceTopicsWithEntities(ctx)); + get("/page/topicWords", (ctx) -> (registry.get(DocumentApi.class)).getTopicWordsByDocument(ctx)); + get("/unifiedTopicSentenceMap", (ctx) -> (registry.get(DocumentApi.class)).getUnifiedTopicToSentenceMap(ctx)); + get("/page/namedEntities", (ctx) -> (registry.get(DocumentApi.class)).getDocumentNamedEntitiesByPage(ctx)); + get("/page/lemma", (ctx) -> (registry.get(DocumentApi.class)).getDocumentLemmaByPage(ctx)); + get("/page/geoname", (ctx) -> (registry.get(DocumentApi.class)).getDocumentGeonameByPage(ctx)); + delete("/delete", (ctx) -> (registry.get(DocumentApi.class)).deleteDocument(ctx)); + get("/findIdByMetadata", (ctx) -> (registry.get(DocumentApi.class)).findDocumentIdByMetadata(ctx)); + get("/findIdsByMetadata", (ctx) -> (registry.get(DocumentApi.class)).findDocumentIdsByMetadata(ctx)); + }); - // API routes - path("/api", () -> { - before("/*", (ctx) -> { - }); - - path("/ie", () -> { - post("/upload/uima", (ctx) -> (registry.get(ImportExportApi.class)).uploadUIMA(ctx)); - get("/download/uima", (ctx) -> (registry.get(ImportExportApi.class)).downloadUIMA(ctx)); - }); - - path("/wiki", () -> { - get("/page", (ctx) -> (registry.get(WikiApi.class)).getPage(ctx)); - get("/annotation", (ctx) -> (registry.get(WikiApi.class)).getAnnotation(ctx)); - path("/linkable", () -> { - post("/node", (ctx) -> (registry.get(WikiApi.class)).getLinkableNode(ctx)); - }); - path("/lexicon", () -> { - post("/entries", (ctx) -> (registry.get(WikiApi.class)).getLexicon(ctx)); - post("/occurrences", (ctx) -> (registry.get(WikiApi.class)).getOccurrencesOfLexiconEntry(ctx)); - }); - post("/queryOntology", (ctx) -> (registry.get(WikiApi.class)).queryOntology(ctx)); - }); - - path("/corpus", () -> { - get("/inspector", (ctx) -> (registry.get(DocumentApi.class)).getCorpusInspectorView(ctx)); - get("/documentsList", (ctx) -> (registry.get(DocumentApi.class)).getDocumentListOfCorpus(ctx)); - path("/map", () -> { - post("/linkedOccurrences", (ctx) -> (registry.get(MapApi.class)).getLinkedOccurrences(ctx)); - post("/linkedOccurrenceClusters", (ctx) -> (registry.get(MapApi.class)).getLinkedOccurrenceClusters(ctx)); - }); - }); - - path("/search", () -> { - post("/default", (ctx) -> (registry.get(SearchApi.class)).search(ctx)); - post("/semanticRole", (ctx) -> (registry.get(SearchApi.class)).semanticRoleSearch(ctx)); - post("/layered", (ctx) -> (registry.get(SearchApi.class)).layeredSearch(ctx)); - get("/active/page", (ctx) -> (registry.get(SearchApi.class)).activeSearchPage(ctx)); - get("/active/sort", (ctx) -> (registry.get(SearchApi.class)).activeSearchSort(ctx)); - get("/semanticRole/builder", (ctx) -> (registry.get(SearchApi.class)).getSemanticRoleBuilderView(ctx)); - }); - - path("/analysis", () -> { - post("/runPipeline", (ctx) -> (registry.get(AnalysisApi.class)).runPipeline(ctx)); - get("/setHistory", (ctx) -> (registry.get(AnalysisApi.class)).setHistory(ctx)); - post("/callHistory", (ctx) -> (registry.get(AnalysisApi.class)).callHistory(ctx)); - post("/callHistoryText", (ctx) -> (registry.get(AnalysisApi.class)).callHistoryText(ctx)); - }); - - path("/corpusUniverse", () -> { - // Gets a corpus universe view - get("/new", (ctx) -> (registry.get(CorpusUniverseApi.class)).getCorpusUniverseView(ctx)); - post("/fromSearch", (ctx) -> (registry.get(CorpusUniverseApi.class)).fromSearch(ctx)); - post("/fromCorpus", (ctx) -> (registry.get(CorpusUniverseApi.class)).fromCorpus(ctx)); - get("/nodeInspectorContent", (ctx) -> (registry.get(CorpusUniverseApi.class)).getNodeInspectorContentView(ctx)); - }); - - path("/document", () -> { - get("/reader/pagesList", (ctx) -> (registry.get(DocumentApi.class)).getPagesListView(ctx)); - get("/uceMetadata", (ctx) -> (registry.get(DocumentApi.class)).getUceMetadataOfDocument(ctx)); - get("/topics", (ctx) -> (registry.get(DocumentApi.class)).getDocumentTopics(ctx)); - get("/page/taxon", (ctx) -> (registry.get(DocumentApi.class)).getTaxonCountByPage(ctx)); - get("/page/topics", (ctx) -> (registry.get(DocumentApi.class)).getDocumentTopicDistributionByPage(ctx)); - get("/page/topicEntityRelation", (ctx) -> (registry.get(DocumentApi.class)).getSentenceTopicsWithEntities(ctx)); - get("/page/topicWords", (ctx) -> (registry.get(DocumentApi.class)).getTopicWordsByDocument(ctx)); - get("/unifiedTopicSentenceMap", (ctx) -> (registry.get(DocumentApi.class)).getUnifiedTopicToSentenceMap(ctx)); - get("/page/namedEntities", (ctx) -> (registry.get(DocumentApi.class)).getDocumentNamedEntitiesByPage(ctx)); - get("/page/lemma", (ctx) -> (registry.get(DocumentApi.class)).getDocumentLemmaByPage(ctx)); - get("/page/geoname", (ctx) -> (registry.get(DocumentApi.class)).getDocumentGeonameByPage(ctx)); - delete("/delete", (ctx) -> (registry.get(DocumentApi.class)).deleteDocument(ctx)); - get("/findIdByMetadata", (ctx) -> (registry.get(DocumentApi.class)).findDocumentIdByMetadata(ctx)); - get("/findIdsByMetadata", (ctx) -> (registry.get(DocumentApi.class)).findDocumentIdsByMetadata(ctx)); - }); - - path("/rag", () -> { - get("/new", (ctx) -> (registry.get(RAGApi.class)).getNewRAGChat(ctx)); - // NOTE we allow also "post" here, as the system prompt can get quite long... - post("/new", (ctx) -> (registry.get(RAGApi.class)).getNewRAGChat(ctx)); - post("/postUserMessage", (ctx) -> (registry.get(RAGApi.class)).postUserMessage(ctx)); - get("/messages", (ctx) -> (registry.get(RAGApi.class)).getMessagesForChat(ctx)); - get("/plotTsne", (ctx) -> (registry.get(RAGApi.class)).getTsnePlot(ctx)); - get("/sentenceEmbeddings", (ctx) -> (registry.get(RAGApi.class)).getSentenceEmbeddings(ctx)); - }); - }); + path("/rag", () -> { + get("/new", (ctx) -> (registry.get(RAGApi.class)).getNewRAGChat(ctx)); + // NOTE we allow also "post" here, as the system prompt can get quite long... + post("/new", (ctx) -> (registry.get(RAGApi.class)).getNewRAGChat(ctx)); + post("/postUserMessage", (ctx) -> (registry.get(RAGApi.class)).postUserMessage(ctx)); + get("/messages", (ctx) -> (registry.get(RAGApi.class)).getMessagesForChat(ctx)); + get("/plotTsne", (ctx) -> (registry.get(RAGApi.class)).getTsnePlot(ctx)); + get("/sentenceEmbeddings", (ctx) -> (registry.get(RAGApi.class)).getSentenceEmbeddings(ctx)); }); + }); + }); } private static JsonMapper getJsonMapper() { diff --git a/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/routes/AnalysisApi.java b/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/routes/AnalysisApi.java index 866242bc..16fbd9eb 100644 --- a/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/routes/AnalysisApi.java +++ b/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/routes/AnalysisApi.java @@ -3,6 +3,7 @@ import com.google.gson.Gson; import freemarker.template.Configuration; import io.javalin.http.Context; +import io.javalin.http.Handler; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.springframework.context.ApplicationContext; @@ -10,8 +11,10 @@ import org.texttechnologylab.uce.analysis.RunDUUIPipeline; import org.texttechnologylab.uce.analysis.modules.DUUIInformation; import org.texttechnologylab.uce.common.annotations.auth.Authentication; +import org.texttechnologylab.uce.common.models.authentication.UceUser; import org.texttechnologylab.uce.common.models.dto.AnalysisRequestDto; import org.texttechnologylab.uce.common.models.dto.HistoryRequestDto; +import org.texttechnologylab.uce.web.SessionManager; import java.util.HashMap; import java.util.List; @@ -55,11 +58,19 @@ public void runPipeline(Context ctx) { model.put("inputStance", inputStance); model.put("inputLLM", inputLLM); + UceUser user = SessionManager.getUserFromRequest(ctx); + String userId = (user != null) ? user.getUsername() : "user-unknown"; + RunDUUIPipeline.setThreadLocalUserId(userId); + RunDUUIPipeline pipeline = new RunDUUIPipeline(); - DUUIInformation DataRequest = pipeline.getModelResources(selectedModels, inputText, inputClaim, inputCoherence, inputStance, inputLLM); + RunDUUIPipeline.AnalysisResponse resp = + pipeline.getModelResourcesWithHandle(selectedModels, inputText, inputClaim, + inputCoherence, inputStance, inputLLM); + DUUIInformation DataRequest = resp.duuiInformation; model.put("DUUI", DataRequest); model.put("SuccessRequest", true); model.put("modelGroups", DataRequest.getModelGroups()); + model.put("analysisId", resp.analysisId); // set history history.addDuuiInformation(String.valueOf(counter), DataRequest); @@ -180,5 +191,38 @@ public void callHistoryText(Context ctx) { ctx.render("defaultError.ftl"); } } - + // IMPORT ROUTE + @Authentication(required = Authentication.Requirement.LOGGED_IN, + route = Authentication.RouteTypes.POST, + path = "/api/analysis/importCas" + ) + public Handler importCas = ctx -> { + try { + String analysisId = ctx.queryParam("analysisId"); + if (analysisId == null || analysisId.isBlank()) { + ctx.status(400).result("Missing analysisId"); + return; + } + + // Lookup cached session + RunDUUIPipeline.AnalysisSession session = RunDUUIPipeline.getCachedSession(analysisId); + if (session == null) { + ctx.status(404).result("No cached CAS found for analysisId=" + analysisId); + return; + } + + // send to importer + long corpusId = Long.parseLong(ctx.queryParam("corpusId")); // from ?corpusId=... + String importPath = "/api/ie/upload/uima"; + String importUrl = ctx.scheme() + "://" + ctx.host() + importPath; + + RunDUUIPipeline.sendToImporterViaHttp(importUrl, analysisId, corpusId, analysisId, null); + ctx.status(200).result("CAS imported successfully for analysisId=" + analysisId); + } catch (NumberFormatException nfe) { + ctx.status(400).result("corpusId is required and must be a number"); + } catch (Exception e) { + logger.error("Error importing CAS", e); + ctx.status(500).result("Error importing CAS: " + e.getMessage()); + } + }; } diff --git a/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/routes/ImportExportApi.java b/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/routes/ImportExportApi.java index a47013a9..bc43a31e 100644 --- a/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/routes/ImportExportApi.java +++ b/uce.portal/uce.web/src/main/java/org/texttechnologylab/uce/web/routes/ImportExportApi.java @@ -1,35 +1,45 @@ package org.texttechnologylab.uce.web.routes; import com.google.gson.Gson; -import com.google.gson.JsonIOException; -import com.google.gson.JsonSyntaxException; +import com.google.gson.GsonBuilder; import io.javalin.http.Context; +import io.javalin.http.UploadedFile; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.springframework.context.ApplicationContext; import org.texttechnologylab.uce.common.config.CorpusConfig; +import org.texttechnologylab.uce.common.config.corpusConfig.CorpusAnnotationConfig; +import org.texttechnologylab.uce.common.config.corpusConfig.OtherConfig; +import org.texttechnologylab.uce.common.config.corpusConfig.TaxonConfig; import org.texttechnologylab.uce.common.exceptions.DatabaseOperationException; import org.texttechnologylab.uce.common.exceptions.ExceptionUtils; -import org.texttechnologylab.uce.common.models.corpus.Corpus; +import org.texttechnologylab.uce.common.models.imp.ImportStatus; +import org.texttechnologylab.uce.common.models.imp.UCEImport; import org.texttechnologylab.uce.common.services.PostgresqlDataInterface_Impl; import org.texttechnologylab.uce.common.services.S3StorageService; import org.texttechnologylab.uce.common.utils.StringUtils; import org.texttechnologylab.uce.corpusimporter.Importer; +import java.io.IOException; +import java.io.InputStream; import java.nio.charset.StandardCharsets; +import java.nio.file.Files; +import java.nio.file.Path; +import java.nio.file.Paths; +import java.nio.file.StandardCopyOption; import java.util.HashMap; import java.util.Map; +import java.util.UUID; import java.util.concurrent.CompletableFuture; + public class ImportExportApi implements UceApi { + private static final Logger logger = LogManager.getLogger(PostgresqlDataInterface_Impl.class); private S3StorageService s3StorageService; private PostgresqlDataInterface_Impl db; private ApplicationContext serviceContext; - private static final Logger logger = LogManager.getLogger(PostgresqlDataInterface_Impl.class); - private static Gson gson = new Gson(); - public ImportExportApi(ApplicationContext serviceContext) { this.serviceContext = serviceContext; this.s3StorageService = serviceContext.getBean(S3StorageService.class); @@ -54,7 +64,7 @@ public void downloadUIMA(Context ctx) { ctx.res().setContentType(contentType); ctx.res().setHeader("Content-Disposition", "attachment; filename=\"" + objectName + "." + StringUtils.getExtensionByContentType(contentType) + "\""); - var buffer = new byte[8192]; + var buffer = new byte[8192]; int bytesRead; while ((bytesRead = s3Stream.read(buffer)) != -1) { out.write(buffer, 0, bytesRead); @@ -74,9 +84,11 @@ public void uploadUIMA(Context ctx) { // First, we need to know which corpus this document should be added to. var corpusId = ExceptionUtils.tryCatchLog( () -> Long.parseLong(new String(ctx.req().getPart("corpusId").getInputStream().readAllBytes(), StandardCharsets.UTF_8)), - (ex) -> logger.error("Error getting the corpusId this document should be added to. Aborting.", ex)); + (ex) -> logger.error("Error getting corpusId from request.", ex)); + if (corpusId == null) { - ctx.result("Parameter corpusId didn't exist. Without it, the document cannot be uploaded."); + ctx.status(400); + ctx.result("Parameter corpusId didn't exist; cannot upload document."); return; } @@ -91,29 +103,12 @@ public void uploadUIMA(Context ctx) { var corpus = ExceptionUtils.tryCatchLog( () -> db.getCorpusById(corpusId), - (ex) -> logger.error("Couldn't fetch corpus when uploading new document to corpusId " + corpusId, ex)); + (ex) -> logger.error("Couldn't fetch corpus with id " + corpusId, ex)); + if (corpus == null) { - var corpusConfigRaw = ExceptionUtils.tryCatchLog( - () -> new String(ctx.req().getPart("corpusConfig").getInputStream().readAllBytes(), StandardCharsets.UTF_8), - (ex) -> logger.error("Error getting the corpusConfig that should be used for this document. Aborting.", ex)); - if (corpusConfigRaw == null) { - ctx.result("Corpus with id " + corpusId + " wasn't found in the database; no config was provided; can't upload document."); - return; - } - logger.info("Corpus with id " + corpusId + " wasn't found in the database; creating a new corpus with the provided config."); - try { - var corpusConfig = gson.fromJson(corpusConfigRaw, CorpusConfig.class); - corpus = new Corpus(); - var corpusReturn = Importer.CreateDBCorpus(corpus, corpusConfig, this.db); - if (corpusReturn != null) { - corpus = corpusReturn; - } - } catch (JsonIOException | JsonSyntaxException e) { - ctx.result("The corpusConfig provided is not properly formatted."); - } catch (DatabaseOperationException e) { - ctx.result("Error creating a new corpus in the database: " + e.getMessage()); - return; - } + ctx.status(404); + ctx.result("Corpus with id " + corpusId + " wasn't found in the database."); + return; } // TODO just use 1 as default? will throw an error if this is null otherwise... @@ -122,10 +117,9 @@ public void uploadUIMA(Context ctx) { try (var input = ctx.req().getPart("file").getInputStream()) { var fileName = ctx.req().getPart("file").getSubmittedFileName(); // Import the doc in the background - final Corpus corpus1 = corpus; var importFuture = CompletableFuture.supplyAsync(() -> { try { - return importer.storeUploadedXMIToCorpusAsync(input, corpus1, fileName, documentId); + return importer.storeUploadedXMIToCorpusAsync(input, corpus, fileName, documentId); } catch (DatabaseOperationException e) { throw new RuntimeException(e); } @@ -139,6 +133,7 @@ public void uploadUIMA(Context ctx) { if (acceptedContentType != null && acceptedContentType.equals("application/json")) { Map apiResult = new HashMap<>(); apiResult.put("document_id", newDocumentId); +// ctx.contentType("application/json"); //redundant ctx.json(apiResult); return; } @@ -149,6 +144,169 @@ public void uploadUIMA(Context ctx) { ctx.status(500); ctx.result("Error uploading a file: " + e.getMessage()); } - }; + } + + + public void importCorpusFromPath(Context ctx) { + try { + String path = ctx.formParam("path"); + String numThreadStr = ctx.formParam("numThreads"); + int numThreads = (numThreadStr != null && !numThreadStr.isBlank()) ? Integer.parseInt(numThreadStr) : 1; + String casView = ctx.formParam("casView"); + + if (casView != null && casView.isBlank()) { + casView = null; + } + + if (path == null || path.isBlank()) { + ctx.status(400).result("Path is required"); + return; + } + + String importId = UUID.randomUUID().toString(); + int importerNumber = 1; + Importer importer = new Importer(serviceContext, path, importerNumber, importId, casView); + UCEImport uceImport = new UCEImport(importId, path, ImportStatus.STARTING); + Integer fileCount = ExceptionUtils.tryCatchLog(importer::getXMICountInPath, + (ex) -> logger.warn("There was an IO error counting the importable UIMA files - the import will probably fail at some point.", ex)); + uceImport.setTotalDocuments(fileCount == null ? -1 : fileCount); + db.saveOrUpdateUceImport(uceImport); + CompletableFuture.runAsync(() -> { + try { + importer.start(numThreads); + } catch (DatabaseOperationException e) { + logger.error("Error during asynchronous corpus import", e); + } + }); + ctx.status(200).result("Import started. Import ID: " + importId); + } catch (DatabaseOperationException e) { + logger.error("Error when creating saving/updating to database" + e); + ctx.status(500).result("Database error initiating corpus import" + e.getMessage()); + + } catch (Exception e) { + logger.error("Error initiating corpus import", e); + ctx.status(500).result("Error initiating import: " + e.getMessage()); + } + + } + + public void importCorpusFromUpload(Context ctx){ + try{ + String importId = UUID.randomUUID().toString(); + Path rootDir = java.nio.file.Paths.get(System.getProperty("java.io.tmpdir"), "uce_uploads", importId); + Path inputDir = rootDir.resolve("input"); + Files.createDirectories(inputDir); + + var validFiles = ctx.uploadedFiles("files").stream() + .filter(f -> f.size() > 0 && f.filename() != null && !f.filename().isBlank()) + .toList(); + + if (validFiles.isEmpty()) { + ctx.status(400).result("No files selected. Please select at least one XMI file or archive."); + return; + } + + for(UploadedFile uploadedFile : ctx.uploadedFiles("files")){ + try(InputStream input = uploadedFile.content()){ + Files.copy(input,inputDir.resolve(uploadedFile.filename()), StandardCopyOption.REPLACE_EXISTING); + } + } + + CorpusConfig config = new CorpusConfig(); + String name = ctx.formParam("name"); + if (name == null || name.isBlank()){ + ctx.status(400).result("No corpus name given"); + } + config.setName(name); + String author = ctx.formParam("author"); + if (author == null || author.isBlank()) { + ctx.status(400).result("Corpus Author is required."); + return; + } + config.setAuthor(author); + String language = ctx.formParam("language"); + if (language == null || language.isBlank()) { + ctx.status(400).result("Corpus Language is required."); + return; + } + config.setLanguage(language); + config.setDescription(ctx.formParam("description")); + String addToExistingParam = ctx.formParam("addToExistingCorpus"); + boolean addToExisting = addToExistingParam != null && Boolean.parseBoolean(addToExistingParam); + config.setAddToExistingCorpus(addToExisting); + +// Annotations + CorpusAnnotationConfig annotations = new CorpusAnnotationConfig(); + annotations.setSentence(ctx.formParam("sentence") != null); + annotations.setLemma(ctx.formParam("lemma") != null); + annotations.setNamedEntity(ctx.formParam("namedEntity") != null); + annotations.setSentiment(ctx.formParam("sentiment") != null); + annotations.setEmotion(ctx.formParam("emotion") != null); + annotations.setTime(ctx.formParam("time") != null); + annotations.setGeoNames(ctx.formParam("geoNames") != null); + annotations.setWikipediaLink(ctx.formParam("wikipediaLink") != null); + annotations.setImage(ctx.formParam("image") != null); + annotations.setUnifiedTopic(ctx.formParam("unifiedTopic") != null); + annotations.setOCRPage(ctx.formParam("OCRPage") != null); + annotations.setOCRParagraph(ctx.formParam("OCRParagraph") != null); + annotations.setOCRBlock(ctx.formParam("OCRBlock") != null); + annotations.setOCRLine(ctx.formParam("OCRLine") != null); + + TaxonConfig taxonConfig = new TaxonConfig(); + taxonConfig.setAnnotated(ctx.formParam("taxonAnnotated") != null); + taxonConfig.setBiofidOnthologyAnnotated(ctx.formParam("biofidOnthologyAnnotated") != null); + + annotations.setTaxon(taxonConfig); + config.setAnnotations(annotations); + +// Other Settings + OtherConfig otherConfig = new OtherConfig(); + otherConfig.setEnableEmbeddings(ctx.formParam("enableEmbeddings") != null); + otherConfig.setEnableRAGBot(ctx.formParam("enableRAGBot") != null); + otherConfig.setIncludeKeywordDistribution(ctx.formParam("includeKeywordDistribution") != null); + otherConfig.setEnableS3Storage(ctx.formParam("enableS3Storage") != null); + config.setOther(otherConfig); + + Gson gson = new GsonBuilder().setPrettyPrinting().create(); + String jsonString = gson.toJson(config); + Files.writeString(rootDir.resolve("corpusConfig.json"),jsonString,StandardCharsets.UTF_8); + + String numThreadStr = ctx.formParam("numThreads"); + int numThreads = (numThreadStr != null && !numThreadStr.isBlank()) ? Integer.parseInt(numThreadStr) : 1; + String casView = ctx.formParam("casView"); + if(casView != null && casView.isBlank()) casView = null; + int importerNumber = 1; + Importer importer = new Importer(serviceContext,rootDir.toString(),importerNumber,importId,casView); + + String logTitle = (addToExisting ? "ADD_TO:" : "UPLOAD_NEW:") + name; + UCEImport uceImport = new UCEImport(importId,logTitle,ImportStatus.STARTING); + Integer fileCount = ExceptionUtils.tryCatchLog(importer::getXMICountInPath, + (ex) -> logger.warn("IO Error counting upload files.",ex)); + uceImport.setTotalDocuments(fileCount == null ? -1 : fileCount); + db.saveOrUpdateUceImport(uceImport); + CompletableFuture.runAsync(() -> { + try{ + importer.start(numThreads); + } catch (DatabaseOperationException e) { + logger.error("Error during asynchronous corpus uplaod import",e); + }finally { + try { + org.apache.commons.io.FileUtils.deleteDirectory(rootDir.toFile()); + } catch (IOException e) { + logger.warn("Could not delete temp upload dir: " + rootDir,e); + } + } + }); + + ctx.status(200).result("Upload sucessfull. Import started with ID: " + importId); + + } catch (IOException e) { + logger.error("Error handling file upload import", e); + ctx.status(500).result("Error during upload " + e.getMessage()); + } catch (DatabaseOperationException e) { + logger.error("Error saving/updating database during Uce Import", e); + ctx.status(500).result("Error during saving/updating database " + e.getMessage()); + } + } } diff --git a/uce.portal/uce.web/src/main/resources/languageTranslations.json b/uce.portal/uce.web/src/main/resources/languageTranslations.json index f34ce979..185db241 100644 --- a/uce.portal/uce.web/src/main/resources/languageTranslations.json +++ b/uce.portal/uce.web/src/main/resources/languageTranslations.json @@ -538,5 +538,9 @@ "sentenceTopicFlow": { "de-DE": "Satz-Themenfluss", "en-EN": "Sentence Topic Flow" + }, + "sentenceSentiment": { + "de-DE": "Satz-Sentiment", + "en-EN": "Sentence Sentiment" } } \ No newline at end of file