JabRef · liamsebestyen · Apr 1, 2025 · Apr 1, 2025 · Apr 1, 2025 · Apr 1, 2025
diff --git a/src/main/java/org/jabref/logic/importer/fileformat/PdfMergeMetadataImporter.java b/src/main/java/org/jabref/logic/importer/fileformat/PdfMergeMetadataImporter.java
@@ -161,17 +161,67 @@ private void fetchData(BibEntry candidate, StandardField field, IdBasedFetcher f
     }
 
     private static BibEntry mergeCandidates(Stream<BibEntry> candidates) {
-        final BibEntry entry = new BibEntry();
-        candidates.forEach(entry::mergeWith);
+        // Materialise the stream: the candidates are traversed twice (title scoring, then merging).
+        List<BibEntry> candidateList = candidates.toList();
 
-        // Retain online links only
-        List<LinkedFile> onlineLinks = entry.getFiles().stream().filter(LinkedFile::isOnlineLink).toList();
+        // Pick the best-scoring title across all candidates. The baseline is Integer.MIN_VALUE
+        // because calculateTitleScore can return negative values (penalties); a baseline of -1
+        // would silently discard every penalised title, even when it is the best one available.
+        int bestTitleScore = Integer.MIN_VALUE;
+        String bestTitle = null;
+        for (BibEntry candidate : candidateList) {
+            Optional<String> candidateTitle = candidate.getField(StandardField.TITLE);
+            if (candidateTitle.isPresent()) {
+                int score = calculateTitleScore(candidateTitle.get());
+                // Strict comparison: on a tie the earlier candidate keeps the title.
+                if (score > bestTitleScore) {
+                    bestTitleScore = score;
+                    bestTitle = candidateTitle.get();
+                }
+            }
+        }
+
+        // Merge every candidate into a fresh entry.
+        BibEntry entry = new BibEntry();
+        candidateList.forEach(entry::mergeWith);
+
+        // Replace whatever title the merge produced with the best-scoring one, if any was found.
+        if (bestTitle != null) {
+            entry.setField(StandardField.TITLE, bestTitle);
+        }
+
+        // Retain online links only
+        List<LinkedFile> onlineLinks = entry.getFiles().stream()
+                .filter(LinkedFile::isOnlineLink)
+                .toList();
         entry.clearField(StandardField.FILE);
         entry.addFiles(onlineLinks);
 
         return entry;
     }
 
+    /** Scores a title: one point per word, with penalties for over-long or file-name-like titles. */
+    private static int calculateTitleScore(String title) {
+        // One point per whitespace-separated word; titles over 35 words get a flat -2 instead.
+        int wordCount = title.trim().split("\\s+").length;
+        if (wordCount > 35) {
+            wordCount = -2;
+        }
+
+        // -10 if the title ends in a dot followed by 3-4 letters, i.e. looks like a file name.
+        int endsInExtension = title.matches(".*\\.[a-zA-Z]{3,4}") ? -10 : 0;
+
+        // A further -10 for well-known document/image extensions (case-insensitive).
+        int endsWithFileExtension = 0;
+        if (title.matches("(?i).*(\\.(pdf|doc|docx|odt|txt|jpg|jpeg|png))$")) {
+            endsWithFileExtension = -10;
+        }
+        return wordCount + endsInExtension + endsWithFileExtension;
+    }
+
+
+
+
     /**
      * Imports the BibTeX data from the given PDF file and relativized the paths of each linked file based on the context and the file preferences.
      */