Skip to content

Commit dbd9aa8

Browse files
committed
Improve cleanup of facts and titles, with more manual steps
1 parent 5ed837a commit dbd9aa8

File tree

1 file changed

+10
-2
lines changed

1 file changed

+10
-2
lines changed

main.go

Lines changed: 10 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,6 @@ import (
66
"bufio"
77
"flag"
88
"fmt"
9-
"html"
109
"io"
1110
"log"
1211
"os"
@@ -606,7 +605,16 @@ func (p *TripleAggregateToWikiPageConverter) convertUriToWikiTitle(uri string, u
606605
// Clean up strange characters
607606
factTitle = str.Replace(factTitle, "[", "(", -1)
608607
factTitle = str.Replace(factTitle, "]", ")", -1)
609-
factTitle = html.EscapeString(factTitle)
608+
factTitle = str.Replace(factTitle, "{", "(", -1)
609+
factTitle = str.Replace(factTitle, "}", ")", -1)
610+
factTitle = str.Replace(factTitle, "|", " ", -1)
611+
factTitle = str.Replace(factTitle, "#", " ", -1)
612+
factTitle = str.Replace(factTitle, "<", "less than", -1)
613+
factTitle = str.Replace(factTitle, ">", "greater than", -1)
614+
factTitle = str.Replace(factTitle, "?", " ", -1)
615+
factTitle = str.Replace(factTitle, "&", " ", -1)
616+
factTitle = str.Replace(factTitle, ".", " ", -1)
617+
factTitle = str.Replace(factTitle, "=", "-", -1)
610618

611619
// Clean up according to regexes
612620
for _, r := range p.cleanUpRegexes {

0 commit comments

Comments
 (0)