Initial commit after restructure

This commit is contained in:
Daniel
2018-08-13 14:14:27 +02:00
commit bdeddc41f9
177 changed files with 26108 additions and 0 deletions

56
analytics/algs/lms.go Normal file
View File

@@ -0,0 +1,56 @@
// Copyright Safing ICS Technologies GmbH. Use of this source code is governed by the AGPL license that can be found in the LICENSE file.
package algs
import (
"strings"
)
func LmsScoreOfDomain(domain string) float64 {
var totalScore float64
domain = strings.ToLower(domain)
subjects := strings.Split(domain, ".")
// ignore the last two parts
if len(subjects) <= 3 {
return 100
}
subjects = subjects[:len(subjects)-3]
var totalLength int
for _, subject := range subjects {
totalLength += len(subject)
}
for _, subject := range subjects {
// calculate score, weigh it and add it
if len(subject) > 0 {
totalScore += LmsScore(subject) * (float64(len(subject)) / float64(totalLength))
}
}
return totalScore
}
func LmsScore(subject string) float64 {
lms_start := -1
lms_stop := -1
longest_lms := 0
for i, c := range subject {
if int(c) >= int('a') && int(c) <= int('z') {
if lms_start == -1 {
lms_start = i
}
} else {
if lms_start > -1 {
lms_stop = i
if lms_stop-lms_start > longest_lms {
longest_lms = lms_stop - lms_start
}
lms_start = -1
}
}
}
if lms_stop == -1 {
longest_lms = len(subject)
}
// fmt.Printf("algs: lms score of %s is %.2f\n", subject, (float64(longest_lms) * 100.0 / float64(len(subject))))
return (float64(longest_lms) * 100.0 / float64(len(subject)))
}

View File

@@ -0,0 +1,19 @@
// Copyright Safing ICS Technologies GmbH. Use of this source code is governed by the AGPL license that can be found in the LICENSE file.
package algs
import "testing"
func TestLmsScoreOfDomain(t *testing.T) {
testDomain(t, "g.symcd.com.", 100, 100)
testDomain(t, "www.google.com.", 100, 100)
testDomain(t, "55ttt5.12abc3.test.com.", 50, 50)
testDomain(t, "mbtq6opnuodp34gcrma65fxacgxv5ukr7lq6xuhr4mhoibe7.yvqptrozfbnqyemchpovw3q5xwjibuxfsgb72mix3znhpfhc.i2n7jh2gadqaadck3zs3vg3hbv5pkmwzeay4gc75etyettbb.isi5mhmowtfriu33uxzmgvjur5g2p3tloynwohfrggee6fkn.meop7kqyd5gwxxa3.er.spotify.com.", 0, 30)
}
func testDomain(t *testing.T, domain string, min, max float64) {
score := LmsScoreOfDomain(domain)
if score < min || score > max {
t.Errorf("domain %s has scored %.2f, but should be between %.0f and %.0f", domain, score, min, max)
}
}