-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathtrain.go
81 lines (74 loc) · 2.01 KB
/
train.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
package chatfreely
import (
"github.com/mb-14/gomarkov"
"github.com/writeas/go-writeas/v3"
"log"
"net/url"
"os"
"strings"
"sync"
)
const writeasURL = "https://write.as"
func fetchBlogPosts(alias, instance string) ([]writeas.Post, error) {
// Normalize and correctly parse instance
if instance == "" {
instance = writeasURL
}
if !strings.HasPrefix(instance, "http") {
instance = "https://" + instance
}
host, err := url.Parse(instance)
if err != nil {
return nil, err
}
host.Path = "/api"
// Set up WriteFreely API client
log.Printf("Fetching blog posts from '%s' on %s (via %s)...", alias, host.Host, host.String())
var c *writeas.Client
if instance == writeasURL {
c = writeas.NewClient()
// Write.as requires an application key to get around rate limiting
c.SetApplicationKey(os.Getenv("WRITEAS_APP_KEY"))
} else {
c = writeas.NewClientWith(writeas.Config{
URL: host.String(),
})
}
var posts *[]writeas.Post
var allPosts []writeas.Post
i := 1
for i == 1 || len(*posts) != 0 {
log.Printf("Page %d...", i)
posts, err = c.GetCollectionPosts(alias, i)
if err != nil {
return nil, err
}
allPosts = append(allPosts, *posts...)
i++
}
return allPosts, err
}
// BuildModel creates a model with the given order, fetching posts from the given collection via the WriteFreely API.
func BuildModel(alias, instance string, order int) (*gomarkov.Chain, error) {
posts, err := fetchBlogPosts(alias, instance)
if err != nil {
return nil, err
}
return BuildModelWithPosts(posts, order)
}
// BuildModelWithPosts creates a model with the given order for the given posts.
func BuildModelWithPosts(posts []writeas.Post, order int) (*gomarkov.Chain, error) {
chain := gomarkov.NewChain(order)
var wg sync.WaitGroup
wg.Add(len(posts))
log.Printf("Adding %d posts to markov chain...", len(posts))
for _, storyID := range posts {
go func(p writeas.Post) {
defer wg.Done()
log.Printf("\"%s\"", p.Title)
chain.Add(strings.Split(p.Content, " "))
}(storyID)
}
wg.Wait()
return chain, nil
}