oh yeah, go can do that multiple file thing
This commit is contained in:
parent
3ae62454db
commit
8a12f277b1
80
poll/cli.go
Normal file
80
poll/cli.go
Normal file
@ -0,0 +1,80 @@
|
||||
package main
|
||||
|
||||
import (
|
||||
"encoding/binary"
|
||||
"encoding/json"
|
||||
"fmt"
|
||||
"net"
|
||||
"log"
|
||||
"io"
|
||||
"os"
|
||||
)
|
||||
|
||||
func handleClient(commandClient net.Conn, runninginstances *[]RunningInstance, instanceReportChan chan InstanceReport) {
|
||||
|
||||
sizebyte := make([]byte, 4)
|
||||
var commandmap CommandMap
|
||||
var responseback ResponseBack
|
||||
n, err := io.ReadFull(commandClient, sizebyte)
|
||||
if n != 4 {
|
||||
fmt.Println("Did not read 4 bytes, failure.")
|
||||
os.Exit(1)
|
||||
}
|
||||
jsonsize := int(binary.LittleEndian.Uint32(sizebyte))
|
||||
jsonbyte := make([]byte, jsonsize)
|
||||
n, err = io.ReadFull(commandClient, jsonbyte)
|
||||
if n != jsonsize {
|
||||
fmt.Println("Failued to read json size of ", n)
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
err = json.Unmarshal(jsonbyte, &commandmap)
|
||||
if err != nil {
|
||||
fmt.Println("Unable to unmarshal")
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
switch commandmap.Type {
|
||||
case "status":
|
||||
responseback.Message = "Ok"
|
||||
case "add":
|
||||
log.Print("Manually added instance: " + commandmap.Endpoint)
|
||||
var q InstanceReport
|
||||
q.endpoint = commandmap.Endpoint
|
||||
q.status = NEW_INSTANCE
|
||||
|
||||
instanceReportChan <- q
|
||||
|
||||
responseback.Message = "Added " + commandmap.Endpoint
|
||||
case "suspend":
|
||||
fmt.Println("Suspend")
|
||||
case "resume":
|
||||
fmt.Println("Resume")
|
||||
default:
|
||||
fmt.Println("Something else")
|
||||
}
|
||||
|
||||
|
||||
responseback.Type = "status"
|
||||
responseback.RunningInstances = *runninginstances
|
||||
|
||||
responsebytes, err := json.Marshal(responseback)
|
||||
if err != nil {
|
||||
fmt.Println("Error: ", err)
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
n = len(responsebytes)
|
||||
binary.LittleEndian.PutUint32(sizebyte, uint32(n))
|
||||
|
||||
commandClient.Write(sizebyte)
|
||||
|
||||
responsebyte, err := json.Marshal(responseback)
|
||||
if err != nil {
|
||||
fmt.Println("Error response back: ", err)
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
commandClient.Write(responsebyte)
|
||||
commandClient.Close()
|
||||
}
|
459
poll/engine.go
459
poll/engine.go
@ -1,459 +0,0 @@
|
||||
package main
|
||||
|
||||
import (
|
||||
"github.com/microcosm-cc/bluemonday"
|
||||
"github.com/jackc/pgx/pgxpool"
|
||||
_ "net/http/pprof"
|
||||
"encoding/binary"
|
||||
"encoding/json"
|
||||
"crypto/sha1"
|
||||
"io/ioutil"
|
||||
"net/http"
|
||||
"context"
|
||||
"strings"
|
||||
"html"
|
||||
"time"
|
||||
"fmt"
|
||||
"net"
|
||||
"log"
|
||||
"io"
|
||||
"os"
|
||||
)
|
||||
|
||||
const (
|
||||
NEW_INSTANCE = 0
|
||||
RUNNING = 200
|
||||
TOOMANYREQUESTS = 429
|
||||
CLIENT_ISSUE = 600
|
||||
ONION_PROTOCOL = 601
|
||||
BAD_RESPONSE = 602
|
||||
NO_CONNECTION = 603
|
||||
BAD_NODEINFO = 604
|
||||
)
|
||||
|
||||
// Parsing Unmarshal JSON type
|
||||
type ReportPost struct {
|
||||
|
||||
// Retrieved values
|
||||
Id string `json:"id"`
|
||||
Url string `json:"url"`
|
||||
Account AccountType
|
||||
Content string `json:"content"`
|
||||
Created_at string `json:"created_at"`
|
||||
|
||||
// Derived values
|
||||
normalized string
|
||||
posthash []byte
|
||||
}
|
||||
|
||||
type AccountType struct {
|
||||
Acct string `json:"acct"`
|
||||
Avatar string `json:"avatar"`
|
||||
Bot bool `json:"bot"`
|
||||
Created_at string `json:"created_at"`
|
||||
Display_name string `json:"display_name"`
|
||||
Url string `json:"url"`
|
||||
}
|
||||
|
||||
// Used to report a new instance to main
|
||||
type InstanceReport struct {
|
||||
endpoint string
|
||||
status int
|
||||
|
||||
min_id string
|
||||
numposts int
|
||||
}
|
||||
|
||||
// Instance's new min_id value
|
||||
type RunningInstance struct {
|
||||
Endpoint string `json:"endpoint"`
|
||||
Software string `json:"software"`
|
||||
Min_id string
|
||||
Status int `json:"status"`
|
||||
LastRun string `json:"lastrun"`
|
||||
}
|
||||
|
||||
type NodeInfoSoftware struct {
|
||||
Name string `json:"name"`
|
||||
Version string `json:"version"`
|
||||
}
|
||||
|
||||
type NodeInfo struct {
|
||||
Software NodeInfoSoftware `json:"software"`
|
||||
}
|
||||
|
||||
type CommandMap struct {
|
||||
Type string `json:"Type"`
|
||||
Endpoint string `json:"Endpoint"`
|
||||
}
|
||||
|
||||
type ResponseBack struct {
|
||||
Type string `json:"Type"`
|
||||
Message string `json:"Message"`
|
||||
RunningInstances []RunningInstance `json:"RunningInstances"`
|
||||
}
|
||||
|
||||
func handleClient(commandClient net.Conn, runninginstances *[]RunningInstance, instanceReportChan chan InstanceReport) {
|
||||
|
||||
sizebyte := make([]byte, 4)
|
||||
var commandmap CommandMap
|
||||
var responseback ResponseBack
|
||||
n, err := io.ReadFull(commandClient, sizebyte)
|
||||
if n != 4 {
|
||||
fmt.Println("Did not read 4 bytes, failure.")
|
||||
os.Exit(1)
|
||||
}
|
||||
jsonsize := int(binary.LittleEndian.Uint32(sizebyte))
|
||||
jsonbyte := make([]byte, jsonsize)
|
||||
n, err = io.ReadFull(commandClient, jsonbyte)
|
||||
if n != jsonsize {
|
||||
fmt.Println("Failued to read json size of ", n)
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
err = json.Unmarshal(jsonbyte, &commandmap)
|
||||
if err != nil {
|
||||
fmt.Println("Unable to unmarshal")
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
switch commandmap.Type {
|
||||
case "status":
|
||||
responseback.Message = "Ok"
|
||||
case "add":
|
||||
log.Print("Manually added instance: " + commandmap.Endpoint)
|
||||
var q InstanceReport
|
||||
q.endpoint = commandmap.Endpoint
|
||||
q.status = NEW_INSTANCE
|
||||
|
||||
instanceReportChan <- q
|
||||
|
||||
responseback.Message = "Added " + commandmap.Endpoint
|
||||
case "suspend":
|
||||
fmt.Println("Suspend")
|
||||
case "resume":
|
||||
fmt.Println("Resume")
|
||||
default:
|
||||
fmt.Println("Something else")
|
||||
}
|
||||
|
||||
|
||||
responseback.Type = "status"
|
||||
responseback.RunningInstances = *runninginstances
|
||||
|
||||
responsebytes, err := json.Marshal(responseback)
|
||||
if err != nil {
|
||||
fmt.Println("Error: ", err)
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
n = len(responsebytes)
|
||||
binary.LittleEndian.PutUint32(sizebyte, uint32(n))
|
||||
|
||||
commandClient.Write(sizebyte)
|
||||
|
||||
responsebyte, err := json.Marshal(responseback)
|
||||
if err != nil {
|
||||
fmt.Println("Error response back: ", err)
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
commandClient.Write(responsebyte)
|
||||
commandClient.Close()
|
||||
}
|
||||
|
||||
/*
|
||||
* This code can be refactored per
|
||||
* https://golang.org/pkg/encoding/binary/
|
||||
* But for now, this should be sufficient
|
||||
*/
|
||||
/*
|
||||
func parseCommand(c net.Conn) {
|
||||
rawCommand := make([]byte, 1)
|
||||
}
|
||||
*/
|
||||
|
||||
func AppendIfMissing(hay []string, needle string) []string {
|
||||
for _, ele := range hay {
|
||||
if ele == needle {
|
||||
return hay
|
||||
}
|
||||
}
|
||||
return append(hay, needle)
|
||||
}
|
||||
|
||||
func StartInstancePoll(instancereport InstanceReport, reportPostChan chan ReportPost, instanceReportChan chan InstanceReport) {
|
||||
p := bluemonday.NewPolicy()
|
||||
newposts := make([]ReportPost, 0)
|
||||
|
||||
// Only placing this here to later have the option of using
|
||||
// an HTTP client via a SOCKS5 Tor proxy
|
||||
if strings.Contains(instancereport.endpoint, ".onion") == true {
|
||||
instanceReportChan <- InstanceReport{instancereport.endpoint, ONION_PROTOCOL, "", 0}
|
||||
return
|
||||
}
|
||||
|
||||
api_timeline := "https://" + instancereport.endpoint + "/api/v1/timelines/public?min_id=" + instancereport.min_id
|
||||
resp, err := http.Get(api_timeline)
|
||||
if err != nil {
|
||||
instanceReportChan <- InstanceReport{instancereport.endpoint, CLIENT_ISSUE, "", 0}
|
||||
return
|
||||
}
|
||||
|
||||
body, err := ioutil.ReadAll(resp.Body)
|
||||
err = json.Unmarshal(body, &newposts)
|
||||
if err != nil {
|
||||
// instanceReportChan <- InstanceReport{instancereport.endpoint, resp.StatusCode, "", 0}
|
||||
instanceReportChan <- InstanceReport{instancereport.endpoint, BAD_RESPONSE, "", 0}
|
||||
return
|
||||
}
|
||||
|
||||
newinstances := make([]string, 0)
|
||||
min_id := ""
|
||||
numposts := 0
|
||||
for _, newpost := range newposts {
|
||||
|
||||
if newpost.Account.Acct == "" {
|
||||
continue
|
||||
}
|
||||
|
||||
posthash := sha1.New()
|
||||
|
||||
at_sign := strings.Index(newpost.Account.Acct, "@")
|
||||
|
||||
if at_sign == -1 {
|
||||
at_sign = len(newpost.Account.Acct)
|
||||
newpost.Account.Acct += "@" + instancereport.endpoint
|
||||
}
|
||||
|
||||
// Calculate the post hash
|
||||
fmt.Fprint(posthash, newpost.Url)
|
||||
fmt.Fprint(posthash, newpost.normalized)
|
||||
fmt.Fprint(posthash, newpost.Account.Acct)
|
||||
fmt.Fprint(posthash, newpost.Account.Display_name)
|
||||
newpost.posthash = posthash.Sum(nil)
|
||||
|
||||
newpost.normalized = html.UnescapeString(strings.ToLower(p.Sanitize(newpost.Content)))
|
||||
|
||||
reportPostChan <- newpost
|
||||
|
||||
// Check min_id
|
||||
if newpost.Id > min_id {
|
||||
min_id = newpost.Id
|
||||
}
|
||||
numposts = numposts + 1
|
||||
|
||||
newinstance := newpost.Account.Acct[at_sign+1:]
|
||||
newinstances = AppendIfMissing(newinstances, newinstance)
|
||||
}
|
||||
|
||||
for _, newinstance := range newinstances {
|
||||
var q InstanceReport
|
||||
q.endpoint = newinstance
|
||||
q.status = NEW_INSTANCE
|
||||
q.min_id = ""
|
||||
q.numposts = 0
|
||||
instanceReportChan <- q
|
||||
}
|
||||
|
||||
instanceReportChan <- InstanceReport{instancereport.endpoint, resp.StatusCode, min_id, numposts}
|
||||
}
|
||||
|
||||
func DeferPollRun(instancereport InstanceReport, runninginstances *[]RunningInstance, instanceReportChan chan InstanceReport, reportPostChan chan ReportPost) {
|
||||
|
||||
delay := 10
|
||||
if instancereport.status == RUNNING && instancereport.numposts <= 10 {
|
||||
delay = 10
|
||||
} else if instancereport.status == RUNNING && instancereport.numposts > 10 {
|
||||
delay = 15
|
||||
} else if instancereport.status == 429 {
|
||||
delay = 30
|
||||
} else {
|
||||
fmt.Println("error, status code is ------------->: ", instancereport.status)
|
||||
os.Exit(1)
|
||||
}
|
||||
time.Sleep(time.Second * time.Duration(delay))
|
||||
|
||||
go StartInstancePoll(instancereport, reportPostChan, instanceReportChan)
|
||||
}
|
||||
|
||||
// Change this to return a proper "err"
|
||||
func GetNodeInfo(endpoint string, nodeinfo *NodeInfo) {
|
||||
api_nodeinfo := "https://" + endpoint + "/nodeinfo/2.0.json"
|
||||
http_client := http.Client{Timeout: 5 * time.Second}
|
||||
resp, err := http_client.Get(api_nodeinfo)
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
|
||||
body, err := ioutil.ReadAll(resp.Body)
|
||||
err = json.Unmarshal(body, &nodeinfo)
|
||||
if err != nil {
|
||||
// fmt.Println("Unmarshal 2");
|
||||
return
|
||||
}
|
||||
}
|
||||
|
||||
func NewInstance(endpoint string, runninginstances *[]RunningInstance, instanceReportChan chan InstanceReport, reportPostChan chan ReportPost) {
|
||||
var nodeinfo NodeInfo
|
||||
|
||||
if endpoint == "" {
|
||||
return
|
||||
}
|
||||
|
||||
// No repeats
|
||||
for _, runninginstance := range *runninginstances {
|
||||
if runninginstance.Endpoint == endpoint {
|
||||
return
|
||||
}
|
||||
}
|
||||
|
||||
// Check node type
|
||||
GetNodeInfo(endpoint, &nodeinfo)
|
||||
if nodeinfo.Software.Name == "" {
|
||||
go func() {
|
||||
var q InstanceReport
|
||||
q.endpoint = endpoint
|
||||
q.status = BAD_NODEINFO
|
||||
instanceReportChan <- q
|
||||
return
|
||||
}()
|
||||
}
|
||||
|
||||
newinstance := RunningInstance{endpoint, "", "", NEW_INSTANCE, "Queued"}
|
||||
*runninginstances = append(*runninginstances, newinstance)
|
||||
|
||||
if nodeinfo.Software.Name == "pleroma" || nodeinfo.Software.Name == "mastodon" {
|
||||
var newinstancereport InstanceReport
|
||||
newinstancereport.endpoint = endpoint
|
||||
newinstancereport.status = 0
|
||||
newinstancereport.min_id = ""
|
||||
newinstancereport.numposts = 0
|
||||
go StartInstancePoll(newinstancereport, reportPostChan, instanceReportChan)
|
||||
}
|
||||
}
|
||||
|
||||
func writePost(pool *pgxpool.Pool, reportpost ReportPost) {
|
||||
conn, err := pool.Acquire(context.Background())
|
||||
if err != nil {
|
||||
log.Fatal("Error connecting to database:", err)
|
||||
os.Exit(1)
|
||||
}
|
||||
defer conn.Release()
|
||||
|
||||
// Insert new account if new
|
||||
var accountid int
|
||||
err = conn.QueryRow(context.Background(), "INSERT INTO accounts (acct, avatar, bot, created_at, display_name, url) VALUES($1, $2, $3, $4, $5, $6) ON CONFLICT(acct) DO UPDATE SET acct=EXCLUDED.acct RETURNING id", reportpost.Account.Acct, reportpost.Account.Avatar, reportpost.Account.Bot, reportpost.Account.Created_at, reportpost.Account.Display_name, reportpost.Account.Url).Scan(&accountid)
|
||||
if err != nil {
|
||||
fmt.Println("First ", err)
|
||||
fmt.Println("--------------------------")
|
||||
fmt.Println("Reported error: ", err)
|
||||
fmt.Println("Account Acct: ", reportpost.Account.Acct)
|
||||
fmt.Println("Account Avatar: ", reportpost.Account.Avatar)
|
||||
fmt.Println("Account Avatar len: ", len(reportpost.Account.Avatar))
|
||||
fmt.Println("Account Bot: ", reportpost.Account.Bot)
|
||||
fmt.Println("Account Created_at: ", reportpost.Account.Created_at)
|
||||
fmt.Println("Account Display: ", reportpost.Account.Display_name)
|
||||
fmt.Println("Account URL: ", reportpost.Account.Url)
|
||||
fmt.Println(reportpost)
|
||||
fmt.Println("--------------------------")
|
||||
os.Exit(1) // For now I want this to die and learn why it failed
|
||||
return
|
||||
}
|
||||
|
||||
// Insert new post if new
|
||||
_, err = conn.Exec(context.Background(), "INSERT INTO posts (url, content, created_at, normalized, account_id, posthash) VALUES ($1, $2, $3, $4, $5, $6) ON CONFLICT (posthash) DO NOTHING", reportpost.Url, reportpost.Content, reportpost.Created_at, reportpost.normalized, accountid, reportpost.posthash)
|
||||
if err != nil { // For now I want to know why this failed.
|
||||
fmt.Println("Second ", err)
|
||||
fmt.Println("--------------------------")
|
||||
fmt.Println("Reported error: ", err)
|
||||
fmt.Println("Url: ", reportpost.Url)
|
||||
fmt.Println("Content: ", reportpost.Content)
|
||||
fmt.Println("Created_at: ", reportpost.Created_at)
|
||||
fmt.Println("normalized: ", reportpost.normalized)
|
||||
fmt.Println("account_id", accountid)
|
||||
fmt.Println("posthash: ", reportpost.posthash)
|
||||
fmt.Println("--------------------------")
|
||||
os.Exit(1) // For now I want this to die and learn why it failed
|
||||
return
|
||||
}
|
||||
}
|
||||
|
||||
func SuspendInstance(suspendinstance InstanceReport, runninginstances *[]RunningInstance) {
|
||||
for i, runninginstance := range *runninginstances {
|
||||
if runninginstance.Endpoint == suspendinstance.endpoint {
|
||||
(*runninginstances)[i].Status = suspendinstance.status
|
||||
(*runninginstances)[i].LastRun = time.Now().Format("2006.01.02-15:04:05")
|
||||
return
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
func engine() {
|
||||
|
||||
// Current instances
|
||||
runninginstances := make([]RunningInstance, 0)
|
||||
|
||||
// Initial Setup
|
||||
reportPostChan := make(chan ReportPost, 2000)
|
||||
instanceReportChan := make(chan InstanceReport, 100)
|
||||
|
||||
// Setup Database
|
||||
pool, err := pgxpool.Connect(context.Background(), "postgres://postgres@127.0.0.1/fedilogue")
|
||||
if err != nil {
|
||||
fmt.Fprintln(os.Stderr, "Unable to connect to database:", err)
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
l, err := net.Listen("tcp", "127.0.0.1:5555")
|
||||
if err != nil {
|
||||
fmt.Println(err)
|
||||
return
|
||||
}
|
||||
defer l.Close()
|
||||
|
||||
commandClient := make(chan net.Conn)
|
||||
|
||||
go func(l net.Listener) {
|
||||
for {
|
||||
c, err := l.Accept()
|
||||
if err != nil {
|
||||
fmt.Println("Error on accept")
|
||||
commandClient <- nil
|
||||
return
|
||||
}
|
||||
commandClient <- c
|
||||
}
|
||||
}(l)
|
||||
|
||||
for {
|
||||
select {
|
||||
case c := <-commandClient: // New client connection
|
||||
go handleClient(c, &runninginstances, instanceReportChan)
|
||||
case v := <-reportPostChan: // New Post
|
||||
go writePost(pool, v)
|
||||
case w := <-instanceReportChan: // Start or suspend instance
|
||||
if w.status == NEW_INSTANCE {
|
||||
NewInstance(w.endpoint, &runninginstances, instanceReportChan, reportPostChan)
|
||||
} else if w.status == RUNNING || w.status == TOOMANYREQUESTS {
|
||||
for i, runninginstance := range runninginstances {
|
||||
if runninginstance.Endpoint == w.endpoint {
|
||||
runninginstances[i].Min_id = w.min_id
|
||||
runninginstances[i].Status = w.status
|
||||
runninginstances[i].LastRun = time.Now().Format("2006.01.02-15:04:05")
|
||||
}
|
||||
}
|
||||
go DeferPollRun(w, &runninginstances, instanceReportChan, reportPostChan)
|
||||
} else {
|
||||
SuspendInstance(w, &runninginstances)
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
func main() {
|
||||
go engine()
|
||||
log.Println("serving on port 8080")
|
||||
log.Fatal(http.ListenAndServe(":8080", nil))
|
||||
}
|
74
poll/headers.go
Normal file
74
poll/headers.go
Normal file
@ -0,0 +1,74 @@
|
||||
package main
|
||||
|
||||
const (
|
||||
NEW_INSTANCE = 0
|
||||
RUNNING = 200
|
||||
TOOMANYREQUESTS = 429
|
||||
CLIENT_ISSUE = 600
|
||||
ONION_PROTOCOL = 601
|
||||
BAD_RESPONSE = 602
|
||||
NO_CONNECTION = 603
|
||||
BAD_NODEINFO = 604
|
||||
)
|
||||
|
||||
// Parsing Unmarshal JSON type
|
||||
type ReportPost struct {
|
||||
|
||||
// Retrieved values
|
||||
Id string `json:"id"`
|
||||
Url string `json:"url"`
|
||||
Account AccountType
|
||||
Content string `json:"content"`
|
||||
Created_at string `json:"created_at"`
|
||||
|
||||
// Derived values
|
||||
normalized string
|
||||
posthash []byte
|
||||
}
|
||||
|
||||
type AccountType struct {
|
||||
Acct string `json:"acct"`
|
||||
Avatar string `json:"avatar"`
|
||||
Bot bool `json:"bot"`
|
||||
Created_at string `json:"created_at"`
|
||||
Display_name string `json:"display_name"`
|
||||
Url string `json:"url"`
|
||||
}
|
||||
|
||||
// Used to report a new instance to main
|
||||
type InstanceReport struct {
|
||||
endpoint string
|
||||
status int
|
||||
|
||||
min_id string
|
||||
numposts int
|
||||
}
|
||||
|
||||
// Instance's new min_id value
|
||||
type RunningInstance struct {
|
||||
Endpoint string `json:"endpoint"`
|
||||
Software string `json:"software"`
|
||||
Min_id string
|
||||
Status int `json:"status"`
|
||||
LastRun string `json:"lastrun"`
|
||||
}
|
||||
|
||||
type NodeInfoSoftware struct {
|
||||
Name string `json:"name"`
|
||||
Version string `json:"version"`
|
||||
}
|
||||
|
||||
type NodeInfo struct {
|
||||
Software NodeInfoSoftware `json:"software"`
|
||||
}
|
||||
|
||||
type CommandMap struct {
|
||||
Type string `json:"Type"`
|
||||
Endpoint string `json:"Endpoint"`
|
||||
}
|
||||
|
||||
type ResponseBack struct {
|
||||
Type string `json:"Type"`
|
||||
Message string `json:"Message"`
|
||||
RunningInstances []RunningInstance `json:"RunningInstances"`
|
||||
}
|
175
poll/instance.go
Normal file
175
poll/instance.go
Normal file
@ -0,0 +1,175 @@
|
||||
package main
|
||||
|
||||
import (
|
||||
"github.com/microcosm-cc/bluemonday"
|
||||
"encoding/json"
|
||||
"crypto/sha1"
|
||||
"io/ioutil"
|
||||
"net/http"
|
||||
"strings"
|
||||
"html"
|
||||
"time"
|
||||
"fmt"
|
||||
"os"
|
||||
)
|
||||
|
||||
func DeferPollRun(instancereport InstanceReport, runninginstances *[]RunningInstance, instanceReportChan chan InstanceReport, reportPostChan chan ReportPost) {
|
||||
|
||||
delay := 10
|
||||
if instancereport.status == RUNNING && instancereport.numposts <= 10 {
|
||||
delay = 10
|
||||
} else if instancereport.status == RUNNING && instancereport.numposts > 10 {
|
||||
delay = 15
|
||||
} else if instancereport.status == 429 {
|
||||
delay = 30
|
||||
} else {
|
||||
fmt.Println("error, status code is ------------->: ", instancereport.status)
|
||||
os.Exit(1)
|
||||
}
|
||||
time.Sleep(time.Second * time.Duration(delay))
|
||||
|
||||
go StartInstancePoll(instancereport, reportPostChan, instanceReportChan)
|
||||
}
|
||||
|
||||
func StartInstancePoll(instancereport InstanceReport, reportPostChan chan ReportPost, instanceReportChan chan InstanceReport) {
|
||||
p := bluemonday.NewPolicy()
|
||||
newposts := make([]ReportPost, 0)
|
||||
|
||||
// Only placing this here to later have the option of using
|
||||
// an HTTP client via a SOCKS5 Tor proxy
|
||||
if strings.Contains(instancereport.endpoint, ".onion") == true {
|
||||
instanceReportChan <- InstanceReport{instancereport.endpoint, ONION_PROTOCOL, "", 0}
|
||||
return
|
||||
}
|
||||
|
||||
api_timeline := "https://" + instancereport.endpoint + "/api/v1/timelines/public?limit=40&min_id=" + instancereport.min_id
|
||||
resp, err := http.Get(api_timeline)
|
||||
if err != nil {
|
||||
instanceReportChan <- InstanceReport{instancereport.endpoint, CLIENT_ISSUE, "", 0}
|
||||
return
|
||||
}
|
||||
|
||||
body, err := ioutil.ReadAll(resp.Body)
|
||||
err = json.Unmarshal(body, &newposts)
|
||||
if err != nil {
|
||||
// instanceReportChan <- InstanceReport{instancereport.endpoint, resp.StatusCode, "", 0}
|
||||
instanceReportChan <- InstanceReport{instancereport.endpoint, BAD_RESPONSE, "", 0}
|
||||
return
|
||||
}
|
||||
|
||||
newinstances := make([]string, 0)
|
||||
min_id := ""
|
||||
numposts := 0
|
||||
for _, newpost := range newposts {
|
||||
|
||||
if newpost.Account.Acct == "" {
|
||||
continue
|
||||
}
|
||||
|
||||
posthash := sha1.New()
|
||||
|
||||
at_sign := strings.Index(newpost.Account.Acct, "@")
|
||||
|
||||
if at_sign == -1 {
|
||||
at_sign = len(newpost.Account.Acct)
|
||||
newpost.Account.Acct += "@" + instancereport.endpoint
|
||||
}
|
||||
|
||||
// Calculate the post hash
|
||||
fmt.Fprint(posthash, newpost.Url)
|
||||
fmt.Fprint(posthash, newpost.normalized)
|
||||
fmt.Fprint(posthash, newpost.Account.Acct)
|
||||
fmt.Fprint(posthash, newpost.Account.Display_name)
|
||||
newpost.posthash = posthash.Sum(nil)
|
||||
|
||||
newpost.normalized = html.UnescapeString(strings.ToLower(p.Sanitize(newpost.Content)))
|
||||
|
||||
reportPostChan <- newpost
|
||||
|
||||
// Check min_id
|
||||
if newpost.Id > min_id {
|
||||
min_id = newpost.Id
|
||||
}
|
||||
numposts = numposts + 1
|
||||
|
||||
newinstance := newpost.Account.Acct[at_sign+1:]
|
||||
newinstances = AppendIfMissing(newinstances, newinstance)
|
||||
}
|
||||
|
||||
for _, newinstance := range newinstances {
|
||||
var q InstanceReport
|
||||
q.endpoint = newinstance
|
||||
q.status = NEW_INSTANCE
|
||||
q.min_id = ""
|
||||
q.numposts = 0
|
||||
instanceReportChan <- q
|
||||
}
|
||||
|
||||
instanceReportChan <- InstanceReport{instancereport.endpoint, resp.StatusCode, min_id, numposts}
|
||||
}
|
||||
|
||||
// Change this to return a proper "err"
|
||||
func GetNodeInfo(endpoint string, nodeinfo *NodeInfo) {
|
||||
api_nodeinfo := "https://" + endpoint + "/nodeinfo/2.0.json"
|
||||
http_client := http.Client{Timeout: 5 * time.Second}
|
||||
resp, err := http_client.Get(api_nodeinfo)
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
|
||||
body, err := ioutil.ReadAll(resp.Body)
|
||||
err = json.Unmarshal(body, &nodeinfo)
|
||||
if err != nil {
|
||||
// fmt.Println("Unmarshal 2");
|
||||
return
|
||||
}
|
||||
}
|
||||
|
||||
func NewInstance(endpoint string, runninginstances *[]RunningInstance, instanceReportChan chan InstanceReport, reportPostChan chan ReportPost) {
|
||||
var nodeinfo NodeInfo
|
||||
|
||||
if endpoint == "" {
|
||||
return
|
||||
}
|
||||
|
||||
// No repeats
|
||||
for _, runninginstance := range *runninginstances {
|
||||
if runninginstance.Endpoint == endpoint {
|
||||
return
|
||||
}
|
||||
}
|
||||
|
||||
// Check node type
|
||||
GetNodeInfo(endpoint, &nodeinfo)
|
||||
if nodeinfo.Software.Name == "" {
|
||||
go func() {
|
||||
var q InstanceReport
|
||||
q.endpoint = endpoint
|
||||
q.status = BAD_NODEINFO
|
||||
instanceReportChan <- q
|
||||
return
|
||||
}()
|
||||
}
|
||||
|
||||
newinstance := RunningInstance{endpoint, "", "", NEW_INSTANCE, "Queued"}
|
||||
*runninginstances = append(*runninginstances, newinstance)
|
||||
|
||||
if nodeinfo.Software.Name == "pleroma" || nodeinfo.Software.Name == "mastodon" {
|
||||
var newinstancereport InstanceReport
|
||||
newinstancereport.endpoint = endpoint
|
||||
newinstancereport.status = 0
|
||||
newinstancereport.min_id = ""
|
||||
newinstancereport.numposts = 0
|
||||
go StartInstancePoll(newinstancereport, reportPostChan, instanceReportChan)
|
||||
}
|
||||
}
|
||||
|
||||
func SuspendInstance(suspendinstance InstanceReport, runninginstances *[]RunningInstance) {
|
||||
for i, runninginstance := range *runninginstances {
|
||||
if runninginstance.Endpoint == suspendinstance.endpoint {
|
||||
(*runninginstances)[i].Status = suspendinstance.status
|
||||
(*runninginstances)[i].LastRun = time.Now().Format("2006.01.02-15:04:05")
|
||||
return
|
||||
}
|
||||
}
|
||||
}
|
136
poll/main.go
Normal file
136
poll/main.go
Normal file
@ -0,0 +1,136 @@
|
||||
package main
|
||||
|
||||
import (
|
||||
"github.com/jackc/pgx/pgxpool"
|
||||
_ "net/http/pprof"
|
||||
"net/http"
|
||||
"context"
|
||||
"time"
|
||||
"fmt"
|
||||
"net"
|
||||
"log"
|
||||
"os"
|
||||
)
|
||||
|
||||
func AppendIfMissing(hay []string, needle string) []string {
|
||||
for _, ele := range hay {
|
||||
if ele == needle {
|
||||
return hay
|
||||
}
|
||||
}
|
||||
return append(hay, needle)
|
||||
}
|
||||
|
||||
func writePost(pool *pgxpool.Pool, reportpost ReportPost) {
|
||||
conn, err := pool.Acquire(context.Background())
|
||||
if err != nil {
|
||||
log.Fatal("Error connecting to database:", err)
|
||||
os.Exit(1)
|
||||
}
|
||||
defer conn.Release()
|
||||
|
||||
// Insert new account if new
|
||||
var accountid int
|
||||
err = conn.QueryRow(context.Background(), "INSERT INTO accounts (acct, avatar, bot, created_at, display_name, url) VALUES($1, $2, $3, $4, $5, $6) ON CONFLICT(acct) DO UPDATE SET acct=EXCLUDED.acct RETURNING id", reportpost.Account.Acct, reportpost.Account.Avatar, reportpost.Account.Bot, reportpost.Account.Created_at, reportpost.Account.Display_name, reportpost.Account.Url).Scan(&accountid)
|
||||
if err != nil {
|
||||
fmt.Println("First ", err)
|
||||
fmt.Println("--------------------------")
|
||||
fmt.Println("Reported error: ", err)
|
||||
fmt.Println("Account Acct: ", reportpost.Account.Acct)
|
||||
fmt.Println("Account Avatar: ", reportpost.Account.Avatar)
|
||||
fmt.Println("Account Avatar len: ", len(reportpost.Account.Avatar))
|
||||
fmt.Println("Account Bot: ", reportpost.Account.Bot)
|
||||
fmt.Println("Account Created_at: ", reportpost.Account.Created_at)
|
||||
fmt.Println("Account Display: ", reportpost.Account.Display_name)
|
||||
fmt.Println("Account URL: ", reportpost.Account.Url)
|
||||
fmt.Println(reportpost)
|
||||
fmt.Println("--------------------------")
|
||||
os.Exit(1) // For now I want this to die and learn why it failed
|
||||
return
|
||||
}
|
||||
|
||||
// Insert new post if new
|
||||
_, err = conn.Exec(context.Background(), "INSERT INTO posts (url, content, created_at, normalized, account_id, posthash) VALUES ($1, $2, $3, $4, $5, $6) ON CONFLICT (posthash) DO NOTHING", reportpost.Url, reportpost.Content, reportpost.Created_at, reportpost.normalized, accountid, reportpost.posthash)
|
||||
if err != nil { // For now I want to know why this failed.
|
||||
fmt.Println("Second ", err)
|
||||
fmt.Println("--------------------------")
|
||||
fmt.Println("Reported error: ", err)
|
||||
fmt.Println("Url: ", reportpost.Url)
|
||||
fmt.Println("Content: ", reportpost.Content)
|
||||
fmt.Println("Created_at: ", reportpost.Created_at)
|
||||
fmt.Println("normalized: ", reportpost.normalized)
|
||||
fmt.Println("account_id", accountid)
|
||||
fmt.Println("posthash: ", reportpost.posthash)
|
||||
fmt.Println("--------------------------")
|
||||
os.Exit(1) // For now I want this to die and learn why it failed
|
||||
return
|
||||
}
|
||||
}
|
||||
|
||||
func engine() {
|
||||
|
||||
// Current instances
|
||||
runninginstances := make([]RunningInstance, 0)
|
||||
|
||||
// Initial Setup
|
||||
reportPostChan := make(chan ReportPost, 2000)
|
||||
instanceReportChan := make(chan InstanceReport, 20)
|
||||
|
||||
// Setup Database
|
||||
pool, err := pgxpool.Connect(context.Background(), "postgres://postgres@127.0.0.1/fedilogue")
|
||||
if err != nil {
|
||||
fmt.Fprintln(os.Stderr, "Unable to connect to database:", err)
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
l, err := net.Listen("tcp", "127.0.0.1:5555")
|
||||
if err != nil {
|
||||
fmt.Println(err)
|
||||
return
|
||||
}
|
||||
defer l.Close()
|
||||
|
||||
commandClient := make(chan net.Conn)
|
||||
|
||||
go func(l net.Listener) {
|
||||
for {
|
||||
c, err := l.Accept()
|
||||
if err != nil {
|
||||
fmt.Println("Error on accept")
|
||||
commandClient <- nil
|
||||
return
|
||||
}
|
||||
commandClient <- c
|
||||
}
|
||||
}(l)
|
||||
|
||||
for {
|
||||
select {
|
||||
case c := <-commandClient: // New client connection
|
||||
go handleClient(c, &runninginstances, instanceReportChan)
|
||||
case v := <-reportPostChan: // New Post
|
||||
go writePost(pool, v)
|
||||
case w := <-instanceReportChan: // Start or suspend instance
|
||||
if w.status == NEW_INSTANCE {
|
||||
NewInstance(w.endpoint, &runninginstances, instanceReportChan, reportPostChan)
|
||||
} else if w.status == RUNNING || w.status == TOOMANYREQUESTS {
|
||||
for i, runninginstance := range runninginstances {
|
||||
if runninginstance.Endpoint == w.endpoint {
|
||||
runninginstances[i].Min_id = w.min_id
|
||||
runninginstances[i].Status = w.status
|
||||
runninginstances[i].LastRun = time.Now().Format("2006.01.02-15:04:05")
|
||||
}
|
||||
}
|
||||
go DeferPollRun(w, &runninginstances, instanceReportChan, reportPostChan)
|
||||
} else {
|
||||
SuspendInstance(w, &runninginstances)
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
func main() {
|
||||
go engine()
|
||||
log.Println("serving on port 8080")
|
||||
log.Fatal(http.ListenAndServe(":8080", nil))
|
||||
}
|
Loading…
x
Reference in New Issue
Block a user