summaryrefslogtreecommitdiff
path: root/lex-fetch/at/at.go
blob: 44efb27c40705ca53e467efc8d01263c734b6d51 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
package at

import (
	"encoding/json"
	"fmt"
	"log/slog"
	"maps"
	"math"
	"net/http"
	"net/url"
	"slices"
	"strconv"
	"strings"
	"sync"
	"time"

	"push-f.com/lex-surf/internal/lex"
	"push-f.com/lex-surf/lex-fetch/progress"
)

// Fetcher retrieves the list of consolidated Austrian federal laws from the
// RIS OGD API. It has no fields, so the zero value is ready to use.
type Fetcher struct{}

// concurrentRequests is the capacity of the semaphore used by Fetch, i.e. the
// maximum number of page requests that are in flight at the same time.
const concurrentRequests = 4

// Fetch downloads every result page of the consolidated federal law search for
// today's date and returns one lex.Law per distinct Gesetzesnummer, sorted by
// title.
//
// The first page is fetched synchronously to learn the total number of hits;
// the remaining pages are fetched by at most concurrentRequests goroutines at
// a time. Fetch always waits for all started goroutines before returning. If
// any page fails, no further pages are started and the first recorded error is
// returned together with its page number.
//
// progress.Total is set to the number of pages and progress.ReportProgress is
// called from the worker goroutines once per fetched page.
func (s *Fetcher) Fetch(log *slog.Logger, client *http.Client, progress *progress.Reporter) ([]lex.Law, error) {
	// The API is documented in https://data.bka.gv.at/ris/ogd/v2.6/Documents/Dokumentation_OGD-RIS_API.pdf.

	// Consolidated laws can only be queried via the Bundesrecht endpoint which returns individual paragraphs.
	// Since we'll get multiple results for each law, we're saving results into a hash map.
	lawsMap := make(map[string]lex.Law)

	// TODO: also query laws from the past and future
	date := time.Now().Format("2006-01-02")

	data, err := fetchPage(client, date, 1)
	if err != nil {
		return nil, fmt.Errorf("failed to fetch first page: %w", err)
	}
	if data == nil {
		return nil, fmt.Errorf("first page contains no document results")
	}
	totalResults, err := strconv.Atoi(data.Hits.Text)
	if err != nil {
		return nil, fmt.Errorf("failed to parse hit count %q: %w", data.Hits.Text, err)
	}
	if totalResults <= 0 {
		return nil, fmt.Errorf("API returned 0 results")
	}
	// Every request asks for 100 documents per page.
	totalPages := int(math.Ceil(float64(totalResults) / 100))
	progress.Total = totalPages
	assign(lawsMap, data.OgdDocumentReference)

	semaphore := make(chan struct{}, concurrentRequests)
	var (
		wg sync.WaitGroup
		// mu guards lawsMap, retErr and retErrPage while workers are running.
		mu         sync.Mutex
		retErr     error
		retErrPage int
	)
	failed := func() bool {
		mu.Lock()
		defer mu.Unlock()
		return retErr != nil
	}

	for page := 2; page <= totalPages; page++ {
		// Acquiring the slot first means a worker has just finished (or
		// capacity was free), so the failure check below sees its outcome.
		semaphore <- struct{}{}
		if failed() {
			<-semaphore
			break
		}
		wg.Add(1)

		go func(p int) {
			defer wg.Done()
			defer func() { <-semaphore }()

			data, err := fetchPage(client, date, p)
			progress.ReportProgress(p)
			if err == nil && data == nil {
				err = fmt.Errorf("page contains no document results")
			}

			mu.Lock()
			defer mu.Unlock()
			if err != nil {
				// Only the first failure is kept.
				if retErr == nil {
					retErr, retErrPage = err, p
				}
				return
			}
			assign(lawsMap, data.OgdDocumentReference)
		}(page)
	}

	// All writers must be done before the map is read or the error inspected.
	wg.Wait()
	if retErr != nil {
		return nil, fmt.Errorf("failed to fetch page %d: %w", retErrPage, retErr)
	}

	laws := slices.SortedFunc(maps.Values(lawsMap), func(a, b lex.Law) int {
		return strings.Compare(a.Title, b.Title)
	})
	return laws, nil
}

// fetchPage requests one result page (100 documents per page) of consolidated
// federal laws of type "BG oder BVG" in the version valid on date and returns
// the decoded document results.
//
// page is the 1-based page number sent as Seitennummer; date is sent verbatim
// as FassungVom. An error is returned when the request cannot be built or
// sent, the status code is not 200, the body is not valid JSON, the API
// reports an error object, or the response carries no document results. On
// success the returned pointer is never nil.
func fetchPage(client *http.Client, date string, page int) (*ogdDocumentResults, error) {
	req, err := http.NewRequest(http.MethodGet, "https://data.bka.gv.at/ris/api/v2.6/Bundesrecht", nil)
	if err != nil {
		return nil, fmt.Errorf("build request: %w", err)
	}
	req.URL.RawQuery = url.Values{
		"Appl":              {"BrKons"},      // Bundesrecht konsolidiert
		"Typ":               {"BG oder BVG"}, // Bundesgesetz or Bundesverfassungsgesetz
		"DokumenteProSeite": {"OneHundred"},
		"Seitennummer":      {strconv.Itoa(page)},
		"FassungVom":        {date},
	}.Encode()
	resp, err := client.Do(req)
	if err != nil {
		return nil, fmt.Errorf("send request: %w", err)
	}
	// The body must be closed on every path so the connection is released.
	defer resp.Body.Close()

	if resp.StatusCode != http.StatusOK {
		return nil, fmt.Errorf("unexpected status code %d", resp.StatusCode)
	}

	var data brKonsResult
	if err := json.NewDecoder(resp.Body).Decode(&data); err != nil {
		return nil, fmt.Errorf("JSON decode: %w", err)
	}

	result := data.OgdSearchResult
	if result.Error != nil {
		return nil, fmt.Errorf("error response: %s: %s", result.Error.Applikation, result.Error.Message)
	}
	// Guard against a response that has neither an error nor results, so
	// callers never receive a nil result together with a nil error.
	if result.OgdDocumentResults == nil {
		return nil, fmt.Errorf("response contains no document results")
	}

	return result.OgdDocumentResults, nil
}

// assign stores one lex.Law per paragraph document in laws, keyed by the
// document's Gesetzesnummer; a later document with the same number overwrites
// the earlier entry.
//
// When the document carries an abbreviation it is copied to Abbr, and Redir is
// derived from it by lower-casing and then applying the substitutions below
// one after another: parentheses are dropped, separators become hyphens, and
// umlauts and ß are transliterated.
func assign(laws map[string]lex.Law, paraDocs []document) {
	// Order matters: each substitution runs over the output of the previous one.
	substitutions := [...][2]string{
		{")", ""},
		{"(", ""},
		{" – ", "-"},
		{" ", "-"},
		{"\u00A0", "-"},
		{"ä", "ae"},
		{"ü", "ue"},
		{"ö", "oe"},
		{"ß", "ss"},
	}

	for i := range paraDocs {
		meta := &paraDocs[i].Data.Metadaten.Bundesrecht
		entry := lex.Law{
			Title: meta.Kurztitel,
			URL:   meta.BrKons.GesamteRechtsvorschriftUrl,
		}
		if abbr := meta.BrKons.Abkuerzung; abbr != nil {
			entry.Abbr = *abbr
			slug := strings.ToLower(*abbr)
			for _, sub := range substitutions {
				slug = strings.ReplaceAll(slug, sub[0], sub[1])
			}
			entry.Redir = slug
		}
		laws[meta.BrKons.Gesetzesnummer] = entry
	}
}

// brKonsResult is the top-level JSON object that fetchPage decodes from the
// Bundesrecht endpoint response.
type brKonsResult struct {
	OgdSearchResult struct {
		// Error is non-nil when the response contains an error object;
		// fetchPage turns that into a Go error.
		Error *struct {
			Applikation string
			Message     string
		}
		// OgdDocumentResults holds the search hits; it stays nil when the
		// response does not contain that key.
		OgdDocumentResults *ogdDocumentResults
	}
}

// ogdDocumentResults is the result part of a search response: the hit count
// and the documents of one page.
type ogdDocumentResults struct {
	Hits struct {
		// Text is decoded from the "#text" key; Fetch parses it as the total
		// number of results across all pages.
		Text string `json:"#text"`
	}
	// OgdDocumentReference lists the documents contained in this page.
	OgdDocumentReference []document
}

// document is a single search hit. Per the comment in Fetch, the endpoint
// returns individual paragraphs, so several documents can refer to the same
// law; only the fields read by assign are declared.
type document struct {
	Data struct {
		Metadaten struct {
			Bundesrecht struct {
				// Kurztitel is used as the law's title.
				Kurztitel string
				BrKons    struct {
					// GesamteRechtsvorschriftUrl is used as the law's URL.
					GesamteRechtsvorschriftUrl string
					// Abkuerzung is the optional abbreviation; nil when absent.
					Abkuerzung                 *string
					// Gesetzesnummer is the key under which assign stores the law.
					Gesetzesnummer             string
				}
			}
		}
	}
}