Build and release tooling:
- Makefile with help as default; targets: build/build-amd64/build-arm64,
test, lint, proto, pkg-deb, docker, docker-push, clean, plus
install-deps (+ three sub-targets for apt / Go toolchain / Go tools).
- internal/version package; -ldflags -X injects Version/Commit/Date into
every binary. -version flag on all four binaries (nginx-logtail version
for the CLI).
- Dockerfile takes VERSION/COMMIT/DATE build-args and forwards them.
- .deb output lands in build/; .gitignore ignores /build/.
Debian package:
- debian/build-deb.sh packages all four static binaries into a single
nginx-logtail_<ver>_<arch>.deb using dpkg-deb.
- Binary layout: /usr/sbin/nginx-logtail-{collector,aggregator,frontend}
and /usr/bin/nginx-logtail.
- nginx-logtail(8) manpage.
- Three systemd units (collector, aggregator, frontend) shipped under
/lib/systemd/system/. Installed but never enabled or started — the
operator opts in per host.
- Collector runs as _logtail:www-data (log access); aggregator and
frontend as _logtail:_logtail. postinst creates the system user/group
idempotently.
- Single shared env file /etc/default/nginx-logtail rendered from a
template at first install with %HOSTNAME% substituted. Sensible
defaults for every COLLECTOR_*, AGGREGATOR_*, FRONTEND_* variable;
plus COLLECTOR_ARGS / AGGREGATOR_ARGS / FRONTEND_ARGS escape hatches
appended to ExecStart. Not a dpkg conffile: operator edits survive
upgrades and dpkg --purge removes it.
Versioned UDP wire format:
- ParseUDPLine dispatches on a leading "v<N>\t" tag; v1 routes to the
existing 12-field parser. Unknown/missing versions fail closed so
future v2 parsers can land before emitters are upgraded.
- Tests updated; design.md FR-2.2 rewritten to make the version tag
normative.
Docs:
- README.md gains a Quick Start (Debian / Docker Compose / from source).
- user-guide.md rewritten around Installation and Configuration: full
env-var table, UDP-only default explained, precise file/UDP log_format
layouts, note that operators can emit "0" for unknown \$is_tor / \$asn.
- Drilldown cycle, frontend filter table, and CLI --group-by list all
include source_tag. UDP counters documented in the Prometheus section.
Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
160 lines
4.2 KiB
Go
160 lines
4.2 KiB
Go
package main
|
|
|
|
import (
|
|
"fmt"
|
|
"net"
|
|
"strconv"
|
|
"strings"
|
|
)
|
|
|
|
// LogRecord holds the dimensions extracted from a single nginx log line.
|
|
type LogRecord struct {
|
|
Website string
|
|
ClientPrefix string
|
|
URI string
|
|
Status string
|
|
IsTor bool
|
|
ASN int32
|
|
Method string
|
|
BodyBytesSent int64
|
|
RequestTime float64
|
|
SourceTag string
|
|
}
|
|
|
|
// fileSourceTag is the SourceTag assigned to records read from on-disk log
|
|
// files, which pre-date the tag concept. Mirrors nginx's fallback label.
|
|
const fileSourceTag = "direct"
|
|
|
|
// ParseLine parses a tab-separated logtail log line from a file:
|
|
//
|
|
// $host \t $remote_addr \t $msec \t $request_method \t $request_uri \t $status \t $body_bytes_sent \t $request_time \t $is_tor \t $asn
|
|
//
|
|
// The is_tor (field 9) and asn (field 10) fields are optional for backward
|
|
// compatibility with older log files that omit them; they default to false/0
|
|
// when absent. SourceTag is always set to "direct" (file origin has no tag).
|
|
// Returns false for lines with fewer than 8 fields.
|
|
func ParseLine(line string, v4bits, v6bits int) (LogRecord, bool) {
|
|
fields := strings.SplitN(line, "\t", 10)
|
|
if len(fields) < 8 {
|
|
return LogRecord{}, false
|
|
}
|
|
prefix, ok := truncateIP(fields[1], v4bits, v6bits)
|
|
if !ok {
|
|
return LogRecord{}, false
|
|
}
|
|
isTor := len(fields) >= 9 && fields[8] == "1"
|
|
var asn int32
|
|
if len(fields) == 10 {
|
|
if n, err := strconv.ParseInt(fields[9], 10, 32); err == nil {
|
|
asn = int32(n)
|
|
}
|
|
}
|
|
return LogRecord{
|
|
Website: fields[0],
|
|
ClientPrefix: prefix,
|
|
URI: stripQuery(fields[4]),
|
|
Status: fields[5],
|
|
IsTor: isTor,
|
|
ASN: asn,
|
|
Method: fields[3],
|
|
BodyBytesSent: parseInt(fields[6]),
|
|
RequestTime: parseFloat(fields[7]),
|
|
SourceTag: fileSourceTag,
|
|
}, true
|
|
}
|
|
|
|
// ParseUDPLine dispatches on the version prefix emitted by
|
|
// nginx-ipng-stats-plugin's ipng_stats_logtail directive. The wire format is
|
|
// "v<N>\t<payload>", where <payload> is version-specific. Unknown or missing
|
|
// versions return false so operators can roll out a v2 parser before
|
|
// upgrading emitters.
|
|
func ParseUDPLine(line string, v4bits, v6bits int) (LogRecord, bool) {
|
|
i := strings.IndexByte(line, '\t')
|
|
if i < 0 {
|
|
return LogRecord{}, false
|
|
}
|
|
switch line[:i] {
|
|
case "v1":
|
|
return parseUDPLineV1(line[i+1:], v4bits, v6bits)
|
|
default:
|
|
return LogRecord{}, false
|
|
}
|
|
}
|
|
|
|
// parseUDPLineV1 parses the v1 payload (12 tab-separated fields):
|
|
//
|
|
// $host \t $remote_addr \t $request_method \t $request_uri \t $status \t
|
|
// $body_bytes_sent \t $request_time \t $is_tor \t $asn \t
|
|
// $ipng_source_tag \t $server_addr \t $scheme
|
|
//
|
|
// server_addr and scheme are parsed but discarded.
|
|
func parseUDPLineV1(payload string, v4bits, v6bits int) (LogRecord, bool) {
|
|
fields := strings.Split(payload, "\t")
|
|
if len(fields) != 12 {
|
|
return LogRecord{}, false
|
|
}
|
|
prefix, ok := truncateIP(fields[1], v4bits, v6bits)
|
|
if !ok {
|
|
return LogRecord{}, false
|
|
}
|
|
var asn int32
|
|
if n, err := strconv.ParseInt(fields[8], 10, 32); err == nil {
|
|
asn = int32(n)
|
|
}
|
|
return LogRecord{
|
|
Website: fields[0],
|
|
ClientPrefix: prefix,
|
|
URI: stripQuery(fields[3]),
|
|
Status: fields[4],
|
|
IsTor: fields[7] == "1",
|
|
ASN: asn,
|
|
Method: fields[2],
|
|
BodyBytesSent: parseInt(fields[5]),
|
|
RequestTime: parseFloat(fields[6]),
|
|
SourceTag: fields[9],
|
|
}, true
|
|
}
|
|
|
|
func stripQuery(uri string) string {
|
|
if i := strings.IndexByte(uri, '?'); i >= 0 {
|
|
return uri[:i]
|
|
}
|
|
return uri
|
|
}
|
|
|
|
func parseInt(s string) int64 {
|
|
n, _ := strconv.ParseInt(s, 10, 64)
|
|
return n
|
|
}
|
|
|
|
func parseFloat(s string) float64 {
|
|
f, _ := strconv.ParseFloat(s, 64)
|
|
return f
|
|
}
|
|
|
|
// truncateIP masks addr to the given prefix length depending on IP version.
|
|
// Returns the CIDR string (e.g. "1.2.3.0/24") and true on success.
|
|
func truncateIP(addr string, v4bits, v6bits int) (string, bool) {
|
|
ip := net.ParseIP(addr)
|
|
if ip == nil {
|
|
return "", false
|
|
}
|
|
|
|
var bits int
|
|
if ip.To4() != nil {
|
|
ip = ip.To4()
|
|
bits = v4bits
|
|
} else {
|
|
ip = ip.To16()
|
|
bits = v6bits
|
|
}
|
|
|
|
mask := net.CIDRMask(bits, len(ip)*8)
|
|
masked := make(net.IP, len(ip))
|
|
for i := range ip {
|
|
masked[i] = ip[i] & mask[i]
|
|
}
|
|
|
|
return fmt.Sprintf("%s/%d", masked.String(), bits), true
|
|
}
|