c74c94d616
We are not using them anymore. The only nettest still using the legacy netx implementation is tor, for which setting these fields is useless, because it performs each measurement into a separate goroutine. Hence, let us start removing this part of the legacy netx codebase, which is hampering progress in other areas. Occurred to me while doing testing for the recent changes in error mapping (https://github.com/ooni/probe/issues/1505).
483 lines
14 KiB
Go
483 lines
14 KiB
Go
// Package oonidatamodel contains the OONI data model.
|
|
//
|
|
// The input of this package is data generated by netx and the
|
|
// output is a format consistent with OONI specs.
|
|
//
|
|
// Deprecated by the archival package.
|
|
package oonidatamodel
|
|
|
|
import (
|
|
"encoding/base64"
|
|
"encoding/json"
|
|
"errors"
|
|
"net"
|
|
"net/http"
|
|
"strconv"
|
|
"strings"
|
|
"unicode/utf8"
|
|
|
|
"github.com/ooni/probe-cli/v3/internal/engine/legacy/netx/modelx"
|
|
"github.com/ooni/probe-cli/v3/internal/engine/legacy/oonitemplates"
|
|
"github.com/ooni/probe-cli/v3/internal/engine/model"
|
|
"github.com/ooni/probe-cli/v3/internal/engine/netx/errorx"
|
|
"github.com/ooni/probe-cli/v3/internal/engine/netx/tlsx"
|
|
)
|
|
|
|
// ExtSpec describes a data format extension
|
|
type ExtSpec struct {
|
|
Name string // extension name
|
|
V int64 // extension version
|
|
}
|
|
|
|
// AddTo adds the current ExtSpec to the specified measurement
|
|
func (spec ExtSpec) AddTo(m *model.Measurement) {
|
|
if m.Extensions == nil {
|
|
m.Extensions = make(map[string]int64)
|
|
}
|
|
m.Extensions[spec.Name] = spec.V
|
|
}
|
|
|
|
var (
|
|
// ExtDNS is the version of df-002-dnst.md
|
|
ExtDNS = ExtSpec{Name: "dnst", V: 0}
|
|
|
|
// ExtNetevents is the version of df-008-netevents.md
|
|
ExtNetevents = ExtSpec{Name: "netevents", V: 0}
|
|
|
|
// ExtHTTP is the version of df-001-httpt.md
|
|
ExtHTTP = ExtSpec{Name: "httpt", V: 0}
|
|
|
|
// ExtTCPConnect is the version of df-005-tcpconnect.md
|
|
ExtTCPConnect = ExtSpec{Name: "tcpconnect", V: 0}
|
|
|
|
// ExtTLSHandshake is the version of df-006-tlshandshake.md
|
|
ExtTLSHandshake = ExtSpec{Name: "tlshandshake", V: 0}
|
|
)
|
|
|
|
// TCPConnectStatus contains the TCP connect status.
|
|
type TCPConnectStatus struct {
|
|
Failure *string `json:"failure"`
|
|
Success bool `json:"success"`
|
|
}
|
|
|
|
// TCPConnectEntry contains one of the entries that are part
|
|
// of the "tcp_connect" key of a OONI report.
|
|
type TCPConnectEntry struct {
|
|
IP string `json:"ip"`
|
|
Port int `json:"port"`
|
|
Status TCPConnectStatus `json:"status"`
|
|
T float64 `json:"t"`
|
|
}
|
|
|
|
// TCPConnectList is a list of TCPConnectEntry
|
|
type TCPConnectList []TCPConnectEntry
|
|
|
|
// NewTCPConnectList creates a new TCPConnectList
|
|
func NewTCPConnectList(results oonitemplates.Results) TCPConnectList {
|
|
var out TCPConnectList
|
|
for _, connect := range results.Connects {
|
|
// We assume Go is passing us legit data structs
|
|
ip, sport, _ := net.SplitHostPort(connect.RemoteAddress)
|
|
iport, _ := strconv.Atoi(sport)
|
|
out = append(out, TCPConnectEntry{
|
|
IP: ip,
|
|
Port: iport,
|
|
Status: TCPConnectStatus{
|
|
Failure: makeFailure(connect.Error),
|
|
Success: connect.Error == nil,
|
|
},
|
|
T: connect.DurationSinceBeginning.Seconds(),
|
|
})
|
|
}
|
|
return out
|
|
}
|
|
|
|
func makeFailure(err error) (s *string) {
|
|
if err != nil {
|
|
serio := err.Error()
|
|
s = &serio
|
|
}
|
|
return
|
|
}
|
|
|
|
// HTTPTor contains Tor information
|
|
type HTTPTor struct {
|
|
ExitIP *string `json:"exit_ip"`
|
|
ExitName *string `json:"exit_name"`
|
|
IsTor bool `json:"is_tor"`
|
|
}
|
|
|
|
// MaybeBinaryValue is a possibly binary string. We use this helper class
|
|
// to define a custom JSON encoder that allows us to choose the proper
|
|
// representation depending on whether the Value field is valid UTF-8 or not.
|
|
type MaybeBinaryValue struct {
|
|
Value string
|
|
}
|
|
|
|
// MarshalJSON marshals a string-like to JSON following the OONI spec that
|
|
// says that UTF-8 content is represened as string and non-UTF-8 content is
|
|
// instead represented using `{"format":"base64","data":"..."}`.
|
|
func (hb MaybeBinaryValue) MarshalJSON() ([]byte, error) {
|
|
if utf8.ValidString(hb.Value) {
|
|
return json.Marshal(hb.Value)
|
|
}
|
|
er := make(map[string]string)
|
|
er["format"] = "base64"
|
|
er["data"] = base64.StdEncoding.EncodeToString([]byte(hb.Value))
|
|
return json.Marshal(er)
|
|
}
|
|
|
|
// UnmarshalJSON is the opposite of MarshalJSON.
|
|
func (hb *MaybeBinaryValue) UnmarshalJSON(d []byte) error {
|
|
if err := json.Unmarshal(d, &hb.Value); err == nil {
|
|
return nil
|
|
}
|
|
er := make(map[string]string)
|
|
if err := json.Unmarshal(d, &er); err != nil {
|
|
return err
|
|
}
|
|
if v, ok := er["format"]; !ok || v != "base64" {
|
|
return errors.New("missing or invalid format field")
|
|
}
|
|
if _, ok := er["data"]; !ok {
|
|
return errors.New("missing data field")
|
|
}
|
|
b64, err := base64.StdEncoding.DecodeString(er["data"])
|
|
if err != nil {
|
|
return err
|
|
}
|
|
hb.Value = string(b64)
|
|
return nil
|
|
}
|
|
|
|
// HTTPBody is an HTTP body. As an implementation note, this type must be
|
|
// an alias for the MaybeBinaryValue type, otherwise the specific serialisation
|
|
// mechanism implemented by MaybeBinaryValue is not working.
|
|
type HTTPBody = MaybeBinaryValue
|
|
|
|
// HTTPHeaders contains HTTP headers. This headers representation is
|
|
// deprecated in favour of HTTPHeadersList since data format 0.3.0.
|
|
type HTTPHeaders map[string]MaybeBinaryValue
|
|
|
|
// HTTPHeader is a single HTTP header.
|
|
type HTTPHeader struct {
|
|
Key string
|
|
Value MaybeBinaryValue
|
|
}
|
|
|
|
// MarshalJSON marshals a single HTTP header to a tuple where the first
|
|
// element is a string and the second element is maybe-binary data.
|
|
func (hh HTTPHeader) MarshalJSON() ([]byte, error) {
|
|
if utf8.ValidString(hh.Value.Value) {
|
|
return json.Marshal([]string{hh.Key, hh.Value.Value})
|
|
}
|
|
value := make(map[string]string)
|
|
value["format"] = "base64"
|
|
value["data"] = base64.StdEncoding.EncodeToString([]byte(hh.Value.Value))
|
|
return json.Marshal([]interface{}{hh.Key, value})
|
|
}
|
|
|
|
// UnmarshalJSON is the opposite of MarshalJSON.
|
|
func (hh *HTTPHeader) UnmarshalJSON(d []byte) error {
|
|
var pair []interface{}
|
|
if err := json.Unmarshal(d, &pair); err != nil {
|
|
return err
|
|
}
|
|
if len(pair) != 2 {
|
|
return errors.New("unexpected pair length")
|
|
}
|
|
key, ok := pair[0].(string)
|
|
if !ok {
|
|
return errors.New("the key is not a string")
|
|
}
|
|
value, ok := pair[1].(string)
|
|
if !ok {
|
|
mapvalue, ok := pair[1].(map[string]interface{})
|
|
if !ok {
|
|
return errors.New("the value is neither a string nor a map[string]interface{}")
|
|
}
|
|
if _, ok := mapvalue["format"]; !ok {
|
|
return errors.New("missing format")
|
|
}
|
|
if v, ok := mapvalue["format"].(string); !ok || v != "base64" {
|
|
return errors.New("invalid format")
|
|
}
|
|
if _, ok := mapvalue["data"]; !ok {
|
|
return errors.New("missing data field")
|
|
}
|
|
v, ok := mapvalue["data"].(string)
|
|
if !ok {
|
|
return errors.New("the data field is not a string")
|
|
}
|
|
b64, err := base64.StdEncoding.DecodeString(v)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
value = string(b64)
|
|
}
|
|
hh.Key, hh.Value = key, MaybeBinaryValue{Value: value}
|
|
return nil
|
|
}
|
|
|
|
// HTTPHeadersList is a list of headers.
|
|
type HTTPHeadersList []HTTPHeader
|
|
|
|
// HTTPRequest contains an HTTP request.
|
|
//
|
|
// Headers are a map in Web Connectivity data format but
|
|
// we have added support for a list since data format version
|
|
// equal to 0.2.1 (later renamed to 0.3.0).
|
|
type HTTPRequest struct {
|
|
Body HTTPBody `json:"body"`
|
|
BodyIsTruncated bool `json:"body_is_truncated"`
|
|
HeadersList HTTPHeadersList `json:"headers_list"`
|
|
Headers HTTPHeaders `json:"headers"`
|
|
Method string `json:"method"`
|
|
Tor HTTPTor `json:"tor"`
|
|
URL string `json:"url"`
|
|
}
|
|
|
|
// HTTPResponse contains an HTTP response.
|
|
//
|
|
// Headers are a map in Web Connectivity data format but
|
|
// we have added support for a list since data format version
|
|
// equal to 0.2.1 (later renamed to 0.3.0).
|
|
type HTTPResponse struct {
|
|
Body HTTPBody `json:"body"`
|
|
BodyIsTruncated bool `json:"body_is_truncated"`
|
|
Code int64 `json:"code"`
|
|
HeadersList HTTPHeadersList `json:"headers_list"`
|
|
Headers HTTPHeaders `json:"headers"`
|
|
}
|
|
|
|
// RequestEntry is one of the entries that are part of
|
|
// the "requests" key of a OONI report.
|
|
type RequestEntry struct {
|
|
Failure *string `json:"failure"`
|
|
Request HTTPRequest `json:"request"`
|
|
Response HTTPResponse `json:"response"`
|
|
}
|
|
|
|
// RequestList is a list of RequestEntry
|
|
type RequestList []RequestEntry
|
|
|
|
func addheaders(
|
|
source http.Header,
|
|
destList *HTTPHeadersList,
|
|
destMap *HTTPHeaders,
|
|
) {
|
|
for key, values := range source {
|
|
for index, value := range values {
|
|
value := MaybeBinaryValue{Value: value}
|
|
// With the map representation we can only represent a single
|
|
// value for every key. Hence the list representation.
|
|
if index == 0 {
|
|
(*destMap)[key] = value
|
|
}
|
|
*destList = append(*destList, HTTPHeader{
|
|
Key: key,
|
|
Value: value,
|
|
})
|
|
}
|
|
}
|
|
}
|
|
|
|
// NewRequestList returns the list for "requests"
|
|
func NewRequestList(results oonitemplates.Results) RequestList {
|
|
var out RequestList
|
|
in := results.HTTPRequests
|
|
// OONI's data format wants more recent request first
|
|
for idx := len(in) - 1; idx >= 0; idx-- {
|
|
var entry RequestEntry
|
|
entry.Failure = makeFailure(in[idx].Error)
|
|
entry.Request.Headers = make(HTTPHeaders)
|
|
addheaders(
|
|
in[idx].RequestHeaders, &entry.Request.HeadersList,
|
|
&entry.Request.Headers,
|
|
)
|
|
entry.Request.Method = in[idx].RequestMethod
|
|
entry.Request.URL = in[idx].RequestURL
|
|
entry.Request.Body.Value = string(in[idx].RequestBodySnap)
|
|
entry.Request.BodyIsTruncated = in[idx].MaxBodySnapSize > 0 &&
|
|
int64(len(in[idx].RequestBodySnap)) >= in[idx].MaxBodySnapSize
|
|
entry.Response.Headers = make(HTTPHeaders)
|
|
addheaders(
|
|
in[idx].ResponseHeaders, &entry.Response.HeadersList,
|
|
&entry.Response.Headers,
|
|
)
|
|
entry.Response.Code = in[idx].ResponseStatusCode
|
|
entry.Response.Body.Value = string(in[idx].ResponseBodySnap)
|
|
entry.Response.BodyIsTruncated = in[idx].MaxBodySnapSize > 0 &&
|
|
int64(len(in[idx].ResponseBodySnap)) >= in[idx].MaxBodySnapSize
|
|
out = append(out, entry)
|
|
}
|
|
return out
|
|
}
|
|
|
|
// DNSAnswerEntry is the answer to a DNS query
|
|
type DNSAnswerEntry struct {
|
|
AnswerType string `json:"answer_type"`
|
|
Hostname string `json:"hostname,omitempty"`
|
|
IPv4 string `json:"ipv4,omitempty"`
|
|
IPv6 string `json:"ipv6,omitempty"`
|
|
TTL *uint32 `json:"ttl"`
|
|
}
|
|
|
|
// DNSQueryEntry is a DNS query with possibly an answer
|
|
type DNSQueryEntry struct {
|
|
Answers []DNSAnswerEntry `json:"answers"`
|
|
Engine string `json:"engine"`
|
|
Failure *string `json:"failure"`
|
|
Hostname string `json:"hostname"`
|
|
QueryType string `json:"query_type"`
|
|
ResolverHostname *string `json:"resolver_hostname"`
|
|
ResolverPort *string `json:"resolver_port"`
|
|
ResolverAddress string `json:"resolver_address"`
|
|
T float64 `json:"t"`
|
|
}
|
|
|
|
type (
|
|
// DNSQueriesList is a list of DNS queries
|
|
DNSQueriesList []DNSQueryEntry
|
|
dnsQueryType string
|
|
)
|
|
|
|
// NewDNSQueriesList returns a list of DNS queries.
|
|
func NewDNSQueriesList(results oonitemplates.Results) DNSQueriesList {
|
|
// TODO(bassosimone): add support for CNAME lookups.
|
|
var out DNSQueriesList
|
|
for _, resolve := range results.Resolves {
|
|
for _, qtype := range []dnsQueryType{"A", "AAAA"} {
|
|
entry := qtype.makequeryentry(resolve)
|
|
for _, addr := range resolve.Addresses {
|
|
if qtype.ipoftype(addr) {
|
|
entry.Answers = append(entry.Answers, qtype.makeanswerentry(addr))
|
|
}
|
|
}
|
|
out = append(out, entry)
|
|
}
|
|
}
|
|
return out
|
|
}
|
|
|
|
func (qtype dnsQueryType) ipoftype(addr string) bool {
|
|
switch qtype {
|
|
case "A":
|
|
return strings.Contains(addr, ":") == false
|
|
case "AAAA":
|
|
return strings.Contains(addr, ":") == true
|
|
}
|
|
return false
|
|
}
|
|
|
|
func (qtype dnsQueryType) makeanswerentry(addr string) DNSAnswerEntry {
|
|
answer := DNSAnswerEntry{AnswerType: string(qtype)}
|
|
switch qtype {
|
|
case "A":
|
|
answer.IPv4 = addr
|
|
case "AAAA":
|
|
answer.IPv6 = addr
|
|
}
|
|
return answer
|
|
}
|
|
|
|
func (qtype dnsQueryType) makequeryentry(resolve *modelx.ResolveDoneEvent) DNSQueryEntry {
|
|
return DNSQueryEntry{
|
|
Engine: resolve.TransportNetwork,
|
|
Failure: makeFailure(resolve.Error),
|
|
Hostname: resolve.Hostname,
|
|
QueryType: string(qtype),
|
|
ResolverAddress: resolve.TransportAddress,
|
|
T: resolve.DurationSinceBeginning.Seconds(),
|
|
}
|
|
}
|
|
|
|
// NetworkEvent is a network event.
|
|
type NetworkEvent struct {
|
|
Address string `json:"address,omitempty"`
|
|
Failure *string `json:"failure"`
|
|
NumBytes int64 `json:"num_bytes,omitempty"`
|
|
Operation string `json:"operation"`
|
|
Proto string `json:"proto"`
|
|
T float64 `json:"t"`
|
|
}
|
|
|
|
// NetworkEventsList is a list of network events.
|
|
type NetworkEventsList []*NetworkEvent
|
|
|
|
var protocolName = map[bool]string{
|
|
true: "tcp",
|
|
false: "udp",
|
|
}
|
|
|
|
// NewNetworkEventsList returns a list of DNS queries.
|
|
func NewNetworkEventsList(results oonitemplates.Results) NetworkEventsList {
|
|
var out NetworkEventsList
|
|
for _, in := range results.NetworkEvents {
|
|
if in.Connect != nil {
|
|
out = append(out, &NetworkEvent{
|
|
Address: in.Connect.RemoteAddress,
|
|
Failure: makeFailure(in.Connect.Error),
|
|
Operation: errorx.ConnectOperation,
|
|
T: in.Connect.DurationSinceBeginning.Seconds(),
|
|
})
|
|
// fallthrough
|
|
}
|
|
if in.Read != nil {
|
|
out = append(out, &NetworkEvent{
|
|
Failure: makeFailure(in.Read.Error),
|
|
Operation: errorx.ReadOperation,
|
|
NumBytes: in.Read.NumBytes,
|
|
T: in.Read.DurationSinceBeginning.Seconds(),
|
|
})
|
|
// fallthrough
|
|
}
|
|
if in.Write != nil {
|
|
out = append(out, &NetworkEvent{
|
|
Failure: makeFailure(in.Write.Error),
|
|
Operation: errorx.WriteOperation,
|
|
NumBytes: in.Write.NumBytes,
|
|
T: in.Write.DurationSinceBeginning.Seconds(),
|
|
})
|
|
// fallthrough
|
|
}
|
|
}
|
|
return out
|
|
}
|
|
|
|
// TLSHandshake contains TLS handshake data
|
|
type TLSHandshake struct {
|
|
CipherSuite string `json:"cipher_suite"`
|
|
Failure *string `json:"failure"`
|
|
NegotiatedProtocol string `json:"negotiated_protocol"`
|
|
PeerCertificates []MaybeBinaryValue `json:"peer_certificates"`
|
|
T float64 `json:"t"`
|
|
TLSVersion string `json:"tls_version"`
|
|
}
|
|
|
|
// TLSHandshakesList is a list of TLS handshakes
|
|
type TLSHandshakesList []TLSHandshake
|
|
|
|
// NewTLSHandshakesList creates a new TLSHandshakesList
|
|
func NewTLSHandshakesList(results oonitemplates.Results) TLSHandshakesList {
|
|
var out TLSHandshakesList
|
|
for _, in := range results.TLSHandshakes {
|
|
out = append(out, TLSHandshake{
|
|
CipherSuite: tlsx.CipherSuiteString(in.ConnectionState.CipherSuite),
|
|
Failure: makeFailure(in.Error),
|
|
NegotiatedProtocol: in.ConnectionState.NegotiatedProtocol,
|
|
PeerCertificates: makePeerCerts(in.ConnectionState.PeerCertificates),
|
|
T: in.DurationSinceBeginning.Seconds(),
|
|
TLSVersion: tlsx.VersionString(in.ConnectionState.Version),
|
|
})
|
|
}
|
|
return out
|
|
}
|
|
|
|
func makePeerCerts(in []modelx.X509Certificate) (out []MaybeBinaryValue) {
|
|
for _, e := range in {
|
|
out = append(out, MaybeBinaryValue{Value: string(e.Data)})
|
|
}
|
|
return
|
|
}
|