2021-02-02 12:05:47 +01:00
|
|
|
package webconnectivity
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"errors"
|
|
|
|
"net"
|
|
|
|
"net/url"
|
|
|
|
"strconv"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/ooni/probe-cli/v3/internal/engine/experiment/webconnectivity/internal"
|
|
|
|
"github.com/ooni/probe-cli/v3/internal/engine/netx/archival"
|
2022-01-03 13:53:23 +01:00
|
|
|
"github.com/ooni/probe-cli/v3/internal/model"
|
2021-02-02 12:05:47 +01:00
|
|
|
)
|
|
|
|
|
|
|
|
const (
	// testName is the name reported by Measurer.ExperimentName.
	testName = "web_connectivity"

	// testVersion is the version reported by Measurer.ExperimentVersion.
	testVersion = "0.4.1"
)
|
|
|
|
|
|
|
|
// Config holds the settings of the experiment. It currently
// declares no fields.
type Config struct{}
|
|
|
|
|
|
|
|
// TestKeys contains webconnectivity test keys.
|
|
|
|
type TestKeys struct {
|
|
|
|
Agent string `json:"agent"`
|
|
|
|
ClientResolver string `json:"client_resolver"`
|
|
|
|
Retries *int64 `json:"retries"` // unused
|
|
|
|
SOCKSProxy *string `json:"socksproxy"` // unused
|
|
|
|
|
2021-03-23 16:46:46 +01:00
|
|
|
// For now mostly TCP/TLS "connect" experiment but we are
|
|
|
|
// considering adding more events. An open question is
|
|
|
|
// currently how to properly tag these events so that it
|
|
|
|
// is rather obvious where they come from.
|
|
|
|
//
|
|
|
|
// See https://github.com/ooni/probe/issues/1413.
|
|
|
|
NetworkEvents []archival.NetworkEvent `json:"network_events"`
|
|
|
|
TLSHandshakes []archival.TLSHandshake `json:"tls_handshakes"`
|
|
|
|
|
2021-02-02 12:05:47 +01:00
|
|
|
// DNS experiment
|
|
|
|
Queries []archival.DNSQueryEntry `json:"queries"`
|
|
|
|
DNSExperimentFailure *string `json:"dns_experiment_failure"`
|
|
|
|
DNSAnalysisResult
|
|
|
|
|
|
|
|
// Control experiment
|
|
|
|
ControlFailure *string `json:"control_failure"`
|
|
|
|
ControlRequest ControlRequest `json:"-"`
|
|
|
|
Control ControlResponse `json:"control"`
|
|
|
|
|
2021-03-23 16:46:46 +01:00
|
|
|
// TCP/TLS "connect" experiment
|
2021-02-02 12:05:47 +01:00
|
|
|
TCPConnect []archival.TCPConnectEntry `json:"tcp_connect"`
|
|
|
|
TCPConnectSuccesses int `json:"-"`
|
|
|
|
TCPConnectAttempts int `json:"-"`
|
|
|
|
|
|
|
|
// HTTP experiment
|
|
|
|
Requests []archival.RequestEntry `json:"requests"`
|
|
|
|
HTTPExperimentFailure *string `json:"http_experiment_failure"`
|
|
|
|
HTTPAnalysisResult
|
|
|
|
|
|
|
|
// Top-level analysis
|
|
|
|
Summary
|
2021-10-05 12:52:19 +02:00
|
|
|
|
|
|
|
// DNSRuntime is the time to run all DNS checks.
|
|
|
|
DNSRuntime time.Duration `json:"x_dns_runtime"`
|
|
|
|
|
|
|
|
// THRuntime is the total time to invoke all test helpers.
|
|
|
|
THRuntime time.Duration `json:"x_th_runtime"`
|
|
|
|
|
|
|
|
// TCPTLSRuntime is the total time to perform TCP/TLS "connects".
|
|
|
|
TCPTLSRuntime time.Duration `json:"x_tcptls_runtime"`
|
|
|
|
|
|
|
|
// HTTPRuntime is the total time to perform the HTTP GET.
|
|
|
|
HTTPRuntime time.Duration `json:"x_http_runtime"`
|
2021-02-02 12:05:47 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// Measurer performs the measurement.
|
|
|
|
type Measurer struct {
|
|
|
|
Config Config
|
|
|
|
}
|
|
|
|
|
|
|
|
// NewExperimentMeasurer creates a new ExperimentMeasurer.
|
|
|
|
func NewExperimentMeasurer(config Config) model.ExperimentMeasurer {
|
|
|
|
return Measurer{Config: config}
|
|
|
|
}
|
|
|
|
|
|
|
|
// ExperimentName implements ExperimentMeasurer.ExperExperimentName.
|
|
|
|
func (m Measurer) ExperimentName() string {
|
|
|
|
return testName
|
|
|
|
}
|
|
|
|
|
|
|
|
// ExperimentVersion implements ExperimentMeasurer.ExperExperimentVersion.
|
|
|
|
func (m Measurer) ExperimentVersion() string {
|
|
|
|
return testVersion
|
|
|
|
}
|
|
|
|
|
|
|
|
var (
	// ErrNoAvailableTestHelpers is returned when there are no
	// available test helpers.
	ErrNoAvailableTestHelpers = errors.New("no available helpers")

	// ErrNoInput is returned when no input was provided.
	ErrNoInput = errors.New("no input provided")

	// ErrInputIsNotAnURL is returned when the input is not a URL.
	ErrInputIsNotAnURL = errors.New("input is not an URL")

	// ErrUnsupportedInput is returned when the scheme of the input
	// URL is unsupported.
	ErrUnsupportedInput = errors.New("unsupported input scheme")
)
|
|
|
|
|
2021-03-23 16:46:46 +01:00
|
|
|
// Tags identifying the section of this experiment in which a
// given piece of data has been collected.
const (
	// DNSExperimentTag marks data collected by the DNS experiment.
	DNSExperimentTag = "dns_experiment"

	// TCPTLSExperimentTag marks data collected by the TCP/TLS
	// connect experiment.
	TCPTLSExperimentTag = "tcptls_experiment"

	// HTTPExperimentTag marks data collected by the HTTP experiment.
	HTTPExperimentTag = "http_experiment"
)
|
|
|
|
|
2021-02-02 12:05:47 +01:00
|
|
|
// Run implements ExperimentMeasurer.Run.
|
|
|
|
func (m Measurer) Run(
|
|
|
|
ctx context.Context,
|
|
|
|
sess model.ExperimentSession,
|
|
|
|
measurement *model.Measurement,
|
|
|
|
callbacks model.ExperimentCallbacks,
|
|
|
|
) error {
|
|
|
|
ctx, cancel := context.WithTimeout(ctx, 60*time.Second)
|
|
|
|
defer cancel()
|
|
|
|
tk := new(TestKeys)
|
|
|
|
measurement.TestKeys = tk
|
|
|
|
tk.Agent = "redirect"
|
|
|
|
tk.ClientResolver = sess.ResolverIP()
|
|
|
|
if measurement.Input == "" {
|
|
|
|
return ErrNoInput
|
|
|
|
}
|
|
|
|
URL, err := url.Parse(string(measurement.Input))
|
|
|
|
if err != nil {
|
|
|
|
return ErrInputIsNotAnURL
|
|
|
|
}
|
|
|
|
if URL.Scheme != "http" && URL.Scheme != "https" {
|
|
|
|
return ErrUnsupportedInput
|
|
|
|
}
|
|
|
|
// 1. find test helper
|
|
|
|
testhelpers, _ := sess.GetTestHelpersByName("web-connectivity")
|
2022-01-03 13:53:23 +01:00
|
|
|
var testhelper *model.OOAPIService
|
2021-02-02 12:05:47 +01:00
|
|
|
for _, th := range testhelpers {
|
|
|
|
if th.Type == "https" {
|
|
|
|
testhelper = &th
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if testhelper == nil {
|
|
|
|
return ErrNoAvailableTestHelpers
|
|
|
|
}
|
|
|
|
measurement.TestHelpers = map[string]interface{}{
|
|
|
|
"backend": testhelper,
|
|
|
|
}
|
|
|
|
// 2. perform the DNS lookup step
|
2021-10-05 12:52:19 +02:00
|
|
|
dnsBegin := time.Now()
|
2021-03-23 16:46:46 +01:00
|
|
|
dnsResult := DNSLookup(ctx, DNSLookupConfig{
|
|
|
|
Begin: measurement.MeasurementStartTimeSaved,
|
|
|
|
Session: sess, URL: URL})
|
2021-10-05 12:52:19 +02:00
|
|
|
tk.DNSRuntime = time.Since(dnsBegin)
|
2021-02-02 12:05:47 +01:00
|
|
|
tk.Queries = append(tk.Queries, dnsResult.TestKeys.Queries...)
|
|
|
|
tk.DNSExperimentFailure = dnsResult.Failure
|
|
|
|
epnts := NewEndpoints(URL, dnsResult.Addresses())
|
|
|
|
sess.Logger().Infof("using control: %s", testhelper.Address)
|
|
|
|
// 3. perform the control measurement
|
2021-10-05 12:52:19 +02:00
|
|
|
thBegin := time.Now()
|
2021-02-02 12:05:47 +01:00
|
|
|
tk.Control, err = Control(ctx, sess, testhelper.Address, ControlRequest{
|
|
|
|
HTTPRequest: URL.String(),
|
|
|
|
HTTPRequestHeaders: map[string][]string{
|
2022-05-25 09:54:50 +02:00
|
|
|
"Accept": {model.HTTPHeaderAccept},
|
|
|
|
"Accept-Language": {model.HTTPHeaderAcceptLanguage},
|
|
|
|
"User-Agent": {model.HTTPHeaderUserAgent},
|
2021-02-02 12:05:47 +01:00
|
|
|
},
|
|
|
|
TCPConnect: epnts.Endpoints(),
|
|
|
|
})
|
2021-10-05 12:52:19 +02:00
|
|
|
tk.THRuntime = time.Since(thBegin)
|
2021-02-02 12:05:47 +01:00
|
|
|
tk.ControlFailure = archival.NewFailure(err)
|
|
|
|
// 4. analyze DNS results
|
|
|
|
if tk.ControlFailure == nil {
|
|
|
|
tk.DNSAnalysisResult = DNSAnalysis(URL, dnsResult, tk.Control)
|
|
|
|
}
|
|
|
|
sess.Logger().Infof("DNS analysis result: %+v", internal.StringPointerToString(
|
|
|
|
tk.DNSAnalysisResult.DNSConsistency))
|
|
|
|
// 5. perform TCP/TLS connects
|
2021-03-23 16:46:46 +01:00
|
|
|
//
|
|
|
|
// TODO(bassosimone): here we should also follow the IP addresses
|
|
|
|
// returned by the control experiment.
|
|
|
|
//
|
|
|
|
// See https://github.com/ooni/probe/issues/1414
|
2021-10-05 12:52:19 +02:00
|
|
|
tcptlsBegin := time.Now()
|
2021-02-02 12:05:47 +01:00
|
|
|
connectsResult := Connects(ctx, ConnectsConfig{
|
2021-03-23 16:46:46 +01:00
|
|
|
Begin: measurement.MeasurementStartTimeSaved,
|
2021-02-02 12:05:47 +01:00
|
|
|
Session: sess,
|
|
|
|
TargetURL: URL,
|
|
|
|
URLGetterURLs: epnts.URLs(),
|
|
|
|
})
|
2021-10-05 12:52:19 +02:00
|
|
|
tk.TCPTLSRuntime = time.Since(tcptlsBegin)
|
2021-02-02 12:05:47 +01:00
|
|
|
sess.Logger().Infof(
|
|
|
|
"TCP/TLS endpoints: %d/%d reachable", connectsResult.Successes, connectsResult.Total)
|
|
|
|
for _, tcpkeys := range connectsResult.AllKeys {
|
|
|
|
// rewrite TCPConnect to include blocking information - it is very
|
|
|
|
// sad that we're storing analysis result inside the measurement
|
|
|
|
tk.TCPConnect = append(tk.TCPConnect, ComputeTCPBlocking(
|
|
|
|
tcpkeys.TCPConnect, tk.Control.TCPConnect)...)
|
2021-03-23 16:46:46 +01:00
|
|
|
for _, ev := range tcpkeys.NetworkEvents {
|
|
|
|
ev.Tags = []string{TCPTLSExperimentTag}
|
|
|
|
tk.NetworkEvents = append(tk.NetworkEvents, ev)
|
|
|
|
}
|
|
|
|
for _, ev := range tcpkeys.TLSHandshakes {
|
|
|
|
ev.Tags = []string{TCPTLSExperimentTag}
|
|
|
|
tk.TLSHandshakes = append(tk.TLSHandshakes, ev)
|
|
|
|
}
|
2021-02-02 12:05:47 +01:00
|
|
|
}
|
|
|
|
tk.TCPConnectAttempts = connectsResult.Total
|
|
|
|
tk.TCPConnectSuccesses = connectsResult.Successes
|
|
|
|
// 6. perform HTTP/HTTPS measurement
|
2021-10-05 12:52:19 +02:00
|
|
|
httpBegin := time.Now()
|
2021-02-02 12:05:47 +01:00
|
|
|
httpResult := HTTPGet(ctx, HTTPGetConfig{
|
|
|
|
Addresses: dnsResult.Addresses(),
|
2021-03-23 16:46:46 +01:00
|
|
|
Begin: measurement.MeasurementStartTimeSaved,
|
2021-02-02 12:05:47 +01:00
|
|
|
Session: sess,
|
|
|
|
TargetURL: URL,
|
|
|
|
})
|
2021-10-05 12:52:19 +02:00
|
|
|
tk.HTTPRuntime = time.Since(httpBegin)
|
2021-02-02 12:05:47 +01:00
|
|
|
tk.HTTPExperimentFailure = httpResult.Failure
|
|
|
|
tk.Requests = append(tk.Requests, httpResult.TestKeys.Requests...)
|
|
|
|
// 7. compare HTTP measurement to control
|
|
|
|
tk.HTTPAnalysisResult = HTTPAnalysis(httpResult.TestKeys, tk.Control)
|
|
|
|
tk.HTTPAnalysisResult.Log(sess.Logger())
|
|
|
|
tk.Summary = Summarize(tk)
|
|
|
|
tk.Summary.Log(sess.Logger())
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// ComputeTCPBlocking will return a copy of the input TCPConnect structure
|
|
|
|
// where we set the Blocking value depending on the control results.
|
|
|
|
func ComputeTCPBlocking(measurement []archival.TCPConnectEntry,
|
|
|
|
control map[string]ControlTCPConnectResult) (out []archival.TCPConnectEntry) {
|
|
|
|
out = []archival.TCPConnectEntry{}
|
|
|
|
for _, me := range measurement {
|
|
|
|
epnt := net.JoinHostPort(me.IP, strconv.Itoa(me.Port))
|
|
|
|
if ce, ok := control[epnt]; ok {
|
|
|
|
v := ce.Failure == nil && me.Status.Failure != nil
|
|
|
|
me.Status.Blocked = &v
|
|
|
|
}
|
|
|
|
out = append(out, me)
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// SummaryKeys contains summary keys for this experiment.
//
// This structure is part of the ABI contract with ooniprobe, so
// any change to it must be made with care.
type SummaryKeys struct {
	Accessible bool   `json:"accessible"`
	Blocking   string `json:"blocking"`
	IsAnomaly  bool   `json:"-"`
}
|
|
|
|
|
|
|
|
// GetSummaryKeys implements model.ExperimentMeasurer.GetSummaryKeys.
|
|
|
|
func (m Measurer) GetSummaryKeys(measurement *model.Measurement) (interface{}, error) {
|
|
|
|
sk := SummaryKeys{IsAnomaly: false}
|
|
|
|
tk, ok := measurement.TestKeys.(*TestKeys)
|
|
|
|
if !ok {
|
|
|
|
return sk, errors.New("invalid test keys type")
|
|
|
|
}
|
|
|
|
sk.IsAnomaly = tk.BlockingReason != nil
|
|
|
|
if tk.BlockingReason != nil {
|
|
|
|
sk.Blocking = *tk.BlockingReason
|
|
|
|
}
|
|
|
|
sk.Accessible = tk.Accessible != nil && *tk.Accessible
|
|
|
|
return sk, nil
|
|
|
|
}
|