api.go 37 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179
  1. /*
  2. * Copyright (c) 2016, Psiphon Inc.
  3. * All rights reserved.
  4. *
  5. * This program is free software: you can redistribute it and/or modify
  6. * it under the terms of the GNU General Public License as published by
  7. * the Free Software Foundation, either version 3 of the License, or
  8. * (at your option) any later version.
  9. *
  10. * This program is distributed in the hope that it will be useful,
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  13. * GNU General Public License for more details.
  14. *
  15. * You should have received a copy of the GNU General Public License
  16. * along with this program. If not, see <http://www.gnu.org/licenses/>.
  17. *
  18. */
  19. package server
  20. import (
  21. "crypto/subtle"
  22. "encoding/json"
  23. "errors"
  24. "fmt"
  25. "net"
  26. "regexp"
  27. "runtime/debug"
  28. "strconv"
  29. "strings"
  30. "unicode"
  31. "github.com/Psiphon-Labs/psiphon-tunnel-core/psiphon/common"
  32. "github.com/Psiphon-Labs/psiphon-tunnel-core/psiphon/common/protocol"
  33. "github.com/Psiphon-Labs/psiphon-tunnel-core/psiphon/common/tactics"
  34. )
  35. const (
  36. MAX_API_PARAMS_SIZE = 256 * 1024 // 256KB
  37. PADDING_MAX_BYTES = 16 * 1024
  38. CLIENT_PLATFORM_ANDROID = "Android"
  39. CLIENT_PLATFORM_WINDOWS = "Windows"
  40. CLIENT_PLATFORM_IOS = "iOS"
  41. )
  42. // sshAPIRequestHandler routes Psiphon API requests transported as
  43. // JSON objects via the SSH request mechanism.
  44. //
  45. // The API request handlers, handshakeAPIRequestHandler, etc., are
  46. // reused by webServer which offers the Psiphon API via web transport.
  47. //
  48. // The API request parameters and event log values follow the legacy
  49. // psi_web protocol and naming conventions. The API is compatible with
  50. // all tunnel-core clients but are not backwards compatible with all
  51. // legacy clients.
  52. //
  53. func sshAPIRequestHandler(
  54. support *SupportServices,
  55. geoIPData GeoIPData,
  56. authorizedAccessTypes []string,
  57. name string,
  58. requestPayload []byte) ([]byte, error) {
  59. // Notes:
  60. //
  61. // - For SSH requests, MAX_API_PARAMS_SIZE is implicitly enforced
  62. // by max SSH request packet size.
  63. //
  64. // - The param protocol.PSIPHON_API_HANDSHAKE_AUTHORIZATIONS is an
  65. // array of base64-encoded strings; the base64 representation should
  66. // not be decoded to []byte values. The default behavior of
  67. // https://golang.org/pkg/encoding/json/#Unmarshal for a target of
  68. // type map[string]interface{} will unmarshal a base64-encoded string
  69. // to a string, not a decoded []byte, as required.
  70. var params common.APIParameters
  71. err := json.Unmarshal(requestPayload, &params)
  72. if err != nil {
  73. return nil, common.ContextError(
  74. fmt.Errorf("invalid payload for request name: %s: %s", name, err))
  75. }
  76. return dispatchAPIRequestHandler(
  77. support,
  78. protocol.PSIPHON_SSH_API_PROTOCOL,
  79. geoIPData,
  80. authorizedAccessTypes,
  81. name,
  82. params)
  83. }
  84. // dispatchAPIRequestHandler is the common dispatch point for both
  85. // web and SSH API requests.
  86. func dispatchAPIRequestHandler(
  87. support *SupportServices,
  88. apiProtocol string,
  89. geoIPData GeoIPData,
  90. authorizedAccessTypes []string,
  91. name string,
  92. params common.APIParameters) (response []byte, reterr error) {
  93. // Recover from and log any unexpected panics caused by user input
  94. // handling bugs. User inputs should be properly validated; this
  95. // mechanism is only a last resort to prevent the process from
  96. // terminating in the case of a bug.
  97. defer func() {
  98. if e := recover(); e != nil {
  99. if intentionalPanic, ok := e.(IntentionalPanicError); ok {
  100. panic(intentionalPanic)
  101. } else {
  102. log.LogPanicRecover(e, debug.Stack())
  103. reterr = common.ContextError(errors.New("request handler panic"))
  104. }
  105. }
  106. }()
  107. // Before invoking the handlers, enforce some preconditions:
  108. //
  109. // - A handshake request must precede any other requests.
  110. // - When the handshake results in a traffic rules state where
  111. // the client is immediately exhausted, no requests
  112. // may succeed. This case ensures that blocked clients do
  113. // not log "connected", etc.
  114. //
  115. // Only one handshake request may be made. There is no check here
  116. // to enforce that handshakeAPIRequestHandler will be called at
  117. // most once. The SetHandshakeState call in handshakeAPIRequestHandler
  118. // enforces that only a single handshake is made; enforcing that there
  119. // ensures no race condition even if concurrent requests are
  120. // in flight.
  121. if name != protocol.PSIPHON_API_HANDSHAKE_REQUEST_NAME {
  122. // TODO: same session-ID-lookup TODO in handshakeAPIRequestHandler
  123. // applies here.
  124. sessionID, err := getStringRequestParam(params, "client_session_id")
  125. if err == nil {
  126. // Note: follows/duplicates baseRequestParams validation
  127. if !isHexDigits(support.Config, sessionID) {
  128. err = errors.New("invalid param: client_session_id")
  129. }
  130. }
  131. if err != nil {
  132. return nil, common.ContextError(err)
  133. }
  134. completed, exhausted, err := support.TunnelServer.GetClientHandshaked(sessionID)
  135. if err != nil {
  136. return nil, common.ContextError(err)
  137. }
  138. if !completed {
  139. return nil, common.ContextError(errors.New("handshake not completed"))
  140. }
  141. if exhausted {
  142. return nil, common.ContextError(errors.New("exhausted after handshake"))
  143. }
  144. }
  145. switch name {
  146. case protocol.PSIPHON_API_HANDSHAKE_REQUEST_NAME:
  147. return handshakeAPIRequestHandler(support, apiProtocol, geoIPData, params)
  148. case protocol.PSIPHON_API_CONNECTED_REQUEST_NAME:
  149. return connectedAPIRequestHandler(support, geoIPData, authorizedAccessTypes, params)
  150. case protocol.PSIPHON_API_STATUS_REQUEST_NAME:
  151. return statusAPIRequestHandler(support, geoIPData, authorizedAccessTypes, params)
  152. case protocol.PSIPHON_API_CLIENT_VERIFICATION_REQUEST_NAME:
  153. return clientVerificationAPIRequestHandler(support, geoIPData, authorizedAccessTypes, params)
  154. }
  155. return nil, common.ContextError(fmt.Errorf("invalid request name: %s", name))
  156. }
  157. var handshakeRequestParams = append(
  158. append(
  159. // Note: legacy clients may not send "session_id" in handshake
  160. []requestParamSpec{{"session_id", isHexDigits, requestParamOptional}},
  161. tacticsParams...),
  162. baseRequestParams...)
  163. // handshakeAPIRequestHandler implements the "handshake" API request.
  164. // Clients make the handshake immediately after establishing a tunnel
  165. // connection; the response tells the client what homepage to open, what
  166. // stats to record, etc.
  167. func handshakeAPIRequestHandler(
  168. support *SupportServices,
  169. apiProtocol string,
  170. geoIPData GeoIPData,
  171. params common.APIParameters) ([]byte, error) {
  172. // Note: ignoring "known_servers" params
  173. err := validateRequestParams(support.Config, params, baseRequestParams)
  174. if err != nil {
  175. return nil, common.ContextError(err)
  176. }
  177. sessionID, _ := getStringRequestParam(params, "client_session_id")
  178. sponsorID, _ := getStringRequestParam(params, "sponsor_id")
  179. clientVersion, _ := getStringRequestParam(params, "client_version")
  180. clientPlatform, _ := getStringRequestParam(params, "client_platform")
  181. isMobile := isMobileClientPlatform(clientPlatform)
  182. normalizedPlatform := normalizeClientPlatform(clientPlatform)
  183. var authorizations []string
  184. if params[protocol.PSIPHON_API_HANDSHAKE_AUTHORIZATIONS] != nil {
  185. authorizations, err = getStringArrayRequestParam(params, protocol.PSIPHON_API_HANDSHAKE_AUTHORIZATIONS)
  186. if err != nil {
  187. return nil, common.ContextError(err)
  188. }
  189. }
  190. // Note: no guarantee that PsinetDatabase won't reload between database calls
  191. db := support.PsinetDatabase
  192. httpsRequestRegexes := db.GetHttpsRequestRegexes(sponsorID)
  193. // Flag the SSH client as having completed its handshake. This
  194. // may reselect traffic rules and starts allowing port forwards.
  195. // TODO: in the case of SSH API requests, the actual sshClient could
  196. // be passed in and used here. The session ID lookup is only strictly
  197. // necessary to support web API requests.
  198. activeAuthorizationIDs, authorizedAccessTypes, err := support.TunnelServer.SetClientHandshakeState(
  199. sessionID,
  200. handshakeState{
  201. completed: true,
  202. apiProtocol: apiProtocol,
  203. apiParams: copyBaseRequestParams(params),
  204. expectDomainBytes: len(httpsRequestRegexes) > 0,
  205. },
  206. authorizations)
  207. if err != nil {
  208. return nil, common.ContextError(err)
  209. }
  210. tacticsPayload, err := support.TacticsServer.GetTacticsPayload(
  211. common.GeoIPData(geoIPData), params)
  212. if err != nil {
  213. return nil, common.ContextError(err)
  214. }
  215. var marshaledTacticsPayload []byte
  216. if tacticsPayload != nil {
  217. marshaledTacticsPayload, err = json.Marshal(tacticsPayload)
  218. if err != nil {
  219. return nil, common.ContextError(err)
  220. }
  221. // Log a metric when new tactics are issued. Logging here indicates that
  222. // the handshake tactics mechanism is active; but logging for every
  223. // handshake creates unneccesary log data.
  224. if len(tacticsPayload.Tactics) > 0 {
  225. logFields := getRequestLogFields(
  226. tactics.TACTICS_METRIC_EVENT_NAME,
  227. geoIPData,
  228. authorizedAccessTypes,
  229. params,
  230. handshakeRequestParams)
  231. logFields[tactics.NEW_TACTICS_TAG_LOG_FIELD_NAME] = tacticsPayload.Tag
  232. logFields[tactics.IS_TACTICS_REQUEST_LOG_FIELD_NAME] = false
  233. log.LogRawFieldsWithTimestamp(logFields)
  234. }
  235. }
  236. // The log comes _after_ SetClientHandshakeState, in case that call rejects
  237. // the state change (for example, if a second handshake is performed)
  238. //
  239. // The handshake event is no longer shipped to log consumers, so this is
  240. // simply a diagnostic log. Since the "server_tunnel" event includes all
  241. // common API parameters and "handshake_completed" flag, this handshake
  242. // log is mostly redundant and set to debug level.
  243. log.WithContextFields(
  244. getRequestLogFields(
  245. "",
  246. geoIPData,
  247. authorizedAccessTypes,
  248. params,
  249. baseRequestParams)).Debug("handshake")
  250. pad_response, _ := getPaddingSizeRequestParam(params, "pad_response")
  251. handshakeResponse := protocol.HandshakeResponse{
  252. SSHSessionID: sessionID,
  253. Homepages: db.GetRandomizedHomepages(sponsorID, geoIPData.Country, isMobile),
  254. UpgradeClientVersion: db.GetUpgradeClientVersion(clientVersion, normalizedPlatform),
  255. PageViewRegexes: make([]map[string]string, 0),
  256. HttpsRequestRegexes: httpsRequestRegexes,
  257. EncodedServerList: db.DiscoverServers(geoIPData.DiscoveryValue),
  258. ClientRegion: geoIPData.Country,
  259. ServerTimestamp: common.GetCurrentTimestamp(),
  260. ActiveAuthorizationIDs: activeAuthorizationIDs,
  261. TacticsPayload: marshaledTacticsPayload,
  262. Padding: strings.Repeat(" ", pad_response),
  263. }
  264. responsePayload, err := json.Marshal(handshakeResponse)
  265. if err != nil {
  266. return nil, common.ContextError(err)
  267. }
  268. return responsePayload, nil
  269. }
  270. var connectedRequestParams = append(
  271. []requestParamSpec{
  272. {"session_id", isHexDigits, 0},
  273. {"last_connected", isLastConnected, 0},
  274. {"establishment_duration", isIntString, requestParamOptional | requestParamLogStringAsInt}},
  275. baseRequestParams...)
  276. // updateOnConnectedParamNames are connected request parameters which are
  277. // copied to update data logged with server_tunnel: these fields either only
  278. // ship with or ship newer data with connected requests.
  279. var updateOnConnectedParamNames = []string{
  280. "last_connected",
  281. "establishment_duration",
  282. "upstream_bytes_fragmented",
  283. "upstream_min_bytes_written",
  284. "upstream_max_bytes_written",
  285. "upstream_min_delayed",
  286. "upstream_max_delayed",
  287. }
  288. // connectedAPIRequestHandler implements the "connected" API request.
  289. // Clients make the connected request once a tunnel connection has been
  290. // established and at least once per day. The last_connected input value,
  291. // which should be a connected_timestamp output from a previous connected
  292. // response, is used to calculate unique user stats.
  293. // connected_timestamp is truncated as a privacy measure.
  294. func connectedAPIRequestHandler(
  295. support *SupportServices,
  296. geoIPData GeoIPData,
  297. authorizedAccessTypes []string,
  298. params common.APIParameters) ([]byte, error) {
  299. err := validateRequestParams(support.Config, params, connectedRequestParams)
  300. if err != nil {
  301. return nil, common.ContextError(err)
  302. }
  303. // Update, for server_tunnel logging, upstream fragmentor metrics, as the
  304. // client may have performed more upstream fragmentation since the
  305. // previous metrics reported by the handshake request. Also, additional
  306. // fields reported only in the connected request, are added to
  307. // server_tunnel here.
  308. // TODO: same session-ID-lookup TODO in handshakeAPIRequestHandler
  309. // applies here.
  310. sessionID, _ := getStringRequestParam(params, "client_session_id")
  311. err = support.TunnelServer.UpdateClientAPIParameters(
  312. sessionID, copyUpdateOnConnectedParams(params))
  313. if err != nil {
  314. return nil, common.ContextError(err)
  315. }
  316. log.LogRawFieldsWithTimestamp(
  317. getRequestLogFields(
  318. "connected",
  319. geoIPData,
  320. authorizedAccessTypes,
  321. params,
  322. connectedRequestParams))
  323. pad_response, _ := getPaddingSizeRequestParam(params, "pad_response")
  324. connectedResponse := protocol.ConnectedResponse{
  325. ConnectedTimestamp: common.TruncateTimestampToHour(common.GetCurrentTimestamp()),
  326. Padding: strings.Repeat(" ", pad_response),
  327. }
  328. responsePayload, err := json.Marshal(connectedResponse)
  329. if err != nil {
  330. return nil, common.ContextError(err)
  331. }
  332. return responsePayload, nil
  333. }
  334. var statusRequestParams = append(
  335. []requestParamSpec{
  336. {"session_id", isHexDigits, 0},
  337. {"connected", isBooleanFlag, requestParamLogFlagAsBool}},
  338. baseRequestParams...)
  339. var remoteServerListStatParams = []requestParamSpec{
  340. {"session_id", isHexDigits, requestParamOptional},
  341. {"propagation_channel_id", isHexDigits, requestParamOptional},
  342. {"sponsor_id", isHexDigits, requestParamOptional},
  343. {"client_version", isAnyString, requestParamOptional},
  344. {"client_platform", isAnyString, requestParamOptional},
  345. {"client_build_rev", isAnyString, requestParamOptional},
  346. {"client_download_timestamp", isISO8601Date, 0},
  347. {"url", isAnyString, 0},
  348. {"etag", isAnyString, 0},
  349. }
  350. var failedTunnelStatParams = append(
  351. []requestParamSpec{
  352. {"session_id", isHexDigits, 0},
  353. {"client_failed_timestamp", isISO8601Date, 0},
  354. {"tunnel_error", isAnyString, 0}},
  355. baseRequestParams...)
  356. // statusAPIRequestHandler implements the "status" API request.
  357. // Clients make periodic status requests which deliver client-side
  358. // recorded data transfer and tunnel duration stats.
  359. // Note from psi_web implementation: no input validation on domains;
  360. // any string is accepted (regex transform may result in arbitrary
  361. // string). Stats processor must handle this input with care.
  362. func statusAPIRequestHandler(
  363. support *SupportServices,
  364. geoIPData GeoIPData,
  365. authorizedAccessTypes []string,
  366. params common.APIParameters) ([]byte, error) {
  367. err := validateRequestParams(support.Config, params, statusRequestParams)
  368. if err != nil {
  369. return nil, common.ContextError(err)
  370. }
  371. sessionID, _ := getStringRequestParam(params, "client_session_id")
  372. statusData, err := getJSONObjectRequestParam(params, "statusData")
  373. if err != nil {
  374. return nil, common.ContextError(err)
  375. }
  376. // Logs are queued until the input is fully validated. Otherwise, stats
  377. // could be double counted if the client has a bug in its request
  378. // formatting: partial stats would be logged (counted), the request would
  379. // fail, and clients would then resend all the same stats again.
  380. logQueue := make([]LogFields, 0)
  381. // Domain bytes transferred stats
  382. // Older clients may not submit this data
  383. // Clients are expected to send host_bytes/domain_bytes stats only when
  384. // configured to do so in the handshake reponse. Legacy clients may still
  385. // report "(OTHER)" host_bytes when no regexes are set. Drop those stats.
  386. domainBytesExpected, err := support.TunnelServer.ExpectClientDomainBytes(sessionID)
  387. if err != nil {
  388. return nil, common.ContextError(err)
  389. }
  390. if domainBytesExpected && statusData["host_bytes"] != nil {
  391. hostBytes, err := getMapStringInt64RequestParam(statusData, "host_bytes")
  392. if err != nil {
  393. return nil, common.ContextError(err)
  394. }
  395. for domain, bytes := range hostBytes {
  396. domainBytesFields := getRequestLogFields(
  397. "domain_bytes",
  398. geoIPData,
  399. authorizedAccessTypes,
  400. params,
  401. statusRequestParams)
  402. domainBytesFields["domain"] = domain
  403. domainBytesFields["bytes"] = bytes
  404. logQueue = append(logQueue, domainBytesFields)
  405. }
  406. }
  407. // Limitation: for "persistent" stats, host_id and geolocation is time-of-sending
  408. // not time-of-recording.
  409. // Remote server list download persistent stats.
  410. // Older clients may not submit this data.
  411. if statusData["remote_server_list_stats"] != nil {
  412. remoteServerListStats, err := getJSONObjectArrayRequestParam(statusData, "remote_server_list_stats")
  413. if err != nil {
  414. return nil, common.ContextError(err)
  415. }
  416. for _, remoteServerListStat := range remoteServerListStats {
  417. err := validateRequestParams(support.Config, remoteServerListStat, remoteServerListStatParams)
  418. if err != nil {
  419. return nil, common.ContextError(err)
  420. }
  421. // remote_server_list defaults to using the common params from the
  422. // outer statusRequestParams
  423. remoteServerListFields := getRequestLogFields(
  424. "remote_server_list",
  425. geoIPData,
  426. authorizedAccessTypes,
  427. params,
  428. statusRequestParams)
  429. for name, value := range remoteServerListStat {
  430. remoteServerListFields[name] = value
  431. }
  432. logQueue = append(logQueue, remoteServerListFields)
  433. }
  434. }
  435. // Failed tunnel persistent stats.
  436. // Older clients may not submit this data.
  437. if statusData["failed_tunnel_stats"] != nil {
  438. failedTunnelStats, err := getJSONObjectArrayRequestParam(statusData, "failed_tunnel_stats")
  439. if err != nil {
  440. return nil, common.ContextError(err)
  441. }
  442. for _, failedTunnelStat := range failedTunnelStats {
  443. // failed_tunnel supplies a full set of common params, but the
  444. // server secret must use the corect value from the outer
  445. // statusRequestParams
  446. failedTunnelStat["server_secret"] = params["server_secret"]
  447. err := validateRequestParams(support.Config, failedTunnelStat, failedTunnelStatParams)
  448. if err != nil {
  449. return nil, common.ContextError(err)
  450. }
  451. failedTunnelFields := getRequestLogFields(
  452. "failed_tunnel",
  453. geoIPData,
  454. authorizedAccessTypes,
  455. failedTunnelStat,
  456. failedTunnelStatParams)
  457. logQueue = append(logQueue, failedTunnelFields)
  458. }
  459. }
  460. for _, logItem := range logQueue {
  461. log.LogRawFieldsWithTimestamp(logItem)
  462. }
  463. pad_response, _ := getPaddingSizeRequestParam(params, "pad_response")
  464. return make([]byte, pad_response), nil
  465. }
  466. // clientVerificationAPIRequestHandler is just a compliance stub
  467. // for older Android clients that still send verification requests
  468. func clientVerificationAPIRequestHandler(
  469. support *SupportServices,
  470. geoIPData GeoIPData,
  471. authorizedAccessTypes []string,
  472. params common.APIParameters) ([]byte, error) {
  473. return make([]byte, 0), nil
  474. }
  475. var tacticsParams = []requestParamSpec{
  476. {tactics.STORED_TACTICS_TAG_PARAMETER_NAME, isAnyString, requestParamOptional},
  477. {tactics.SPEED_TEST_SAMPLES_PARAMETER_NAME, nil, requestParamOptional | requestParamJSON},
  478. }
  479. var tacticsRequestParams = append(
  480. append(
  481. []requestParamSpec{{"session_id", isHexDigits, 0}},
  482. tacticsParams...),
  483. baseRequestParams...)
  484. func getTacticsAPIParameterValidator(config *Config) common.APIParameterValidator {
  485. return func(params common.APIParameters) error {
  486. return validateRequestParams(config, params, tacticsRequestParams)
  487. }
  488. }
  489. func getTacticsAPIParameterLogFieldFormatter() common.APIParameterLogFieldFormatter {
  490. return func(geoIPData common.GeoIPData, params common.APIParameters) common.LogFields {
  491. logFields := getRequestLogFields(
  492. tactics.TACTICS_METRIC_EVENT_NAME,
  493. GeoIPData(geoIPData),
  494. nil, // authorizedAccessTypes are not known yet
  495. params,
  496. tacticsRequestParams)
  497. return common.LogFields(logFields)
  498. }
  499. }
  500. type requestParamSpec struct {
  501. name string
  502. validator func(*Config, string) bool
  503. flags uint32
  504. }
  505. const (
  506. requestParamOptional = 1
  507. requestParamNotLogged = 2
  508. requestParamArray = 4
  509. requestParamJSON = 8
  510. requestParamLogStringAsInt = 16
  511. requestParamLogStringLengthAsInt = 32
  512. requestParamLogFlagAsBool = 64
  513. )
  514. // baseRequestParams is the list of required and optional
  515. // request parameters; derived from COMMON_INPUTS and
  516. // OPTIONAL_COMMON_INPUTS in psi_web.
  517. // Each param is expected to be a string, unless requestParamArray
  518. // is specified, in which case an array of string is expected.
  519. var baseRequestParams = []requestParamSpec{
  520. {"server_secret", isServerSecret, requestParamNotLogged},
  521. {"client_session_id", isHexDigits, requestParamNotLogged},
  522. {"propagation_channel_id", isHexDigits, 0},
  523. {"sponsor_id", isHexDigits, 0},
  524. {"client_version", isIntString, requestParamLogStringAsInt},
  525. {"client_platform", isClientPlatform, 0},
  526. {"client_build_rev", isHexDigits, requestParamOptional},
  527. {"relay_protocol", isRelayProtocol, 0},
  528. {"tunnel_whole_device", isBooleanFlag, requestParamOptional | requestParamLogFlagAsBool},
  529. {"device_region", isAnyString, requestParamOptional},
  530. {"ssh_client_version", isAnyString, requestParamOptional},
  531. {"upstream_proxy_type", isUpstreamProxyType, requestParamOptional},
  532. {"upstream_proxy_custom_header_names", isAnyString, requestParamOptional | requestParamArray},
  533. {"meek_dial_address", isDialAddress, requestParamOptional},
  534. {"meek_resolved_ip_address", isIPAddress, requestParamOptional},
  535. {"meek_sni_server_name", isDomain, requestParamOptional},
  536. {"meek_host_header", isHostHeader, requestParamOptional},
  537. {"meek_transformed_host_name", isBooleanFlag, requestParamOptional | requestParamLogFlagAsBool},
  538. {"user_agent", isAnyString, requestParamOptional},
  539. {"tls_profile", isAnyString, requestParamOptional},
  540. {"server_entry_region", isRegionCode, requestParamOptional},
  541. {"server_entry_source", isServerEntrySource, requestParamOptional},
  542. {"server_entry_timestamp", isISO8601Date, requestParamOptional},
  543. {tactics.APPLIED_TACTICS_TAG_PARAMETER_NAME, isAnyString, requestParamOptional},
  544. {"dial_port_number", isIntString, requestParamOptional | requestParamLogStringAsInt},
  545. {"quic_version", isAnyString, requestParamOptional},
  546. {"quic_dial_sni_address", isAnyString, requestParamOptional},
  547. {"upstream_bytes_fragmented", isIntString, requestParamOptional | requestParamLogStringAsInt},
  548. {"upstream_min_bytes_written", isIntString, requestParamOptional | requestParamLogStringAsInt},
  549. {"upstream_max_bytes_written", isIntString, requestParamOptional | requestParamLogStringAsInt},
  550. {"upstream_min_delayed", isIntString, requestParamOptional | requestParamLogStringAsInt},
  551. {"upstream_max_delayed", isIntString, requestParamOptional | requestParamLogStringAsInt},
  552. {"padding", isAnyString, requestParamOptional | requestParamLogStringLengthAsInt},
  553. {"pad_response", isIntString, requestParamOptional | requestParamLogStringAsInt},
  554. {"is_replay", isBooleanFlag, requestParamOptional | requestParamLogFlagAsBool},
  555. {"egress_region", isRegionCode, requestParamOptional},
  556. {"dial_duration", isIntString, requestParamOptional | requestParamLogStringAsInt},
  557. {"candidate_number", isIntString, requestParamOptional | requestParamLogStringAsInt},
  558. }
  559. func validateRequestParams(
  560. config *Config,
  561. params common.APIParameters,
  562. expectedParams []requestParamSpec) error {
  563. for _, expectedParam := range expectedParams {
  564. value := params[expectedParam.name]
  565. if value == nil {
  566. if expectedParam.flags&requestParamOptional != 0 {
  567. continue
  568. }
  569. return common.ContextError(
  570. fmt.Errorf("missing param: %s", expectedParam.name))
  571. }
  572. var err error
  573. switch {
  574. case expectedParam.flags&requestParamArray != 0:
  575. err = validateStringArrayRequestParam(config, expectedParam, value)
  576. case expectedParam.flags&requestParamJSON != 0:
  577. // No validation: the JSON already unmarshalled; the parameter
  578. // user will validate that the JSON contains the expected
  579. // objects/data.
  580. // TODO: without validation, any valid JSON will be logged
  581. // by getRequestLogFields, even if the parameter user validates
  582. // and rejects the parameter.
  583. default:
  584. err = validateStringRequestParam(config, expectedParam, value)
  585. }
  586. if err != nil {
  587. return common.ContextError(err)
  588. }
  589. }
  590. return nil
  591. }
  592. // copyBaseRequestParams makes a copy of the params which
  593. // includes only the baseRequestParams.
  594. func copyBaseRequestParams(params common.APIParameters) common.APIParameters {
  595. // Note: not a deep copy; assumes baseRequestParams values
  596. // are all scalar types (int, string, etc.)
  597. paramsCopy := make(common.APIParameters)
  598. for _, baseParam := range baseRequestParams {
  599. value := params[baseParam.name]
  600. if value == nil {
  601. continue
  602. }
  603. paramsCopy[baseParam.name] = value
  604. }
  605. return paramsCopy
  606. }
  607. func copyUpdateOnConnectedParams(params common.APIParameters) common.APIParameters {
  608. // Note: not a deep copy
  609. paramsCopy := make(common.APIParameters)
  610. for _, name := range updateOnConnectedParamNames {
  611. value := params[name]
  612. if value == nil {
  613. continue
  614. }
  615. paramsCopy[name] = value
  616. }
  617. return paramsCopy
  618. }
  619. func validateStringRequestParam(
  620. config *Config,
  621. expectedParam requestParamSpec,
  622. value interface{}) error {
  623. strValue, ok := value.(string)
  624. if !ok {
  625. return common.ContextError(
  626. fmt.Errorf("unexpected string param type: %s", expectedParam.name))
  627. }
  628. if !expectedParam.validator(config, strValue) {
  629. return common.ContextError(
  630. fmt.Errorf("invalid param: %s: %s", expectedParam.name, strValue))
  631. }
  632. return nil
  633. }
  634. func validateStringArrayRequestParam(
  635. config *Config,
  636. expectedParam requestParamSpec,
  637. value interface{}) error {
  638. arrayValue, ok := value.([]interface{})
  639. if !ok {
  640. return common.ContextError(
  641. fmt.Errorf("unexpected string param type: %s", expectedParam.name))
  642. }
  643. for _, value := range arrayValue {
  644. err := validateStringRequestParam(config, expectedParam, value)
  645. if err != nil {
  646. return common.ContextError(err)
  647. }
  648. }
  649. return nil
  650. }
  651. // getRequestLogFields makes LogFields to log the API event following
  652. // the legacy psi_web and current ELK naming conventions.
  653. func getRequestLogFields(
  654. eventName string,
  655. geoIPData GeoIPData,
  656. authorizedAccessTypes []string,
  657. params common.APIParameters,
  658. expectedParams []requestParamSpec) LogFields {
  659. logFields := make(LogFields)
  660. if eventName != "" {
  661. logFields["event_name"] = eventName
  662. }
  663. // In psi_web, the space replacement was done to accommodate space
  664. // delimited logging, which is no longer required; we retain the
  665. // transformation so that stats aggregation isn't impacted.
  666. logFields["client_region"] = strings.Replace(geoIPData.Country, " ", "_", -1)
  667. logFields["client_city"] = strings.Replace(geoIPData.City, " ", "_", -1)
  668. logFields["client_isp"] = strings.Replace(geoIPData.ISP, " ", "_", -1)
  669. if len(authorizedAccessTypes) > 0 {
  670. logFields["authorized_access_types"] = authorizedAccessTypes
  671. }
  672. if params == nil {
  673. return logFields
  674. }
  675. for _, expectedParam := range expectedParams {
  676. if expectedParam.flags&requestParamNotLogged != 0 {
  677. continue
  678. }
  679. value := params[expectedParam.name]
  680. if value == nil {
  681. // Special case: older clients don't send this value,
  682. // so log a default.
  683. if expectedParam.name == "tunnel_whole_device" {
  684. value = "0"
  685. } else {
  686. // Skip omitted, optional params
  687. continue
  688. }
  689. }
  690. switch v := value.(type) {
  691. case string:
  692. strValue := v
  693. // Special cases:
  694. // - Number fields are encoded as integer types.
  695. // - For ELK performance we record certain domain-or-IP
  696. // fields as one of two different values based on type;
  697. // we also omit port from these host:port fields for now.
  698. // - Boolean fields that come into the api as "1"/"0"
  699. // must be logged as actual boolean values
  700. switch expectedParam.name {
  701. case "meek_dial_address":
  702. host, _, _ := net.SplitHostPort(strValue)
  703. if isIPAddress(nil, host) {
  704. logFields["meek_dial_ip_address"] = host
  705. } else {
  706. logFields["meek_dial_domain"] = host
  707. }
  708. case "upstream_proxy_type":
  709. // Submitted value could be e.g., "SOCKS5" or "socks5"; log lowercase
  710. logFields[expectedParam.name] = strings.ToLower(strValue)
  711. case tactics.SPEED_TEST_SAMPLES_PARAMETER_NAME:
  712. // Due to a client bug, clients may deliever an incorrect ""
  713. // value for speed_test_samples via the web API protocol. Omit
  714. // the field in this case.
  715. default:
  716. if expectedParam.flags&requestParamLogStringAsInt != 0 {
  717. intValue, _ := strconv.Atoi(strValue)
  718. logFields[expectedParam.name] = intValue
  719. } else if expectedParam.flags&requestParamLogStringLengthAsInt != 0 {
  720. logFields[expectedParam.name] = len(strValue)
  721. } else if expectedParam.flags&requestParamLogFlagAsBool != 0 {
  722. // Submitted value could be "0" or "1"
  723. // "0" and non "0"/"1" values should be transformed to false
  724. // "1" should be transformed to true
  725. if strValue == "1" {
  726. logFields[expectedParam.name] = true
  727. } else {
  728. logFields[expectedParam.name] = false
  729. }
  730. } else {
  731. logFields[expectedParam.name] = strValue
  732. }
  733. }
  734. case []interface{}:
  735. if expectedParam.name == tactics.SPEED_TEST_SAMPLES_PARAMETER_NAME {
  736. logFields[expectedParam.name] = makeSpeedTestSamplesLogField(v)
  737. } else {
  738. logFields[expectedParam.name] = v
  739. }
  740. default:
  741. logFields[expectedParam.name] = v
  742. }
  743. }
  744. return logFields
  745. }
  746. // makeSpeedTestSamplesLogField renames the tactics.SpeedTestSample json tag
  747. // fields to more verbose names for metrics.
  748. func makeSpeedTestSamplesLogField(samples []interface{}) []interface{} {
  749. // TODO: use reflection and add additional tags, e.g.,
  750. // `json:"s" log:"timestamp"` to remove hard-coded
  751. // tag value dependency?
  752. logSamples := make([]interface{}, len(samples))
  753. for i, sample := range samples {
  754. logSample := make(map[string]interface{})
  755. if m, ok := sample.(map[string]interface{}); ok {
  756. for k, v := range m {
  757. logK := k
  758. switch k {
  759. case "s":
  760. logK = "timestamp"
  761. case "r":
  762. logK = "server_region"
  763. case "p":
  764. logK = "relay_protocol"
  765. case "t":
  766. logK = "round_trip_time_ms"
  767. case "u":
  768. logK = "bytes_up"
  769. case "d":
  770. logK = "bytes_down"
  771. }
  772. logSample[logK] = v
  773. }
  774. }
  775. logSamples[i] = logSample
  776. }
  777. return logSamples
  778. }
  779. func getStringRequestParam(params common.APIParameters, name string) (string, error) {
  780. if params[name] == nil {
  781. return "", common.ContextError(fmt.Errorf("missing param: %s", name))
  782. }
  783. value, ok := params[name].(string)
  784. if !ok {
  785. return "", common.ContextError(fmt.Errorf("invalid param: %s", name))
  786. }
  787. return value, nil
  788. }
  789. func getInt64RequestParam(params common.APIParameters, name string) (int64, error) {
  790. if params[name] == nil {
  791. return 0, common.ContextError(fmt.Errorf("missing param: %s", name))
  792. }
  793. value, ok := params[name].(float64)
  794. if !ok {
  795. return 0, common.ContextError(fmt.Errorf("invalid param: %s", name))
  796. }
  797. return int64(value), nil
  798. }
  799. func getPaddingSizeRequestParam(params common.APIParameters, name string) (int, error) {
  800. value, err := getInt64RequestParam(params, name)
  801. if err != nil {
  802. return 0, common.ContextError(err)
  803. }
  804. if value < 0 {
  805. value = 0
  806. }
  807. if value > PADDING_MAX_BYTES {
  808. value = PADDING_MAX_BYTES
  809. }
  810. return int(value), nil
  811. }
  812. func getJSONObjectRequestParam(params common.APIParameters, name string) (common.APIParameters, error) {
  813. if params[name] == nil {
  814. return nil, common.ContextError(fmt.Errorf("missing param: %s", name))
  815. }
  816. // Note: generic unmarshal of JSON produces map[string]interface{}, not common.APIParameters
  817. value, ok := params[name].(map[string]interface{})
  818. if !ok {
  819. return nil, common.ContextError(fmt.Errorf("invalid param: %s", name))
  820. }
  821. return common.APIParameters(value), nil
  822. }
  823. func getJSONObjectArrayRequestParam(params common.APIParameters, name string) ([]common.APIParameters, error) {
  824. if params[name] == nil {
  825. return nil, common.ContextError(fmt.Errorf("missing param: %s", name))
  826. }
  827. value, ok := params[name].([]interface{})
  828. if !ok {
  829. return nil, common.ContextError(fmt.Errorf("invalid param: %s", name))
  830. }
  831. result := make([]common.APIParameters, len(value))
  832. for i, item := range value {
  833. // Note: generic unmarshal of JSON produces map[string]interface{}, not common.APIParameters
  834. resultItem, ok := item.(map[string]interface{})
  835. if !ok {
  836. return nil, common.ContextError(fmt.Errorf("invalid param: %s", name))
  837. }
  838. result[i] = common.APIParameters(resultItem)
  839. }
  840. return result, nil
  841. }
  842. func getMapStringInt64RequestParam(params common.APIParameters, name string) (map[string]int64, error) {
  843. if params[name] == nil {
  844. return nil, common.ContextError(fmt.Errorf("missing param: %s", name))
  845. }
  846. // TODO: can't use common.APIParameters type?
  847. value, ok := params[name].(map[string]interface{})
  848. if !ok {
  849. return nil, common.ContextError(fmt.Errorf("invalid param: %s", name))
  850. }
  851. result := make(map[string]int64)
  852. for k, v := range value {
  853. numValue, ok := v.(float64)
  854. if !ok {
  855. return nil, common.ContextError(fmt.Errorf("invalid param: %s", name))
  856. }
  857. result[k] = int64(numValue)
  858. }
  859. return result, nil
  860. }
  861. func getStringArrayRequestParam(params common.APIParameters, name string) ([]string, error) {
  862. if params[name] == nil {
  863. return nil, common.ContextError(fmt.Errorf("missing param: %s", name))
  864. }
  865. value, ok := params[name].([]interface{})
  866. if !ok {
  867. return nil, common.ContextError(fmt.Errorf("invalid param: %s", name))
  868. }
  869. result := make([]string, len(value))
  870. for i, v := range value {
  871. strValue, ok := v.(string)
  872. if !ok {
  873. return nil, common.ContextError(fmt.Errorf("invalid param: %s", name))
  874. }
  875. result[i] = strValue
  876. }
  877. return result, nil
  878. }
  879. // Normalize reported client platform. Android clients, for example, report
  880. // OS version, rooted status, and Google Play build status in the clientPlatform
  881. // string along with "Android".
  882. func normalizeClientPlatform(clientPlatform string) string {
  883. if strings.Contains(strings.ToLower(clientPlatform), strings.ToLower(CLIENT_PLATFORM_ANDROID)) {
  884. return CLIENT_PLATFORM_ANDROID
  885. } else if strings.HasPrefix(clientPlatform, CLIENT_PLATFORM_IOS) {
  886. return CLIENT_PLATFORM_IOS
  887. }
  888. return CLIENT_PLATFORM_WINDOWS
  889. }
  890. func isAnyString(config *Config, value string) bool {
  891. return true
  892. }
  893. func isMobileClientPlatform(clientPlatform string) bool {
  894. normalizedClientPlatform := normalizeClientPlatform(clientPlatform)
  895. return normalizedClientPlatform == CLIENT_PLATFORM_ANDROID ||
  896. normalizedClientPlatform == CLIENT_PLATFORM_IOS
  897. }
  898. // Input validators follow the legacy validations rules in psi_web.
  899. func isServerSecret(config *Config, value string) bool {
  900. return subtle.ConstantTimeCompare(
  901. []byte(value),
  902. []byte(config.WebServerSecret)) == 1
  903. }
  904. func isHexDigits(_ *Config, value string) bool {
  905. // Allows both uppercase in addition to lowercase, for legacy support.
  906. return -1 == strings.IndexFunc(value, func(c rune) bool {
  907. return !unicode.Is(unicode.ASCII_Hex_Digit, c)
  908. })
  909. }
  910. func isDigits(_ *Config, value string) bool {
  911. return -1 == strings.IndexFunc(value, func(c rune) bool {
  912. return c < '0' || c > '9'
  913. })
  914. }
  915. func isIntString(_ *Config, value string) bool {
  916. _, err := strconv.Atoi(value)
  917. return err == nil
  918. }
  919. func isClientPlatform(_ *Config, value string) bool {
  920. return -1 == strings.IndexFunc(value, func(c rune) bool {
  921. // Note: stricter than psi_web's Python string.whitespace
  922. return unicode.Is(unicode.White_Space, c)
  923. })
  924. }
  925. func isRelayProtocol(_ *Config, value string) bool {
  926. return common.Contains(protocol.SupportedTunnelProtocols, value)
  927. }
  928. func isBooleanFlag(_ *Config, value string) bool {
  929. return value == "0" || value == "1"
  930. }
  931. func isUpstreamProxyType(_ *Config, value string) bool {
  932. value = strings.ToLower(value)
  933. return value == "http" || value == "socks5" || value == "socks4a"
  934. }
  935. func isRegionCode(_ *Config, value string) bool {
  936. if len(value) != 2 {
  937. return false
  938. }
  939. return -1 == strings.IndexFunc(value, func(c rune) bool {
  940. return c < 'A' || c > 'Z'
  941. })
  942. }
  943. func isDialAddress(_ *Config, value string) bool {
  944. // "<host>:<port>", where <host> is a domain or IP address
  945. parts := strings.Split(value, ":")
  946. if len(parts) != 2 {
  947. return false
  948. }
  949. if !isIPAddress(nil, parts[0]) && !isDomain(nil, parts[0]) {
  950. return false
  951. }
  952. if !isDigits(nil, parts[1]) {
  953. return false
  954. }
  955. port, err := strconv.Atoi(parts[1])
  956. if err != nil {
  957. return false
  958. }
  959. return port > 0 && port < 65536
  960. }
  961. func isIPAddress(_ *Config, value string) bool {
  962. return net.ParseIP(value) != nil
  963. }
  964. var isDomainRegex = regexp.MustCompile("[a-zA-Z\\d-]{1,63}$")
  965. func isDomain(_ *Config, value string) bool {
  966. // From: http://stackoverflow.com/questions/2532053/validate-a-hostname-string
  967. //
  968. // "ensures that each segment
  969. // * contains at least one character and a maximum of 63 characters
  970. // * consists only of allowed characters
  971. // * doesn't begin or end with a hyphen"
  972. //
  973. if len(value) > 255 {
  974. return false
  975. }
  976. value = strings.TrimSuffix(value, ".")
  977. for _, part := range strings.Split(value, ".") {
  978. // Note: regexp doesn't support the following Perl expression which
  979. // would check for '-' prefix/suffix: "(?!-)[a-zA-Z\\d-]{1,63}(?<!-)$"
  980. if strings.HasPrefix(part, "-") || strings.HasSuffix(part, "-") {
  981. return false
  982. }
  983. if !isDomainRegex.Match([]byte(part)) {
  984. return false
  985. }
  986. }
  987. return true
  988. }
  989. func isHostHeader(_ *Config, value string) bool {
  990. // "<host>:<port>", where <host> is a domain or IP address and ":<port>" is optional
  991. if strings.Contains(value, ":") {
  992. return isDialAddress(nil, value)
  993. }
  994. return isIPAddress(nil, value) || isDomain(nil, value)
  995. }
  996. func isServerEntrySource(_ *Config, value string) bool {
  997. return common.Contains(protocol.SupportedServerEntrySources, value)
  998. }
  999. var isISO8601DateRegex = regexp.MustCompile(
  1000. "(?P<year>[0-9]{4})-(?P<month>[0-9]{1,2})-(?P<day>[0-9]{1,2})T(?P<hour>[0-9]{2}):(?P<minute>[0-9]{2}):(?P<second>[0-9]{2})(\\.(?P<fraction>[0-9]+))?(?P<timezone>Z|(([-+])([0-9]{2}):([0-9]{2})))")
  1001. func isISO8601Date(_ *Config, value string) bool {
  1002. return isISO8601DateRegex.Match([]byte(value))
  1003. }
  1004. func isLastConnected(_ *Config, value string) bool {
  1005. return value == "None" || value == "Unknown" || isISO8601Date(nil, value)
  1006. }