psinet.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484
  1. /*
  2. * Copyright (c) 2016, Psiphon Inc.
  3. * All rights reserved.
  4. *
  5. * This program is free software: you can redistribute it and/or modify
  6. * it under the terms of the GNU General Public License as published by
  7. * the Free Software Foundation, either version 3 of the License, or
  8. * (at your option) any later version.
  9. *
  10. * This program is distributed in the hope that it will be useful,
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  13. * GNU General Public License for more details.
  14. *
  15. * You should have received a copy of the GNU General Public License
  16. * along with this program. If not, see <http://www.gnu.org/licenses/>.
  17. *
  18. */
// Package psinet implements psinet database services. The psinet database is a
// JSON-format file containing information about the Psiphon network, including
// sponsors, home pages, stats regexes, available upgrades, and other servers
// for discovery. This package also implements the Psiphon discovery algorithm.
  23. package psinet
  24. import (
  25. "encoding/hex"
  26. "encoding/json"
  27. "fmt"
  28. "math"
  29. "strconv"
  30. "strings"
  31. "time"
  32. "github.com/Psiphon-Labs/psiphon-tunnel-core/psiphon/common"
  33. )
  34. // Database serves Psiphon API data requests. It's safe for
  35. // concurrent usage. The Reload function supports hot reloading
  36. // of Psiphon network data while the server is running.
  37. type Database struct {
  38. common.ReloadableFile
  39. Hosts map[string]Host `json:"hosts"`
  40. Servers []Server `json:"servers"`
  41. Sponsors map[string]Sponsor `json:"sponsors"`
  42. Versions map[string][]ClientVersion `json:"client_versions"`
  43. }
  44. type Host struct {
  45. DatacenterName string `json:"datacenter_name"`
  46. Id string `json:"id"`
  47. IpAddress string `json:"ip_address"`
  48. IsTCS bool `json:"is_TCS"`
  49. MeekCookieEncryptionPublicKey string `json:"meek_cookie_encryption_public_key"`
  50. MeekServerObfuscatedKey string `json:"meek_server_obfuscated_key"`
  51. MeekServerPort int `json:"meek_server_port"`
  52. Region string `json:"region"`
  53. }
  54. type Server struct {
  55. AlternateSshObfuscatedPorts []string `json:"alternate_ssh_obfuscated_ports"`
  56. Capabilities map[string]bool `json:"capabilities"`
  57. DiscoveryDateRange []string `json:"discovery_date_range"`
  58. EgressIpAddress string `json:"egress_ip_address"`
  59. HostId string `json:"host_id"`
  60. Id string `json:"id"`
  61. InternalIpAddress string `json:"internal_ip_address"`
  62. IpAddress string `json:"ip_address"`
  63. IsEmbedded bool `json:"is_embedded"`
  64. IsPermanent bool `json:"is_permanent"`
  65. PropogationChannelId string `json:"propagation_channel_id"`
  66. SshHostKey string `json:"ssh_host_key"`
  67. SshObfuscatedKey string `json:"ssh_obfuscated_key"`
  68. SshObfuscatedPort int `json:"ssh_obfuscated_port"`
  69. SshPassword string `json:"ssh_password"`
  70. SshPort string `json:"ssh_port"`
  71. SshUsername string `json:"ssh_username"`
  72. WebServerCertificate string `json:"web_server_certificate"`
  73. WebServerPort string `json:"web_server_port"`
  74. WebServerSecret string `json:"web_server_secret"`
  75. }
  76. type Sponsor struct {
  77. Banner string
  78. HomePages map[string][]HomePage `json:"home_pages"`
  79. HttpsRequestRegexes []HttpsRequestRegex `json:"https_request_regexes"`
  80. Id string `json:"id"`
  81. MobileHomePages map[string][]HomePage `json:"mobile_home_pages"`
  82. Name string `json:"name"`
  83. PageViewRegexes []PageViewRegex `json:"page_view_regexes"`
  84. WebsiteBanner string `json:"website_banner"`
  85. WebsiteBannerLink string `json:"website_banner_link"`
  86. }
  87. type ClientVersion struct {
  88. Version string `json:"version"`
  89. }
  90. type HomePage struct {
  91. Region string `json:"region"`
  92. Url string `json:"url"`
  93. }
  94. type HttpsRequestRegex struct {
  95. Regex string `json:"regex"`
  96. Replace string `json:"replace"`
  97. }
  98. type MobileHomePage struct {
  99. Region string `json:"region"`
  100. Url string `json:"url"`
  101. }
  102. type PageViewRegex struct {
  103. Regex string `json:"regex"`
  104. Replace string `json:"replace"`
  105. }
  106. // NewDatabase initializes a Database, calling Reload on the specified
  107. // filename.
  108. func NewDatabase(filename string) (*Database, error) {
  109. database := &Database{}
  110. database.ReloadableFile = common.NewReloadableFile(
  111. filename,
  112. func(fileContent []byte) error {
  113. err := json.Unmarshal(fileContent, &database)
  114. if err != nil {
  115. // On error, state remains the same
  116. // (Unmarshal first validates the provided
  117. // JOSN and then populates the interface)
  118. return common.ContextError(err)
  119. }
  120. return nil
  121. })
  122. _, err := database.Reload()
  123. if err != nil {
  124. return nil, common.ContextError(err)
  125. }
  126. return database, nil
  127. }
  128. // GetHomepages returns a list of home pages for the specified sponsor,
  129. // region, and platform.
  130. func (db *Database) GetHomepages(sponsorID, clientRegion string, isMobilePlatform bool) []string {
  131. db.ReloadableFile.RLock()
  132. defer db.ReloadableFile.RUnlock()
  133. sponsorHomePages := make([]string, 0)
  134. // Sponsor id does not exist: fail gracefully
  135. sponsor, ok := db.Sponsors[sponsorID]
  136. if !ok {
  137. return nil
  138. }
  139. homePages := sponsor.HomePages
  140. if isMobilePlatform {
  141. if sponsor.MobileHomePages != nil {
  142. homePages = sponsor.MobileHomePages
  143. }
  144. }
  145. // Case: lookup succeeded and corresponding homepages found for region
  146. homePagesByRegion, ok := homePages[clientRegion]
  147. if ok {
  148. for _, homePage := range homePagesByRegion {
  149. sponsorHomePages = append(sponsorHomePages, strings.Replace(homePage.Url, "client_region=XX", "client_region="+clientRegion, 1))
  150. }
  151. }
  152. // Case: lookup failed or no corresponding homepages found for region --> use default
  153. if sponsorHomePages == nil {
  154. defaultHomePages, ok := homePages["None"]
  155. if ok {
  156. for _, homePage := range defaultHomePages {
  157. // client_region query parameter substitution
  158. sponsorHomePages = append(sponsorHomePages, strings.Replace(homePage.Url, "client_region=XX", "client_region="+clientRegion, 1))
  159. }
  160. }
  161. }
  162. return sponsorHomePages
  163. }
  164. // GetUpgradeClientVersion returns a new client version when an upgrade is
  165. // indicated for the specified client current version. The result is "" when
  166. // no upgrade is available. Caller should normalize clientPlatform.
  167. func (db *Database) GetUpgradeClientVersion(clientVersion, clientPlatform string) string {
  168. db.ReloadableFile.RLock()
  169. defer db.ReloadableFile.RUnlock()
  170. // Check lastest version number against client version number
  171. clientVersions, ok := db.Versions[clientPlatform]
  172. if !ok {
  173. return ""
  174. }
  175. if len(clientVersions) == 0 {
  176. return ""
  177. }
  178. // NOTE: Assumes versions list is in ascending version order
  179. lastVersion := clientVersions[len(clientVersions)-1].Version
  180. lastVersionInt, err := strconv.Atoi(lastVersion)
  181. if err != nil {
  182. return ""
  183. }
  184. clientVersionInt, err := strconv.Atoi(clientVersion)
  185. if err != nil {
  186. return ""
  187. }
  188. // Return latest version if upgrade needed
  189. if lastVersionInt > clientVersionInt {
  190. return lastVersion
  191. }
  192. return ""
  193. }
  194. // GetHttpsRequestRegexes returns bytes transferred stats regexes for the
  195. // specified sponsor. The result is nil when an unknown sponsorID is provided.
  196. func (db *Database) GetHttpsRequestRegexes(sponsorID string) []map[string]string {
  197. db.ReloadableFile.RLock()
  198. defer db.ReloadableFile.RUnlock()
  199. regexes := make([]map[string]string, 0)
  200. for i := range db.Sponsors[sponsorID].HttpsRequestRegexes {
  201. regex := make(map[string]string)
  202. regex["replace"] = db.Sponsors[sponsorID].HttpsRequestRegexes[i].Replace
  203. regex["regex"] = db.Sponsors[sponsorID].HttpsRequestRegexes[i].Regex
  204. regexes = append(regexes, regex)
  205. }
  206. return regexes
  207. }
  208. // DiscoverServers selects new encoded server entries to be "discovered" by
  209. // the client, using the discoveryValue as the input into the discovery algorithm.
  210. // The server list (db.Servers) loaded from JSON is stored as an array instead of
  211. // a map to ensure servers are discovered deterministically. Each iteration over a
  212. // map in go is seeded with a random value which causes non-deterministic ordering.
  213. func (db *Database) DiscoverServers(discoveryValue int) []string {
  214. db.ReloadableFile.RLock()
  215. defer db.ReloadableFile.RUnlock()
  216. var servers []Server
  217. discoveryDate := time.Now().UTC()
  218. candidateServers := make([]Server, 0)
  219. for _, server := range db.Servers {
  220. var start time.Time
  221. var end time.Time
  222. var err error
  223. // All servers that are discoverable on this day are eligable for discovery
  224. if len(server.DiscoveryDateRange) != 0 {
  225. start, err = time.Parse("2006-01-02T15:04:05", server.DiscoveryDateRange[0])
  226. if err != nil {
  227. continue
  228. }
  229. end, err = time.Parse("2006-01-02T15:04:05", server.DiscoveryDateRange[1])
  230. if err != nil {
  231. continue
  232. }
  233. if discoveryDate.After(start) && discoveryDate.Before(end) {
  234. candidateServers = append(candidateServers, server)
  235. }
  236. }
  237. }
  238. servers = selectServers(candidateServers, discoveryValue)
  239. encodedServerEntries := make([]string, 0)
  240. for _, server := range servers {
  241. encodedServerEntries = append(encodedServerEntries, db.getEncodedServerEntry(server))
  242. }
  243. return encodedServerEntries
  244. }
  245. // Combine client IP address and time-of-day strategies to give out different
  246. // discovery servers to different clients. The aim is to achieve defense against
  247. // enumerability. We also want to achieve a degree of load balancing clients
  248. // and these strategies are expected to have reasonably random distribution,
  249. // even for a cluster of users coming from the same network.
  250. //
  251. // We only select one server: multiple results makes enumeration easier; the
  252. // strategies have a built-in load balancing effect; and date range discoverability
  253. // means a client will actually learn more servers later even if they happen to
  254. // always pick the same result at this point.
  255. //
  256. // This is a blended strategy: as long as there are enough servers to pick from,
  257. // both aspects determine which server is selected. IP address is given the
  258. // priority: if there are only a couple of servers, for example, IP address alone
  259. // determines the outcome.
  260. func selectServers(servers []Server, discoveryValue int) []Server {
  261. TIME_GRANULARITY := 3600
  262. if len(servers) == 0 {
  263. return nil
  264. }
  265. // Current time truncated to an hour
  266. timeInSeconds := int(time.Now().Unix())
  267. timeStrategyValue := timeInSeconds / TIME_GRANULARITY
  268. // Divide servers into buckets. The bucket count is chosen such that the number
  269. // of buckets and the number of items in each bucket are close (using sqrt).
  270. // IP address selects the bucket, time selects the item in the bucket.
  271. // NOTE: this code assumes that the range of possible timeStrategyValues
  272. // and discoveryValues are sufficient to index to all bucket items.
  273. bucketCount := calculateBucketCount(len(servers))
  274. buckets := bucketizeServerList(servers, bucketCount)
  275. bucket := buckets[discoveryValue%len(buckets)]
  276. server := bucket[timeStrategyValue%len(bucket)]
  277. serverList := make([]Server, 1)
  278. serverList[0] = server
  279. return serverList
  280. }
  281. // Number of buckets such that first strategy picks among about the same number
  282. // of choices as the second strategy. Gives an edge to the "outer" strategy.
  283. func calculateBucketCount(length int) int {
  284. return int(math.Ceil(math.Sqrt(float64(length))))
  285. }
  286. // Create bucketCount buckets.
  287. // Each bucket will be of size division or divison-1.
  288. func bucketizeServerList(servers []Server, bucketCount int) [][]Server {
  289. division := float64(len(servers)) / float64(bucketCount)
  290. buckets := make([][]Server, bucketCount)
  291. var currentBucketIndex int = 0
  292. var serverIndex int = 0
  293. for _, server := range servers {
  294. bucketEndIndex := int(math.Floor(division * (float64(currentBucketIndex) + 1)))
  295. buckets[currentBucketIndex] = append(buckets[currentBucketIndex], server)
  296. serverIndex++
  297. if serverIndex > bucketEndIndex {
  298. currentBucketIndex++
  299. }
  300. }
  301. return buckets
  302. }
  303. // Return hex encoded server entry string for comsumption by client.
  304. // Newer clients ignore the legacy fields and only utilize the extended (new) config.
  305. func (db *Database) getEncodedServerEntry(server Server) string {
  306. host, hostExists := db.Hosts[server.HostId]
  307. if !hostExists {
  308. return ""
  309. }
  310. // TCS web server certificate has PEM headers and newlines, so strip those now
  311. // for legacy format compatibility
  312. webServerCertificate := server.WebServerCertificate
  313. if host.IsTCS {
  314. splitCert := strings.Split(server.WebServerCertificate, "\n")
  315. if len(splitCert) <= 2 {
  316. webServerCertificate = ""
  317. } else {
  318. webServerCertificate = strings.Join(splitCert[1:len(splitCert)-2], "")
  319. }
  320. }
  321. // Double-check that we're not giving our blank server credentials
  322. if len(server.IpAddress) <= 1 || len(server.WebServerPort) <= 1 || len(server.WebServerSecret) <= 1 || len(webServerCertificate) <= 1 {
  323. return ""
  324. }
  325. // Extended (new) entry fields are in a JSON string
  326. var extendedConfig struct {
  327. IpAddress string
  328. WebServerPort string
  329. WebServerSecret string
  330. WebServerCertificate string
  331. SshPort int
  332. SshUsername string
  333. SshPassword string
  334. SshHostKey string
  335. SshObfuscatedPort int
  336. SshObfuscatedKey string
  337. Region string
  338. MeekCookieEncryptionPublicKey string
  339. MeekObfuscatedKey string
  340. MeekServerPort int
  341. capabilities []string
  342. }
  343. // NOTE: also putting original values in extended config for easier parsing by new clients
  344. extendedConfig.IpAddress = server.IpAddress
  345. extendedConfig.WebServerPort = server.WebServerPort
  346. extendedConfig.WebServerSecret = server.WebServerSecret
  347. extendedConfig.WebServerCertificate = webServerCertificate
  348. sshPort, err := strconv.Atoi(server.SshPort)
  349. if err != nil {
  350. extendedConfig.SshPort = 0
  351. } else {
  352. extendedConfig.SshPort = sshPort
  353. }
  354. extendedConfig.SshUsername = server.SshUsername
  355. extendedConfig.SshPassword = server.SshPassword
  356. sshHostKeyType, sshHostKey := parseSshKeyString(server.SshHostKey)
  357. if strings.Compare(sshHostKeyType, "ssh-rsa") == 0 {
  358. extendedConfig.SshHostKey = sshHostKey
  359. } else {
  360. extendedConfig.SshHostKey = ""
  361. }
  362. extendedConfig.SshObfuscatedPort = server.SshObfuscatedPort
  363. // Use the latest alternate port unless tunneling through meek
  364. if len(server.AlternateSshObfuscatedPorts) > 0 && !server.Capabilities["UNFRONTED-MEEK"] {
  365. port, err := strconv.Atoi(server.AlternateSshObfuscatedPorts[len(server.AlternateSshObfuscatedPorts)-1])
  366. if err == nil {
  367. extendedConfig.SshObfuscatedPort = port
  368. }
  369. }
  370. extendedConfig.SshObfuscatedKey = server.SshObfuscatedKey
  371. extendedConfig.Region = host.Region
  372. extendedConfig.MeekCookieEncryptionPublicKey = host.MeekCookieEncryptionPublicKey
  373. extendedConfig.MeekServerPort = host.MeekServerPort
  374. extendedConfig.MeekObfuscatedKey = host.MeekServerObfuscatedKey
  375. serverCapabilities := make(map[string]bool, 0)
  376. for capability, enabled := range server.Capabilities {
  377. serverCapabilities[capability] = enabled
  378. }
  379. if serverCapabilities["UNFRONTED-MEEK"] && host.MeekServerPort == 443 {
  380. serverCapabilities["UNFRONTED-MEEK"] = false
  381. serverCapabilities["UNFRONTED-MEEK-HTTPS"] = true
  382. }
  383. for capability, enabled := range serverCapabilities {
  384. if enabled == true {
  385. extendedConfig.capabilities = append(extendedConfig.capabilities, capability)
  386. }
  387. }
  388. jsonDump, err := json.Marshal(extendedConfig)
  389. if err != nil {
  390. return ""
  391. }
  392. // Legacy format + extended (new) config
  393. prefixString := fmt.Sprintf("%s %s %s %s ", server.IpAddress, server.WebServerPort, server.WebServerSecret, webServerCertificate)
  394. return hex.EncodeToString(append([]byte(prefixString)[:], []byte(jsonDump)[:]...))
  395. }
  396. // Parse string of format "ssh-key-type ssh-key".
  397. func parseSshKeyString(sshKeyString string) (keyType string, key string) {
  398. sshKeyArr := strings.Split(sshKeyString, " ")
  399. if len(sshKeyArr) != 2 {
  400. return "", ""
  401. }
  402. return sshKeyArr[0], sshKeyArr[1]
  403. }