process.go 21 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709
  1. package xray
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "errors"
  6. "fmt"
  7. "os"
  8. "os/exec"
  9. "path/filepath"
  10. "runtime"
  11. "sort"
  12. "strings"
  13. "sync"
  14. "sync/atomic"
  15. "syscall"
  16. "time"
  17. "github.com/mhsanaei/3x-ui/v3/internal/config"
  18. "github.com/mhsanaei/3x-ui/v3/internal/logger"
  19. "github.com/mhsanaei/3x-ui/v3/internal/util/common"
  20. )
  // GetBinaryName builds the Xray executable's filename for the host platform,
  // in the form "xray-<GOOS>-<arch>". The Go architecture name "arm" is spelled
  // "arm32" in the result; every other architecture name is used unchanged.
  func GetBinaryName() string {
  	goarch := runtime.GOARCH
  	switch goarch {
  	case "arm":
  		goarch = "arm32"
  	}
  	name := fmt.Sprintf("xray-%s-%s", runtime.GOOS, goarch)
  	return name
  }
  29. // GetBinaryPath returns the full path to the Xray binary executable.
  30. func GetBinaryPath() string {
  31. return config.GetBinFolderPath() + "/" + GetBinaryName()
  32. }
  33. // GetConfigPath returns the path to the Xray configuration file in the binary folder.
  34. func GetConfigPath() string {
  35. return config.GetBinFolderPath() + "/config.json"
  36. }
  37. // GetGeositePath returns the path to the geosite data file used by Xray.
  38. func GetGeositePath() string {
  39. return config.GetBinFolderPath() + "/geosite.dat"
  40. }
  41. // GetGeoipPath returns the path to the geoip data file used by Xray.
  42. func GetGeoipPath() string {
  43. return config.GetBinFolderPath() + "/geoip.dat"
  44. }
  45. // GetIPLimitLogPath returns the path to the IP limit log file.
  46. func GetIPLimitLogPath() string {
  47. return config.GetLogFolder() + "/3xipl.log"
  48. }
  49. // GetIPLimitBannedLogPath returns the path to the banned IP log file.
  50. func GetIPLimitBannedLogPath() string {
  51. return config.GetLogFolder() + "/3xipl-banned.log"
  52. }
  53. // GetIPLimitBannedPrevLogPath returns the path to the previous banned IP log file.
  54. func GetIPLimitBannedPrevLogPath() string {
  55. return config.GetLogFolder() + "/3xipl-banned.prev.log"
  56. }
  57. // GetAccessPersistentLogPath returns the path to the persistent access log file.
  58. func GetAccessPersistentLogPath() string {
  59. return config.GetLogFolder() + "/3xipl-ap.log"
  60. }
  61. // GetAccessPersistentPrevLogPath returns the path to the previous persistent access log file.
  62. func GetAccessPersistentPrevLogPath() string {
  63. return config.GetLogFolder() + "/3xipl-ap.prev.log"
  64. }
  65. // GetAccessLogPath reads the Xray config and returns the access log file path.
  66. func GetAccessLogPath() (string, error) {
  67. config, err := os.ReadFile(GetConfigPath())
  68. if err != nil {
  69. logger.Warningf("Failed to read configuration file: %s", err)
  70. return "", err
  71. }
  72. jsonConfig := map[string]any{}
  73. err = json.Unmarshal([]byte(config), &jsonConfig)
  74. if err != nil {
  75. logger.Warningf("Failed to parse JSON configuration: %s", err)
  76. return "", err
  77. }
  78. if jsonConfig["log"] != nil {
  79. jsonLog := jsonConfig["log"].(map[string]any)
  80. if jsonLog["access"] != nil {
  81. accessLogPath := jsonLog["access"].(string)
  82. return accessLogPath, nil
  83. }
  84. }
  85. return "", err
  86. }
  87. // stopProcess calls Stop on the given Process instance.
  88. func stopProcess(p *Process) {
  89. p.Stop()
  90. }
  91. // Process wraps an Xray process instance and provides management methods.
  92. type Process struct {
  93. *process
  94. }
  95. // NewProcess creates a new Xray process and sets up cleanup on garbage collection.
  96. func NewProcess(xrayConfig *Config) *Process {
  97. p := &Process{newProcess(xrayConfig)}
  98. runtime.SetFinalizer(p, stopProcess)
  99. return p
  100. }
  101. // NewTestProcess creates a new Xray process that uses a specific config file path.
  102. // Used for test runs (e.g. outbound test) so the main config.json is not overwritten.
  103. // The config file at configPath is removed when the process is stopped.
  104. func NewTestProcess(xrayConfig *Config, configPath string) *Process {
  105. p := &Process{newTestProcess(xrayConfig, configPath)}
  106. runtime.SetFinalizer(p, stopProcess)
  107. return p
  108. }
  109. type process struct {
  110. // mu guards the process lifecycle fields (cmd, done, exitErr) which are
  111. // written by Start/startCommand and the waitForCommand goroutine while being
  112. // read concurrently by IsRunning/GetErr/GetResult/Stop from other goroutines
  113. // (status endpoint, check-xray-running job). Snapshot under the lock, then do
  114. // any blocking syscall (Wait/Signal/Kill) on the local copy without holding it.
  115. mu sync.RWMutex
  116. cmd *exec.Cmd
  117. done chan struct{}
  118. version string
  119. apiPort int
  120. // onlineClients is the set of emails active on THIS panel's own xray
  121. // within the online grace window. It is derived only from local xray
  122. // traffic polls (see RefreshLocalOnline) — never from remote-node
  123. // snapshots — so a client connected solely to a remote node is not
  124. // reported online on local inbounds.
  125. onlineClients []string
  126. // localActiveInbounds is the set of THIS panel's inbound tags that
  127. // carried traffic within the same grace window. Xray's user>>>email
  128. // stat aggregates across every inbound a client is attached to, so an
  129. // online email alone can't say which inbound it actually used. Pairing
  130. // it with the inbound>>>tag stat lets the per-inbound view drop a
  131. // multi-inbound client from inbounds that saw no traffic this window.
  132. localActiveInbounds []string
  133. // localLastOnline records, per email, the last time this panel's own
  134. // xray reported traffic for it. RefreshLocalOnline rebuilds
  135. // onlineClients from this map each tick, keeping the local online set
  136. // independent of the shared client_traffics.last_online column — that
  137. // column is bumped by remote-node syncs too and would otherwise leak
  138. // remote-only clients into the local set.
  139. localLastOnline map[string]int64
  140. // localInboundLastActive mirrors localLastOnline for inbound tags: the
  141. // last tick this panel's xray reported traffic through each tag.
  142. // Rebuilt into localActiveInbounds under the same grace window so the
  143. // two signals stay aligned — an email within grace always has the
  144. // inbound it used within grace too.
  145. localInboundLastActive map[string]int64
  146. // nodeOnlineTrees holds, per direct remote node (keyed by that node's
  147. // panel-local id), the GUID-keyed online-emails subtree that node
  148. // reported — its own clients under its panelGuid plus every descendant
  149. // under theirs. Keying the stored value by GUID (not node id) lets the
  150. // master attribute a deeply nested client to the node that physically
  151. // hosts it across a chain (#4983); the outer node-id key is only so a
  152. // failed probe can drop that whole branch's contribution. NodeTrafficSyncJob
  153. // populates entries per cron tick and clears them when a probe fails. The
  154. // mutex guards this map, onlineClients, and localLastOnline above so the
  155. // online getters never see a torn read.
  156. nodeOnlineTrees map[int]map[string][]string
  157. onlineMu sync.RWMutex
  158. // onlineAPISupport caches whether the running core implements the
  159. // online-stats RPCs (GetUsersStats). A new process is created on every
  160. // restart/version switch, so the flag resets to Unknown and is re-probed
  161. // lazily by the first caller.
  162. onlineAPISupport atomic.Int32
  163. config *Config
  164. configPath string // if set, use this path instead of GetConfigPath() and remove on Stop
  165. logWriter *LogWriter
  166. exitErr error
  167. startTime time.Time
  168. intentionalStop atomic.Bool
  169. }
  // OnlineAPISupport reports whether the running Xray core implements the
  // online-stats API (statsUserOnline + GetUsersStats).
  type OnlineAPISupport int32

  // Possible OnlineAPISupport states. The zero value is OnlineAPIUnknown.
  const (
  	// OnlineAPIUnknown: support has not been probed yet for this process.
  	OnlineAPIUnknown OnlineAPISupport = iota
  	// OnlineAPISupported: the core answered the online-stats RPC.
  	OnlineAPISupported
  	// OnlineAPIUnsupported: the core returned Unimplemented (older binary).
  	OnlineAPIUnsupported
  )
  181. // OnlineAPISupport returns the cached online-stats capability of this process.
  182. func (p *process) OnlineAPISupport() OnlineAPISupport {
  183. return OnlineAPISupport(p.onlineAPISupport.Load())
  184. }
  185. // SetOnlineAPISupport records the probed online-stats capability of this process.
  186. func (p *process) SetOnlineAPISupport(v OnlineAPISupport) {
  187. p.onlineAPISupport.Store(int32(v))
  188. }
  var (
  	// xrayGracefulStopTimeout is how long Stop waits for the process to exit
  	// after sending SIGTERM before it kills the process.
  	xrayGracefulStopTimeout = 5 * time.Second
  	// xrayForceStopTimeout is how long Stop waits for the process to exit
  	// after a kill (or after finding the process already done).
  	xrayForceStopTimeout = 2 * time.Second

  	// OnCrash is invoked when xray crashes unexpectedly. It is set from the
  	// web layer and may be nil.
  	OnCrash func(err error)
  )
  195. // newProcess creates a new internal process struct for Xray.
  196. func newProcess(config *Config) *process {
  197. return &process{
  198. version: "Unknown",
  199. config: config,
  200. logWriter: NewLogWriter(),
  201. startTime: time.Now(),
  202. }
  203. }
  204. // newTestProcess creates a process that writes and runs with a specific config path.
  205. func newTestProcess(config *Config, configPath string) *process {
  206. p := newProcess(config)
  207. p.configPath = configPath
  208. return p
  209. }
  210. // IsRunning returns true if the Xray process is currently running.
  211. func (p *process) IsRunning() bool {
  212. p.mu.RLock()
  213. cmd, done := p.cmd, p.done
  214. p.mu.RUnlock()
  215. if cmd == nil || cmd.Process == nil {
  216. return false
  217. }
  218. // done is closed by the waitForCommand goroutine exactly when cmd.Wait
  219. // returns, i.e. when the process has exited; it is the race-free signal here
  220. // (reading cmd.ProcessState would race with that Wait).
  221. if done != nil {
  222. select {
  223. case <-done:
  224. return false
  225. default:
  226. }
  227. }
  228. return true
  229. }
  230. // GetErr returns the last error encountered by the Xray process.
  231. func (p *process) GetErr() error {
  232. p.mu.RLock()
  233. defer p.mu.RUnlock()
  234. return p.exitErr
  235. }
  236. // GetResult returns the last log line or error from the Xray process.
  237. func (p *process) GetResult() string {
  238. p.mu.RLock()
  239. exitErr := p.exitErr
  240. p.mu.RUnlock()
  241. if len(p.logWriter.lastLine) == 0 && exitErr != nil {
  242. return exitErr.Error()
  243. }
  244. return p.logWriter.lastLine
  245. }
  246. // GetVersion returns the version string of the Xray process.
  247. func (p *process) GetVersion() string {
  248. return p.version
  249. }
  250. // GetAPIPort returns the API port used by the Xray process.
  251. func (p *Process) GetAPIPort() int {
  252. return p.apiPort
  253. }
  254. // GetConfig returns the configuration used by the Xray process.
  255. func (p *Process) GetConfig() *Config {
  256. return p.config
  257. }
  258. // SetConfig replaces the stored configuration snapshot after the running
  259. // process has been reconciled with it through the gRPC API (hot apply), so
  260. // later change detection compares against what is actually running.
  261. func (p *Process) SetConfig(config *Config) {
  262. p.config = config
  263. }
  264. // GetOnlineClients returns the union of locally-online clients and
  265. // node-online clients from every registered remote panel. Dedupes by
  266. // email so a client connected to both a local and a node-managed inbound
  267. // surfaces once. Cheap allocation — typical online sets are small and
  268. // the union is recomputed on demand.
  269. func (p *Process) GetOnlineClients() []string {
  270. p.onlineMu.RLock()
  271. defer p.onlineMu.RUnlock()
  272. if len(p.nodeOnlineTrees) == 0 {
  273. // Hot path for single-panel deployments: avoid the map+dedupe
  274. // work entirely and return the local slice as-is.
  275. return p.onlineClients
  276. }
  277. seen := make(map[string]struct{}, len(p.onlineClients))
  278. out := make([]string, 0, len(p.onlineClients))
  279. add := func(emails []string) {
  280. for _, email := range emails {
  281. if _, dup := seen[email]; dup {
  282. continue
  283. }
  284. seen[email] = struct{}{}
  285. out = append(out, email)
  286. }
  287. }
  288. add(p.onlineClients)
  289. for _, tree := range p.nodeOnlineTrees {
  290. for _, emails := range tree {
  291. add(emails)
  292. }
  293. }
  294. return out
  295. }
  296. // GetLocalOnlineClients returns a copy of the emails online on THIS panel's own
  297. // xray within the grace window. The service layer keys these under the panel's
  298. // own GUID when assembling the per-node online view.
  299. func (p *Process) GetLocalOnlineClients() []string {
  300. p.onlineMu.RLock()
  301. defer p.onlineMu.RUnlock()
  302. if len(p.onlineClients) == 0 {
  303. return nil
  304. }
  305. out := make([]string, len(p.onlineClients))
  306. copy(out, p.onlineClients)
  307. return out
  308. }
  309. // GetMergedNodeTrees returns the union of every direct node's reported subtree,
  310. // keyed by the panelGuid of the node that physically hosts each client set.
  311. // Because each child already reports its descendants under their own GUIDs,
  312. // merging the direct children yields the whole tree at any depth (#4983), so a
  313. // client three hops down is attributed to its real node, not the intermediate
  314. // one. GUIDs are globally unique, but a set reported under the same GUID by more
  315. // than one path is deduped per key; empty sets are omitted.
  316. func (p *Process) GetMergedNodeTrees() map[string][]string {
  317. p.onlineMu.RLock()
  318. defer p.onlineMu.RUnlock()
  319. if len(p.nodeOnlineTrees) == 0 {
  320. return map[string][]string{}
  321. }
  322. out := make(map[string][]string)
  323. seen := make(map[string]map[string]struct{})
  324. for _, tree := range p.nodeOnlineTrees {
  325. for guid, emails := range tree {
  326. if guid == "" || len(emails) == 0 {
  327. continue
  328. }
  329. dedup := seen[guid]
  330. if dedup == nil {
  331. dedup = make(map[string]struct{}, len(emails))
  332. seen[guid] = dedup
  333. }
  334. for _, email := range emails {
  335. if _, ok := dedup[email]; ok {
  336. continue
  337. }
  338. dedup[email] = struct{}{}
  339. out[guid] = append(out[guid], email)
  340. }
  341. }
  342. }
  343. return out
  344. }
  345. // GetLocalActiveInbounds returns a copy of THIS panel's inbound tags that
  346. // carried traffic within the grace window. Only the local xray reports
  347. // per-inbound activity; remote-node snapshots don't carry it, so the service
  348. // layer keys these under the panel's own GUID and a node missing from the
  349. // active-inbounds map means "don't gate" (fall back to the email-only signal).
  350. func (p *Process) GetLocalActiveInbounds() []string {
  351. p.onlineMu.RLock()
  352. defer p.onlineMu.RUnlock()
  353. if len(p.localActiveInbounds) == 0 {
  354. return nil
  355. }
  356. out := make([]string, len(p.localActiveInbounds))
  357. copy(out, p.localActiveInbounds)
  358. return out
  359. }
  360. // RefreshLocalOnline records that each email in activeEmails and each tag in
  361. // activeInboundTags had local xray traffic at now, then rebuilds onlineClients
  362. // and localActiveInbounds from every entry seen within graceMs, pruning older
  363. // ones. Called by the local XrayTrafficJob after each xray gRPC stats poll.
  364. // Pass nil/empty slices to only prune — NodeTrafficSyncJob does this so a
  365. // stopped local xray's clients and inbounds still age out between local polls.
  366. func (p *Process) RefreshLocalOnline(activeEmails, activeInboundTags []string, now, graceMs int64) {
  367. p.onlineMu.Lock()
  368. defer p.onlineMu.Unlock()
  369. if p.localLastOnline == nil {
  370. p.localLastOnline = make(map[string]int64, len(activeEmails))
  371. }
  372. for _, email := range activeEmails {
  373. p.localLastOnline[email] = now
  374. }
  375. online := make([]string, 0, len(p.localLastOnline))
  376. for email, ts := range p.localLastOnline {
  377. if now-ts < graceMs {
  378. online = append(online, email)
  379. } else {
  380. delete(p.localLastOnline, email)
  381. }
  382. }
  383. p.onlineClients = online
  384. if p.localInboundLastActive == nil {
  385. p.localInboundLastActive = make(map[string]int64, len(activeInboundTags))
  386. }
  387. for _, tag := range activeInboundTags {
  388. p.localInboundLastActive[tag] = now
  389. }
  390. activeInbounds := make([]string, 0, len(p.localInboundLastActive))
  391. for tag, ts := range p.localInboundLastActive {
  392. if now-ts < graceMs {
  393. activeInbounds = append(activeInbounds, tag)
  394. } else {
  395. delete(p.localInboundLastActive, tag)
  396. }
  397. }
  398. p.localActiveInbounds = activeInbounds
  399. }
  400. // SetNodeOnlineTree records the GUID-keyed online subtree one direct remote
  401. // node reported (its own clients under its panelGuid plus every descendant
  402. // under theirs). Replaces any previous entry for that node — NodeTrafficSyncJob
  403. // always sends the full subtree per tick.
  404. func (p *Process) SetNodeOnlineTree(nodeID int, tree map[string][]string) {
  405. p.onlineMu.Lock()
  406. defer p.onlineMu.Unlock()
  407. if p.nodeOnlineTrees == nil {
  408. p.nodeOnlineTrees = map[int]map[string][]string{}
  409. }
  410. p.nodeOnlineTrees[nodeID] = tree
  411. }
  412. // ClearNodeOnlineClients drops a direct node's whole subtree contribution.
  413. // Called when a probe fails so a downed node — and everything behind it — doesn't
  414. // keep its clients listed as "online" until the next successful probe.
  415. func (p *Process) ClearNodeOnlineClients(nodeID int) {
  416. p.onlineMu.Lock()
  417. defer p.onlineMu.Unlock()
  418. delete(p.nodeOnlineTrees, nodeID)
  419. }
  420. // GetUptime returns the uptime of the Xray process in seconds.
  421. func (p *Process) GetUptime() uint64 {
  422. return uint64(time.Since(p.startTime).Seconds())
  423. }
  424. // refreshAPIPort updates the API port from the inbound configs.
  425. func (p *process) refreshAPIPort() {
  426. for _, inbound := range p.config.InboundConfigs {
  427. if inbound.Tag == "api" {
  428. p.apiPort = inbound.Port
  429. break
  430. }
  431. }
  432. }
  433. // refreshVersion updates the version string by running the Xray binary with -version.
  434. func (p *process) refreshVersion() {
  435. cmd := exec.Command(GetBinaryPath(), "-version")
  436. data, err := cmd.Output()
  437. if err != nil {
  438. p.version = "Unknown"
  439. } else {
  440. datas := bytes.Split(data, []byte(" "))
  441. if len(datas) <= 1 {
  442. p.version = "Unknown"
  443. } else {
  444. p.version = string(datas[1])
  445. }
  446. }
  447. }
  448. // Start launches the Xray process with the current configuration.
  449. func (p *process) Start() (err error) {
  450. if p.IsRunning() {
  451. return errors.New("xray is already running")
  452. }
  453. defer func() {
  454. if err != nil {
  455. logger.Error("Failure in running xray-core process: ", err)
  456. p.setExitErr(err)
  457. }
  458. }()
  459. data, err := json.MarshalIndent(p.config, "", " ")
  460. if err != nil {
  461. return common.NewErrorf("Failed to generate XRAY configuration files: %v", err)
  462. }
  463. err = os.MkdirAll(config.GetLogFolder(), 0o770)
  464. if err != nil {
  465. logger.Warningf("Failed to create log folder: %s", err)
  466. }
  467. configPath := GetConfigPath()
  468. if p.configPath != "" {
  469. configPath = p.configPath
  470. }
  471. err = os.WriteFile(configPath, data, 0644)
  472. if err != nil {
  473. return common.NewErrorf("Failed to write configuration file: %v", err)
  474. }
  475. cmd := exec.Command(GetBinaryPath(), "-c", configPath)
  476. cmd.Stdout = p.logWriter
  477. cmd.Stderr = p.logWriter
  478. err = p.startCommand(cmd)
  479. if err != nil {
  480. return err
  481. }
  482. p.refreshVersion()
  483. p.refreshAPIPort()
  484. return nil
  485. }
  486. func (p *process) startCommand(cmd *exec.Cmd) error {
  487. p.mu.Lock()
  488. p.cmd = cmd
  489. p.done = make(chan struct{})
  490. p.exitErr = nil
  491. done := p.done
  492. p.mu.Unlock()
  493. p.intentionalStop.Store(false)
  494. if err := cmd.Start(); err != nil {
  495. close(done)
  496. p.mu.Lock()
  497. p.cmd = nil
  498. p.mu.Unlock()
  499. return err
  500. }
  501. attachChildLifetime(cmd)
  502. go p.waitForCommand(cmd, done)
  503. return nil
  504. }
  505. func (p *process) setExitErr(err error) {
  506. p.mu.Lock()
  507. p.exitErr = err
  508. p.mu.Unlock()
  509. }
  510. func (p *process) waitForCommand(cmd *exec.Cmd, done chan struct{}) {
  511. defer close(done)
  512. err := cmd.Wait()
  513. if err == nil || p.intentionalStop.Load() {
  514. return
  515. }
  516. // On Windows, killing the process results in "exit status 1" which isn't an error for us.
  517. if runtime.GOOS == "windows" {
  518. errStr := strings.ToLower(err.Error())
  519. if strings.Contains(errStr, "exit status 1") {
  520. p.setExitErr(err)
  521. return
  522. }
  523. }
  524. logger.Error("Failure in running xray-core:", err)
  525. p.setExitErr(err)
  526. if OnCrash != nil {
  527. OnCrash(err)
  528. }
  529. }
  530. // Stop terminates the running Xray process.
  531. func (p *process) Stop() error {
  532. if !p.IsRunning() {
  533. return errors.New("xray is not running")
  534. }
  535. p.intentionalStop.Store(true)
  536. // Snapshot cmd once, then run the blocking Signal/Kill/Wait on the local copy
  537. // without holding the lock.
  538. p.mu.RLock()
  539. cmd := p.cmd
  540. p.mu.RUnlock()
  541. if cmd == nil || cmd.Process == nil {
  542. return errors.New("xray is not running")
  543. }
  544. // Remove temporary config file used for test runs so main config is never touched
  545. if p.configPath != "" {
  546. if p.configPath != GetConfigPath() {
  547. // Check if file exists before removing
  548. if _, err := os.Stat(p.configPath); err == nil {
  549. _ = os.Remove(p.configPath)
  550. }
  551. }
  552. }
  553. if runtime.GOOS == "windows" {
  554. if err := cmd.Process.Kill(); err != nil && !errors.Is(err, os.ErrProcessDone) {
  555. return err
  556. }
  557. return p.waitForExit(xrayForceStopTimeout)
  558. }
  559. if err := cmd.Process.Signal(syscall.SIGTERM); err != nil {
  560. if errors.Is(err, os.ErrProcessDone) {
  561. return p.waitForExit(xrayForceStopTimeout)
  562. }
  563. return err
  564. }
  565. if err := p.waitForExit(xrayGracefulStopTimeout); err == nil {
  566. return nil
  567. }
  568. logger.Warning("xray-core did not stop after SIGTERM, killing process")
  569. if err := cmd.Process.Kill(); err != nil && !errors.Is(err, os.ErrProcessDone) {
  570. return err
  571. }
  572. return p.waitForExit(xrayForceStopTimeout)
  573. }
  574. func (p *process) waitForExit(timeout time.Duration) error {
  575. p.mu.RLock()
  576. done := p.done
  577. p.mu.RUnlock()
  578. if done == nil {
  579. return nil
  580. }
  581. timer := time.NewTimer(timeout)
  582. defer timer.Stop()
  583. select {
  584. case <-done:
  585. return nil
  586. case <-timer.C:
  587. return common.NewErrorf("timed out waiting for xray-core process to stop after %s", timeout)
  588. }
  589. }
  // Naming and retention settings for crash report files in the log folder.
  const (
  	// crashReportPrefix starts every crash report filename.
  	crashReportPrefix = "core_crash_"
  	// crashReportSuffix ends every crash report filename.
  	crashReportSuffix = ".log"
  	// maxCrashReports is the number of crash reports kept on disk.
  	maxCrashReports = 10
  )
  595. // writeCrashReport persists a captured xray crash chunk to the log folder
  596. // with nanosecond-precision filename so restart-loop bursts don't overwrite
  597. // each other, and prunes old reports to keep the folder bounded.
  598. func writeCrashReport(m []byte) error {
  599. dir := config.GetLogFolder()
  600. if err := os.MkdirAll(dir, 0o770); err != nil {
  601. return err
  602. }
  603. pruneOldCrashReports(dir, maxCrashReports-1)
  604. name := crashReportPrefix + time.Now().Format("20060102_150405_000000000") + crashReportSuffix
  605. return os.WriteFile(filepath.Join(dir, name), m, 0o640)
  606. }
  607. func pruneOldCrashReports(dir string, keep int) {
  608. entries, err := os.ReadDir(dir)
  609. if err != nil {
  610. return
  611. }
  612. var reports []string
  613. for _, e := range entries {
  614. n := e.Name()
  615. if !e.IsDir() && strings.HasPrefix(n, crashReportPrefix) && strings.HasSuffix(n, crashReportSuffix) {
  616. reports = append(reports, n)
  617. }
  618. }
  619. if len(reports) <= keep {
  620. return
  621. }
  622. sort.Strings(reports)
  623. for _, old := range reports[:len(reports)-keep] {
  624. _ = os.Remove(filepath.Join(dir, old))
  625. }
  626. }