master.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344
  1. package command
  2. import (
  3. "context"
  4. "crypto/tls"
  5. "fmt"
  6. "net/http"
  7. "os"
  8. "path"
  9. "strings"
  10. "time"
  11. "github.com/seaweedfs/seaweedfs/weed/util/version"
  12. hashicorpRaft "github.com/hashicorp/raft"
  13. "slices"
  14. "github.com/gorilla/mux"
  15. "github.com/seaweedfs/raft/protobuf"
  16. "github.com/spf13/viper"
  17. "google.golang.org/grpc/reflection"
  18. stats_collect "github.com/seaweedfs/seaweedfs/weed/stats"
  19. "github.com/seaweedfs/seaweedfs/weed/util/grace"
  20. "github.com/seaweedfs/seaweedfs/weed/glog"
  21. "github.com/seaweedfs/seaweedfs/weed/pb"
  22. "github.com/seaweedfs/seaweedfs/weed/pb/master_pb"
  23. "github.com/seaweedfs/seaweedfs/weed/security"
  24. weed_server "github.com/seaweedfs/seaweedfs/weed/server"
  25. "github.com/seaweedfs/seaweedfs/weed/storage/backend"
  26. "github.com/seaweedfs/seaweedfs/weed/util"
  27. )
  28. var (
  29. m MasterOptions
  30. )
  // MasterOptions collects the settings of the "master" command.
  //
  // Every field is a pointer: init points each one at the value of the flag of
  // the corresponding name on cmdMaster, so the fields are only meaningful once
  // those flags have been registered.
  type MasterOptions struct {
  	// Listening ports and addresses.
  	port     *int
  	portGrpc *int
  	ip       *string
  	ipBind   *string

  	// Meta data directory and the list of master peers.
  	metaFolder *string
  	peers      *string

  	// Volume management settings.
  	volumeSizeLimitMB          *uint
  	volumePreallocate          *bool
  	maxParallelVacuumPerServer *int
  	// pulseSeconds *int
  	defaultReplication *string
  	garbageThreshold   *float64

  	// Access control.
  	whiteList   *string
  	disableHttp *bool

  	// Prometheus push gateway settings.
  	metricsAddress     *string
  	metricsIntervalSec *int

  	// Whether the previous raft state is resumed on start.
  	raftResumeState *bool

  	// Prometheus metrics listener.
  	metricsHttpPort *int
  	metricsHttpIp   *string

  	// Raft timing and implementation selection.
  	heartbeatInterval *time.Duration
  	electionTimeout   *time.Duration
  	raftHashicorp     *bool
  	raftBootstrap     *bool

  	// Telemetry reporting.
  	telemetryUrl     *string
  	telemetryEnabled *bool
  }
  58. func init() {
  59. cmdMaster.Run = runMaster // break init cycle
  60. m.port = cmdMaster.Flag.Int("port", 9333, "http listen port")
  61. m.portGrpc = cmdMaster.Flag.Int("port.grpc", 0, "grpc listen port")
  62. m.ip = cmdMaster.Flag.String("ip", util.DetectedHostAddress(), "master <ip>|<server> address, also used as identifier")
  63. m.ipBind = cmdMaster.Flag.String("ip.bind", "", "ip address to bind to. If empty, default to same as -ip option.")
  64. m.metaFolder = cmdMaster.Flag.String("mdir", os.TempDir(), "data directory to store meta data")
  65. m.peers = cmdMaster.Flag.String("peers", "", "all master nodes in comma separated ip:port list, example: 127.0.0.1:9093,127.0.0.1:9094,127.0.0.1:9095")
  66. m.volumeSizeLimitMB = cmdMaster.Flag.Uint("volumeSizeLimitMB", 30*1000, "Master stops directing writes to oversized volumes.")
  67. m.volumePreallocate = cmdMaster.Flag.Bool("volumePreallocate", false, "Preallocate disk space for volumes.")
  68. m.maxParallelVacuumPerServer = cmdMaster.Flag.Int("maxParallelVacuumPerServer", 1, "maximum number of volumes to vacuum in parallel per volume server")
  69. // m.pulseSeconds = cmdMaster.Flag.Int("pulseSeconds", 5, "number of seconds between heartbeats")
  70. m.defaultReplication = cmdMaster.Flag.String("defaultReplication", "", "Default replication type if not specified.")
  71. m.garbageThreshold = cmdMaster.Flag.Float64("garbageThreshold", 0.3, "threshold to vacuum and reclaim spaces")
  72. m.whiteList = cmdMaster.Flag.String("whiteList", "", "comma separated Ip addresses having write permission. No limit if empty.")
  73. m.disableHttp = cmdMaster.Flag.Bool("disableHttp", false, "disable http requests, only gRPC operations are allowed.")
  74. m.metricsAddress = cmdMaster.Flag.String("metrics.address", "", "Prometheus gateway address <host>:<port>")
  75. m.metricsIntervalSec = cmdMaster.Flag.Int("metrics.intervalSeconds", 15, "Prometheus push interval in seconds")
  76. m.metricsHttpPort = cmdMaster.Flag.Int("metricsPort", 0, "Prometheus metrics listen port")
  77. m.metricsHttpIp = cmdMaster.Flag.String("metricsIp", "", "metrics listen ip. If empty, default to same as -ip.bind option.")
  78. m.raftResumeState = cmdMaster.Flag.Bool("resumeState", false, "resume previous state on start master server")
  79. m.heartbeatInterval = cmdMaster.Flag.Duration("heartbeatInterval", 300*time.Millisecond, "heartbeat interval of master servers, and will be randomly multiplied by [1, 1.25)")
  80. m.electionTimeout = cmdMaster.Flag.Duration("electionTimeout", 10*time.Second, "election timeout of master servers")
  81. m.raftHashicorp = cmdMaster.Flag.Bool("raftHashicorp", false, "use hashicorp raft")
  82. m.raftBootstrap = cmdMaster.Flag.Bool("raftBootstrap", false, "Whether to bootstrap the Raft cluster")
  83. m.telemetryUrl = cmdMaster.Flag.String("telemetry.url", "https://telemetry.seaweedfs.com/api/collect", "telemetry server URL to send usage statistics")
  84. m.telemetryEnabled = cmdMaster.Flag.Bool("telemetry", false, "enable telemetry reporting")
  85. }
  86. var cmdMaster = &Command{
  87. UsageLine: "master -port=9333",
  88. Short: "start a master server",
  89. Long: `start a master server to provide volume=>location mapping service and sequence number of file ids
  90. The configuration file "security.toml" is read from ".", "$HOME/.seaweedfs/", "/usr/local/etc/seaweedfs/", or "/etc/seaweedfs/", in that order.
  91. The example security.toml configuration file can be generated by "weed scaffold -config=security"
  92. `,
  93. }
  94. var (
  95. masterCpuProfile = cmdMaster.Flag.String("cpuprofile", "", "cpu profile output file")
  96. masterMemProfile = cmdMaster.Flag.String("memprofile", "", "memory profile output file")
  97. )
  98. func runMaster(cmd *Command, args []string) bool {
  99. util.LoadSecurityConfiguration()
  100. util.LoadConfiguration("master", false)
  101. // bind viper configuration to command line flags
  102. if v := util.GetViper().GetString("master.mdir"); v != "" {
  103. *m.metaFolder = v
  104. }
  105. grace.SetupProfiling(*masterCpuProfile, *masterMemProfile)
  106. parent, _ := util.FullPath(*m.metaFolder).DirAndName()
  107. if util.FileExists(string(parent)) && !util.FileExists(*m.metaFolder) {
  108. os.MkdirAll(*m.metaFolder, 0755)
  109. }
  110. if err := util.TestFolderWritable(util.ResolvePath(*m.metaFolder)); err != nil {
  111. glog.Fatalf("Check Meta Folder (-mdir) Writable %s : %s", *m.metaFolder, err)
  112. }
  113. masterWhiteList := util.StringSplit(*m.whiteList, ",")
  114. if *m.volumeSizeLimitMB > util.VolumeSizeLimitGB*1000 {
  115. glog.Fatalf("volumeSizeLimitMB should be smaller than 30000")
  116. }
  117. switch {
  118. case *m.metricsHttpIp != "":
  119. // noting to do, use m.metricsHttpIp
  120. case *m.ipBind != "":
  121. *m.metricsHttpIp = *m.ipBind
  122. case *m.ip != "":
  123. *m.metricsHttpIp = *m.ip
  124. }
  125. go stats_collect.StartMetricsServer(*m.metricsHttpIp, *m.metricsHttpPort)
  126. go stats_collect.LoopPushingMetric("masterServer", util.JoinHostPort(*m.ip, *m.port), *m.metricsAddress, *m.metricsIntervalSec)
  127. startMaster(m, masterWhiteList)
  128. return true
  129. }
  130. func startMaster(masterOption MasterOptions, masterWhiteList []string) {
  131. backend.LoadConfiguration(util.GetViper())
  132. if *masterOption.portGrpc == 0 {
  133. *masterOption.portGrpc = 10000 + *masterOption.port
  134. }
  135. if *masterOption.ipBind == "" {
  136. *masterOption.ipBind = *masterOption.ip
  137. }
  138. myMasterAddress, peers := checkPeers(*masterOption.ip, *masterOption.port, *masterOption.portGrpc, *masterOption.peers)
  139. masterPeers := make(map[string]pb.ServerAddress)
  140. for _, peer := range peers {
  141. masterPeers[string(peer)] = peer
  142. }
  143. r := mux.NewRouter()
  144. ms := weed_server.NewMasterServer(r, masterOption.toMasterOption(masterWhiteList), masterPeers)
  145. listeningAddress := util.JoinHostPort(*masterOption.ipBind, *masterOption.port)
  146. glog.V(0).Infof("Start Seaweed Master %s at %s", version.Version(), listeningAddress)
  147. masterListener, masterLocalListener, e := util.NewIpAndLocalListeners(*masterOption.ipBind, *masterOption.port, 0)
  148. if e != nil {
  149. glog.Fatalf("Master startup error: %v", e)
  150. }
  151. // start raftServer
  152. metaDir := path.Join(*masterOption.metaFolder, fmt.Sprintf("m%d", *masterOption.port))
  153. raftServerOption := &weed_server.RaftServerOption{
  154. GrpcDialOption: security.LoadClientTLS(util.GetViper(), "grpc.master"),
  155. Peers: masterPeers,
  156. ServerAddr: myMasterAddress,
  157. DataDir: util.ResolvePath(metaDir),
  158. Topo: ms.Topo,
  159. RaftResumeState: *masterOption.raftResumeState,
  160. HeartbeatInterval: *masterOption.heartbeatInterval,
  161. ElectionTimeout: *masterOption.electionTimeout,
  162. RaftBootstrap: *masterOption.raftBootstrap,
  163. }
  164. var raftServer *weed_server.RaftServer
  165. var err error
  166. if *masterOption.raftHashicorp {
  167. if raftServer, err = weed_server.NewHashicorpRaftServer(raftServerOption); err != nil {
  168. glog.Fatalf("NewHashicorpRaftServer: %s", err)
  169. }
  170. } else {
  171. raftServer, err = weed_server.NewRaftServer(raftServerOption)
  172. if raftServer == nil {
  173. glog.Fatalf("please verify %s is writable, see https://github.com/seaweedfs/seaweedfs/issues/717: %s", *masterOption.metaFolder, err)
  174. }
  175. }
  176. ms.SetRaftServer(raftServer)
  177. r.HandleFunc("/cluster/status", raftServer.StatusHandler).Methods(http.MethodGet, http.MethodHead)
  178. r.HandleFunc("/cluster/healthz", raftServer.HealthzHandler).Methods(http.MethodGet, http.MethodHead)
  179. if *masterOption.raftHashicorp {
  180. r.HandleFunc("/raft/stats", raftServer.StatsRaftHandler).Methods(http.MethodGet)
  181. }
  182. // starting grpc server
  183. grpcPort := *masterOption.portGrpc
  184. grpcL, grpcLocalL, err := util.NewIpAndLocalListeners(*masterOption.ipBind, grpcPort, 0)
  185. if err != nil {
  186. glog.Fatalf("master failed to listen on grpc port %d: %v", grpcPort, err)
  187. }
  188. grpcS := pb.NewGrpcServer(security.LoadServerTLS(util.GetViper(), "grpc.master"))
  189. master_pb.RegisterSeaweedServer(grpcS, ms)
  190. if *masterOption.raftHashicorp {
  191. raftServer.TransportManager.Register(grpcS)
  192. } else {
  193. protobuf.RegisterRaftServer(grpcS, raftServer)
  194. }
  195. reflection.Register(grpcS)
  196. glog.V(0).Infof("Start Seaweed Master %s grpc server at %s:%d", version.Version(), *masterOption.ipBind, grpcPort)
  197. if grpcLocalL != nil {
  198. go grpcS.Serve(grpcLocalL)
  199. }
  200. go grpcS.Serve(grpcL)
  201. timeSleep := 1500 * time.Millisecond
  202. if !*masterOption.raftHashicorp {
  203. go func() {
  204. time.Sleep(timeSleep)
  205. ms.Topo.RaftServerAccessLock.RLock()
  206. isEmptyMaster := ms.Topo.RaftServer.Leader() == "" && ms.Topo.RaftServer.IsLogEmpty()
  207. if isEmptyMaster && isTheFirstOne(myMasterAddress, peers) && ms.MasterClient.FindLeaderFromOtherPeers(myMasterAddress) == "" {
  208. raftServer.DoJoinCommand()
  209. }
  210. ms.Topo.RaftServerAccessLock.RUnlock()
  211. }()
  212. }
  213. go ms.MasterClient.KeepConnectedToMaster(context.Background())
  214. // start http server
  215. var (
  216. clientCertFile,
  217. certFile,
  218. keyFile string
  219. )
  220. useTLS := false
  221. useMTLS := false
  222. if viper.GetString("https.master.key") != "" {
  223. useTLS = true
  224. certFile = viper.GetString("https.master.cert")
  225. keyFile = viper.GetString("https.master.key")
  226. }
  227. if viper.GetString("https.master.ca") != "" {
  228. useMTLS = true
  229. clientCertFile = viper.GetString("https.master.ca")
  230. }
  231. if masterLocalListener != nil {
  232. go newHttpServer(r, nil).Serve(masterLocalListener)
  233. }
  234. var tlsConfig *tls.Config
  235. if useMTLS {
  236. tlsConfig = security.LoadClientTLSHTTP(clientCertFile)
  237. security.FixTlsConfig(util.GetViper(), tlsConfig)
  238. }
  239. if useTLS {
  240. go newHttpServer(r, tlsConfig).ServeTLS(masterListener, certFile, keyFile)
  241. } else {
  242. go newHttpServer(r, nil).Serve(masterListener)
  243. }
  244. grace.OnInterrupt(ms.Shutdown)
  245. grace.OnInterrupt(grpcS.Stop)
  246. grace.OnReload(func() {
  247. if ms.Topo.HashicorpRaft != nil && ms.Topo.HashicorpRaft.State() == hashicorpRaft.Leader {
  248. ms.Topo.HashicorpRaft.LeadershipTransfer()
  249. }
  250. })
  251. select {}
  252. }
  253. func checkPeers(masterIp string, masterPort int, masterGrpcPort int, peers string) (masterAddress pb.ServerAddress, cleanedPeers []pb.ServerAddress) {
  254. glog.V(0).Infof("current: %s:%d peers:%s", masterIp, masterPort, peers)
  255. masterAddress = pb.NewServerAddress(masterIp, masterPort, masterGrpcPort)
  256. cleanedPeers = pb.ServerAddresses(peers).ToAddresses()
  257. hasSelf := false
  258. for _, peer := range cleanedPeers {
  259. if peer.ToHttpAddress() == masterAddress.ToHttpAddress() {
  260. hasSelf = true
  261. break
  262. }
  263. }
  264. if !hasSelf {
  265. cleanedPeers = append(cleanedPeers, masterAddress)
  266. }
  267. if len(cleanedPeers)%2 == 0 {
  268. glog.Fatalf("Only odd number of masters are supported: %+v", cleanedPeers)
  269. }
  270. return
  271. }
  272. func isTheFirstOne(self pb.ServerAddress, peers []pb.ServerAddress) bool {
  273. slices.SortFunc(peers, func(a, b pb.ServerAddress) int {
  274. return strings.Compare(string(a), string(b))
  275. })
  276. if len(peers) <= 0 {
  277. return true
  278. }
  279. return self == peers[0]
  280. }
  281. func (m *MasterOptions) toMasterOption(whiteList []string) *weed_server.MasterOption {
  282. masterAddress := pb.NewServerAddress(*m.ip, *m.port, *m.portGrpc)
  283. return &weed_server.MasterOption{
  284. Master: masterAddress,
  285. MetaFolder: *m.metaFolder,
  286. VolumeSizeLimitMB: uint32(*m.volumeSizeLimitMB),
  287. VolumePreallocate: *m.volumePreallocate,
  288. MaxParallelVacuumPerServer: *m.maxParallelVacuumPerServer,
  289. // PulseSeconds: *m.pulseSeconds,
  290. DefaultReplicaPlacement: *m.defaultReplication,
  291. GarbageThreshold: *m.garbageThreshold,
  292. WhiteList: whiteList,
  293. DisableHttp: *m.disableHttp,
  294. MetricsAddress: *m.metricsAddress,
  295. MetricsIntervalSec: *m.metricsIntervalSec,
  296. TelemetryUrl: *m.telemetryUrl,
  297. TelemetryEnabled: *m.telemetryEnabled,
  298. }
  299. }