mirror of
https://git.mirrors.martin98.com/https://github.com/SigNoz/signoz
synced 2025-06-04 11:25:52 +08:00
533 lines
14 KiB
Go
533 lines
14 KiB
Go
package app
|
|
|
|
import (
|
|
"bytes"
|
|
"context"
|
|
"encoding/json"
|
|
"fmt"
|
|
"io/ioutil"
|
|
"net"
|
|
"net/http"
|
|
_ "net/http/pprof" // http profiler
|
|
"os"
|
|
"time"
|
|
|
|
"github.com/gorilla/handlers"
|
|
"github.com/gorilla/mux"
|
|
"github.com/jmoiron/sqlx"
|
|
|
|
"github.com/rs/cors"
|
|
"github.com/soheilhy/cmux"
|
|
"go.signoz.io/signoz/pkg/query-service/agentConf"
|
|
"go.signoz.io/signoz/pkg/query-service/app/clickhouseReader"
|
|
"go.signoz.io/signoz/pkg/query-service/app/dashboards"
|
|
opamp "go.signoz.io/signoz/pkg/query-service/app/opamp"
|
|
opAmpModel "go.signoz.io/signoz/pkg/query-service/app/opamp/model"
|
|
|
|
"go.signoz.io/signoz/pkg/query-service/app/explorer"
|
|
"go.signoz.io/signoz/pkg/query-service/auth"
|
|
"go.signoz.io/signoz/pkg/query-service/constants"
|
|
"go.signoz.io/signoz/pkg/query-service/dao"
|
|
"go.signoz.io/signoz/pkg/query-service/featureManager"
|
|
"go.signoz.io/signoz/pkg/query-service/healthcheck"
|
|
am "go.signoz.io/signoz/pkg/query-service/integrations/alertManager"
|
|
"go.signoz.io/signoz/pkg/query-service/interfaces"
|
|
"go.signoz.io/signoz/pkg/query-service/model"
|
|
pqle "go.signoz.io/signoz/pkg/query-service/pqlEngine"
|
|
"go.signoz.io/signoz/pkg/query-service/rules"
|
|
"go.signoz.io/signoz/pkg/query-service/telemetry"
|
|
"go.signoz.io/signoz/pkg/query-service/utils"
|
|
"go.uber.org/zap"
|
|
)
|
|
|
|
// ServerOptions carries the settings that NewServer and Start read when
// building and running the query service.
type ServerOptions struct {
	// PromConfigPath is passed to the ClickHouse reader and to makeRulesManager.
	PromConfigPath string
	// HTTPHostPort is the address the public HTTP listener binds to.
	HTTPHostPort string
	// PrivateHostPort is the address the private HTTP listener binds to.
	PrivateHostPort string

	// Alerting-specific settings.

	// DisableRules, when true, makes Start skip starting the rule manager.
	DisableRules bool
	// RuleRepoURL is forwarded to the rules manager as its RepoURL.
	RuleRepoURL string
}
|
|
|
|
// Server runs HTTP, Mux and a grpc server
|
|
type Server struct {
|
|
// logger *zap.Logger
|
|
// tracer opentracing.Tracer // TODO make part of flags.Service
|
|
serverOptions *ServerOptions
|
|
conn net.Listener
|
|
ruleManager *rules.Manager
|
|
separatePorts bool
|
|
|
|
// public http router
|
|
httpConn net.Listener
|
|
httpServer *http.Server
|
|
|
|
// private http
|
|
privateConn net.Listener
|
|
privateHTTP *http.Server
|
|
|
|
unavailableChannel chan healthcheck.Status
|
|
}
|
|
|
|
// HealthCheckStatus returns health check status channel a client can subscribe to
|
|
func (s Server) HealthCheckStatus() chan healthcheck.Status {
|
|
return s.unavailableChannel
|
|
}
|
|
|
|
// NewServer creates and initializes Server
|
|
func NewServer(serverOptions *ServerOptions) (*Server, error) {
|
|
|
|
if err := dao.InitDao("sqlite", constants.RELATIONAL_DATASOURCE_PATH); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
localDB, err := dashboards.InitDB(constants.RELATIONAL_DATASOURCE_PATH)
|
|
explorer.InitWithDSN(constants.RELATIONAL_DATASOURCE_PATH)
|
|
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
localDB.SetMaxOpenConns(10)
|
|
|
|
// initiate feature manager
|
|
fm := featureManager.StartManager()
|
|
|
|
readerReady := make(chan bool)
|
|
|
|
var reader interfaces.Reader
|
|
storage := os.Getenv("STORAGE")
|
|
if storage == "clickhouse" {
|
|
zap.S().Info("Using ClickHouse as datastore ...")
|
|
clickhouseReader := clickhouseReader.NewReader(localDB, serverOptions.PromConfigPath, fm)
|
|
go clickhouseReader.Start(readerReady)
|
|
reader = clickhouseReader
|
|
} else {
|
|
return nil, fmt.Errorf("Storage type: %s is not supported in query service", storage)
|
|
}
|
|
|
|
<-readerReady
|
|
rm, err := makeRulesManager(serverOptions.PromConfigPath, constants.GetAlertManagerApiPrefix(), serverOptions.RuleRepoURL, localDB, reader, serverOptions.DisableRules)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
telemetry.GetInstance().SetReader(reader)
|
|
apiHandler, err := NewAPIHandler(APIHandlerOpts{
|
|
Reader: reader,
|
|
AppDao: dao.DB(),
|
|
RuleManager: rm,
|
|
FeatureFlags: fm,
|
|
})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
s := &Server{
|
|
// logger: logger,
|
|
// tracer: tracer,
|
|
ruleManager: rm,
|
|
serverOptions: serverOptions,
|
|
unavailableChannel: make(chan healthcheck.Status),
|
|
}
|
|
|
|
httpServer, err := s.createPublicServer(apiHandler)
|
|
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
s.httpServer = httpServer
|
|
|
|
privateServer, err := s.createPrivateServer(apiHandler)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
s.privateHTTP = privateServer
|
|
|
|
_, err = opAmpModel.InitDB(constants.RELATIONAL_DATASOURCE_PATH)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
if err := agentConf.Initiate(localDB, "sqlite"); err != nil {
|
|
return nil, err
|
|
}
|
|
return s, nil
|
|
}
|
|
|
|
func (s *Server) createPrivateServer(api *APIHandler) (*http.Server, error) {
|
|
|
|
r := NewRouter()
|
|
|
|
r.Use(setTimeoutMiddleware)
|
|
r.Use(s.analyticsMiddleware)
|
|
r.Use(loggingMiddlewarePrivate)
|
|
|
|
api.RegisterPrivateRoutes(r)
|
|
|
|
c := cors.New(cors.Options{
|
|
//todo(amol): find out a way to add exact domain or
|
|
// ip here for alert manager
|
|
AllowedOrigins: []string{"*"},
|
|
AllowedMethods: []string{"GET", "DELETE", "POST", "PUT", "PATCH"},
|
|
AllowedHeaders: []string{"Accept", "Authorization", "Content-Type"},
|
|
})
|
|
|
|
handler := c.Handler(r)
|
|
handler = handlers.CompressHandler(handler)
|
|
|
|
return &http.Server{
|
|
Handler: handler,
|
|
}, nil
|
|
}
|
|
|
|
func (s *Server) createPublicServer(api *APIHandler) (*http.Server, error) {
|
|
|
|
r := NewRouter()
|
|
|
|
r.Use(setTimeoutMiddleware)
|
|
r.Use(s.analyticsMiddleware)
|
|
r.Use(loggingMiddleware)
|
|
|
|
am := NewAuthMiddleware(auth.GetUserFromRequest)
|
|
|
|
api.RegisterRoutes(r, am)
|
|
api.RegisterMetricsRoutes(r, am)
|
|
api.RegisterLogsRoutes(r, am)
|
|
api.RegisterQueryRangeV3Routes(r, am)
|
|
|
|
c := cors.New(cors.Options{
|
|
AllowedOrigins: []string{"*"},
|
|
AllowedMethods: []string{"GET", "DELETE", "POST", "PUT", "PATCH", "OPTIONS"},
|
|
AllowedHeaders: []string{"Accept", "Authorization", "Content-Type", "cache-control"},
|
|
})
|
|
|
|
handler := c.Handler(r)
|
|
|
|
handler = handlers.CompressHandler(handler)
|
|
|
|
return &http.Server{
|
|
Handler: handler,
|
|
}, nil
|
|
}
|
|
|
|
// loggingMiddleware is used for logging public api calls
|
|
func loggingMiddleware(next http.Handler) http.Handler {
|
|
return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
|
route := mux.CurrentRoute(r)
|
|
path, _ := route.GetPathTemplate()
|
|
startTime := time.Now()
|
|
next.ServeHTTP(w, r)
|
|
zap.S().Info(path, "\ttimeTaken: ", time.Now().Sub(startTime))
|
|
})
|
|
}
|
|
|
|
// loggingMiddlewarePrivate is used for logging private api calls
|
|
// from internal services like alert manager
|
|
func loggingMiddlewarePrivate(next http.Handler) http.Handler {
|
|
return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
|
route := mux.CurrentRoute(r)
|
|
path, _ := route.GetPathTemplate()
|
|
startTime := time.Now()
|
|
next.ServeHTTP(w, r)
|
|
zap.S().Info(path, "\tprivatePort: true", "\ttimeTaken: ", time.Now().Sub(startTime))
|
|
})
|
|
}
|
|
|
|
// loggingResponseWriter wraps an http.ResponseWriter and remembers the status
// code written through it so middleware can report it after the handler ran.
type loggingResponseWriter struct {
	http.ResponseWriter
	statusCode int
}

// NewLoggingResponseWriter wraps w in a loggingResponseWriter.
func NewLoggingResponseWriter(w http.ResponseWriter) *loggingResponseWriter {
	// WriteHeader(int) is not called if our response implicitly returns 200 OK, so
	// we default to that status code.
	return &loggingResponseWriter{ResponseWriter: w, statusCode: http.StatusOK}
}

// WriteHeader records code and forwards it to the wrapped writer.
func (lrw *loggingResponseWriter) WriteHeader(code int) {
	lrw.statusCode = code
	lrw.ResponseWriter.WriteHeader(code)
}

// Flush implements the http.Flusher interface. It forwards to the wrapped
// writer when that writer supports flushing and is a no-op otherwise, instead
// of panicking on a failed type assertion.
func (lrw *loggingResponseWriter) Flush() {
	if flusher, ok := lrw.ResponseWriter.(http.Flusher); ok {
		flusher.Flush()
	}
}
|
|
func extractDashboardMetaData(path string, r *http.Request) (map[string]interface{}, bool) {
|
|
pathToExtractBodyFrom := "/api/v2/metrics/query_range"
|
|
|
|
data := map[string]interface{}{}
|
|
var postData *model.QueryRangeParamsV2
|
|
|
|
if path == pathToExtractBodyFrom && (r.Method == "POST") {
|
|
if r.Body != nil {
|
|
bodyBytes, err := ioutil.ReadAll(r.Body)
|
|
if err != nil {
|
|
return nil, false
|
|
}
|
|
r.Body.Close() // must close
|
|
r.Body = ioutil.NopCloser(bytes.NewBuffer(bodyBytes))
|
|
json.Unmarshal(bodyBytes, &postData)
|
|
|
|
} else {
|
|
return nil, false
|
|
}
|
|
|
|
} else {
|
|
return nil, false
|
|
}
|
|
|
|
signozMetricNotFound := false
|
|
|
|
if postData != nil {
|
|
signozMetricNotFound = telemetry.GetInstance().CheckSigNozMetricsV2(postData.CompositeMetricQuery)
|
|
|
|
if postData.CompositeMetricQuery != nil {
|
|
data["queryType"] = postData.CompositeMetricQuery.QueryType
|
|
data["panelType"] = postData.CompositeMetricQuery.PanelType
|
|
}
|
|
|
|
data["datasource"] = postData.DataSource
|
|
}
|
|
|
|
if signozMetricNotFound {
|
|
telemetry.GetInstance().AddActiveMetricsUser()
|
|
telemetry.GetInstance().SendEvent(telemetry.TELEMETRY_EVENT_DASHBOARDS_METADATA, data, true)
|
|
}
|
|
|
|
return data, true
|
|
}
|
|
|
|
func getActiveLogs(path string, r *http.Request) {
|
|
// if path == "/api/v1/dashboards/{uuid}" {
|
|
// telemetry.GetInstance().AddActiveMetricsUser()
|
|
// }
|
|
if path == "/api/v1/logs" {
|
|
hasFilters := len(r.URL.Query().Get("q"))
|
|
if hasFilters > 0 {
|
|
telemetry.GetInstance().AddActiveLogsUser()
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
func (s *Server) analyticsMiddleware(next http.Handler) http.Handler {
|
|
return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
|
route := mux.CurrentRoute(r)
|
|
path, _ := route.GetPathTemplate()
|
|
|
|
dashboardMetadata, metadataExists := extractDashboardMetaData(path, r)
|
|
getActiveLogs(path, r)
|
|
|
|
lrw := NewLoggingResponseWriter(w)
|
|
next.ServeHTTP(lrw, r)
|
|
|
|
data := map[string]interface{}{"path": path, "statusCode": lrw.statusCode}
|
|
if metadataExists {
|
|
for key, value := range dashboardMetadata {
|
|
data[key] = value
|
|
}
|
|
}
|
|
|
|
// if telemetry.GetInstance().IsSampled() {
|
|
if _, ok := telemetry.IgnoredPaths()[path]; !ok {
|
|
telemetry.GetInstance().SendEvent(telemetry.TELEMETRY_EVENT_PATH, data)
|
|
}
|
|
// }
|
|
|
|
})
|
|
}
|
|
|
|
func setTimeoutMiddleware(next http.Handler) http.Handler {
|
|
return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
|
ctx := r.Context()
|
|
var cancel context.CancelFunc
|
|
// check if route is not excluded
|
|
url := r.URL.Path
|
|
if _, ok := constants.TimeoutExcludedRoutes[url]; !ok {
|
|
ctx, cancel = context.WithTimeout(r.Context(), constants.ContextTimeout)
|
|
defer cancel()
|
|
}
|
|
|
|
r = r.WithContext(ctx)
|
|
next.ServeHTTP(w, r)
|
|
})
|
|
}
|
|
|
|
// initListeners initialises listeners of the server
|
|
func (s *Server) initListeners() error {
|
|
// listen on public port
|
|
var err error
|
|
publicHostPort := s.serverOptions.HTTPHostPort
|
|
if publicHostPort == "" {
|
|
return fmt.Errorf("constants.HTTPHostPort is required")
|
|
}
|
|
|
|
s.httpConn, err = net.Listen("tcp", publicHostPort)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
zap.S().Info(fmt.Sprintf("Query server started listening on %s...", s.serverOptions.HTTPHostPort))
|
|
|
|
// listen on private port to support internal services
|
|
privateHostPort := s.serverOptions.PrivateHostPort
|
|
|
|
if privateHostPort == "" {
|
|
return fmt.Errorf("constants.PrivateHostPort is required")
|
|
}
|
|
|
|
s.privateConn, err = net.Listen("tcp", privateHostPort)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
zap.S().Info(fmt.Sprintf("Query server started listening on private port %s...", s.serverOptions.PrivateHostPort))
|
|
|
|
return nil
|
|
}
|
|
|
|
// Start listening on http and private http port concurrently
|
|
func (s *Server) Start() error {
|
|
|
|
// initiate rule manager first
|
|
if !s.serverOptions.DisableRules {
|
|
s.ruleManager.Start()
|
|
} else {
|
|
zap.S().Info("msg: Rules disabled as rules.disable is set to TRUE")
|
|
}
|
|
|
|
err := s.initListeners()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
var httpPort int
|
|
if port, err := utils.GetPort(s.httpConn.Addr()); err == nil {
|
|
httpPort = port
|
|
}
|
|
|
|
go func() {
|
|
zap.S().Info("Starting HTTP server", zap.Int("port", httpPort), zap.String("addr", s.serverOptions.HTTPHostPort))
|
|
|
|
switch err := s.httpServer.Serve(s.httpConn); err {
|
|
case nil, http.ErrServerClosed, cmux.ErrListenerClosed:
|
|
// normal exit, nothing to do
|
|
default:
|
|
zap.S().Error("Could not start HTTP server", zap.Error(err))
|
|
}
|
|
s.unavailableChannel <- healthcheck.Unavailable
|
|
}()
|
|
|
|
go func() {
|
|
zap.S().Info("Starting pprof server", zap.String("addr", constants.DebugHttpPort))
|
|
|
|
err = http.ListenAndServe(constants.DebugHttpPort, nil)
|
|
if err != nil {
|
|
zap.S().Error("Could not start pprof server", zap.Error(err))
|
|
}
|
|
}()
|
|
|
|
var privatePort int
|
|
if port, err := utils.GetPort(s.privateConn.Addr()); err == nil {
|
|
privatePort = port
|
|
}
|
|
fmt.Println("starting private http")
|
|
go func() {
|
|
zap.S().Info("Starting Private HTTP server", zap.Int("port", privatePort), zap.String("addr", s.serverOptions.PrivateHostPort))
|
|
|
|
switch err := s.privateHTTP.Serve(s.privateConn); err {
|
|
case nil, http.ErrServerClosed, cmux.ErrListenerClosed:
|
|
// normal exit, nothing to do
|
|
zap.S().Info("private http server closed")
|
|
default:
|
|
zap.S().Error("Could not start private HTTP server", zap.Error(err))
|
|
}
|
|
|
|
s.unavailableChannel <- healthcheck.Unavailable
|
|
|
|
}()
|
|
|
|
go func() {
|
|
zap.S().Info("Starting OpAmp Websocket server", zap.String("addr", constants.OpAmpWsEndpoint))
|
|
err := opamp.InitalizeServer(constants.OpAmpWsEndpoint, &opAmpModel.AllAgents)
|
|
if err != nil {
|
|
zap.S().Info("opamp ws server failed to start", err)
|
|
s.unavailableChannel <- healthcheck.Unavailable
|
|
}
|
|
}()
|
|
|
|
return nil
|
|
}
|
|
|
|
func (s *Server) Stop() error {
|
|
if s.httpServer != nil {
|
|
if err := s.httpServer.Shutdown(context.Background()); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
if s.privateHTTP != nil {
|
|
if err := s.privateHTTP.Shutdown(context.Background()); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
opamp.StopServer()
|
|
|
|
if s.ruleManager != nil {
|
|
s.ruleManager.Stop()
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func makeRulesManager(
|
|
promConfigPath,
|
|
alertManagerURL string,
|
|
ruleRepoURL string,
|
|
db *sqlx.DB,
|
|
ch interfaces.Reader,
|
|
disableRules bool) (*rules.Manager, error) {
|
|
|
|
// create engine
|
|
pqle, err := pqle.FromReader(ch)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to create pql engine : %v", err)
|
|
}
|
|
|
|
// notifier opts
|
|
notifierOpts := am.NotifierOptions{
|
|
QueueCapacity: 10000,
|
|
Timeout: 1 * time.Second,
|
|
AlertManagerURLs: []string{alertManagerURL},
|
|
}
|
|
|
|
// create manager opts
|
|
managerOpts := &rules.ManagerOptions{
|
|
NotifierOpts: notifierOpts,
|
|
Queriers: &rules.Queriers{
|
|
PqlEngine: pqle,
|
|
Ch: ch.GetConn(),
|
|
},
|
|
RepoURL: ruleRepoURL,
|
|
DBConn: db,
|
|
Context: context.Background(),
|
|
Logger: nil,
|
|
DisableRules: disableRules,
|
|
}
|
|
|
|
// create Manager
|
|
manager, err := rules.NewManager(managerOpts)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("rule manager error: %v", err)
|
|
}
|
|
|
|
zap.S().Info("rules manager is ready")
|
|
|
|
return manager, nil
|
|
}
|