You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
127 lines
3.1 KiB
Go
127 lines
3.1 KiB
Go
/*
 * Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
|
|
|
package dcgmexporter
|
|
|
|
import (
|
|
"context"
|
|
"net/http"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/gorilla/mux"
|
|
"github.com/sirupsen/logrus"
|
|
)
|
|
|
|
func NewMetricsServer(c *Config, metrics chan string) (*MetricsServer, func(), error) {
|
|
router := mux.NewRouter()
|
|
serverv1 := &MetricsServer{
|
|
server: http.Server{
|
|
Addr: c.Address,
|
|
Handler: router,
|
|
ReadTimeout: 10 * time.Second,
|
|
WriteTimeout: 10 * time.Second,
|
|
},
|
|
metricsChan: metrics,
|
|
metrics: "",
|
|
}
|
|
|
|
router.HandleFunc("/", func(w http.ResponseWriter, r *http.Request) {
|
|
w.Header().Set("X-Content-Type-Options", "nosniff")
|
|
w.WriteHeader(http.StatusOK)
|
|
w.Write([]byte(`<html>
|
|
<head><title>GPU Exporter</title></head>
|
|
<body>
|
|
<h1>GPU Exporter</h1>
|
|
<p><a href="./metrics">Metrics</a></p>
|
|
</body>
|
|
</html>`))
|
|
})
|
|
|
|
router.HandleFunc("/health", serverv1.Health)
|
|
router.HandleFunc("/metrics", serverv1.Metrics)
|
|
|
|
return serverv1, func() {}, nil
|
|
}
|
|
|
|
func (s *MetricsServer) Run(stop chan interface{}, wg *sync.WaitGroup) {
|
|
defer wg.Done()
|
|
|
|
var httpwg sync.WaitGroup
|
|
httpwg.Add(1)
|
|
go func() {
|
|
defer httpwg.Done()
|
|
logrus.Info("Starting webserver")
|
|
if err := s.server.ListenAndServe(); err != nil && err != http.ErrServerClosed {
|
|
logrus.Fatalf("Failed to Listen and Server HTTP server with err: `%v`", err)
|
|
}
|
|
}()
|
|
|
|
httpwg.Add(1)
|
|
go func() {
|
|
defer httpwg.Done()
|
|
for {
|
|
select {
|
|
case <-stop:
|
|
return
|
|
case m := <-s.metricsChan:
|
|
s.updateMetrics(m)
|
|
}
|
|
}
|
|
}()
|
|
|
|
<-stop
|
|
if err := s.server.Shutdown(context.Background()); err != nil {
|
|
logrus.Fatalf("Failed to shutdown HTTP server, with err: `%v`", err)
|
|
}
|
|
|
|
if err := WaitWithTimeout(&httpwg, 3*time.Second); err != nil {
|
|
logrus.Fatalf("Failed waiting for HTTP server to shutdown, with err: `%v`", err)
|
|
}
|
|
}
|
|
|
|
func (s *MetricsServer) Metrics(w http.ResponseWriter, r *http.Request) {
|
|
w.Header().Set("X-Content-Type-Options", "nosniff")
|
|
w.WriteHeader(http.StatusOK)
|
|
w.Write([]byte(s.getMetrics()))
|
|
}
|
|
|
|
func (s *MetricsServer) Health(w http.ResponseWriter, r *http.Request) {
|
|
if s.getMetrics() == "" {
|
|
w.Header().Set("X-Content-Type-Options", "nosniff")
|
|
w.WriteHeader(http.StatusServiceUnavailable)
|
|
w.Write([]byte("KO"))
|
|
} else {
|
|
w.Header().Set("X-Content-Type-Options", "nosniff")
|
|
w.WriteHeader(http.StatusOK)
|
|
w.Write([]byte("OK"))
|
|
}
|
|
}
|
|
|
|
func (s *MetricsServer) updateMetrics(m string) {
|
|
s.Lock()
|
|
defer s.Unlock()
|
|
|
|
s.metrics = m
|
|
}
|
|
|
|
func (s *MetricsServer) getMetrics() string {
|
|
s.Lock()
|
|
defer s.Unlock()
|
|
|
|
return s.metrics
|
|
}
|