custom_metrics_stackdriver.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277
  1. /*
  2. Copyright 2017 The Kubernetes Authors.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package monitoring
  14. import (
  15. "context"
  16. "time"
  17. "golang.org/x/oauth2/google"
  18. clientset "k8s.io/client-go/kubernetes"
  19. "github.com/onsi/ginkgo"
  20. metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
  21. instrumentation "k8s.io/kubernetes/test/e2e/instrumentation/common"
  22. gcm "google.golang.org/api/monitoring/v3"
  23. "k8s.io/api/core/v1"
  24. "k8s.io/apimachinery/pkg/labels"
  25. "k8s.io/apimachinery/pkg/runtime/schema"
  26. "k8s.io/apimachinery/pkg/selection"
  27. "k8s.io/client-go/discovery"
  28. cacheddiscovery "k8s.io/client-go/discovery/cached/memory"
  29. "k8s.io/client-go/restmapper"
  30. "k8s.io/kubernetes/test/e2e/framework"
  31. e2elog "k8s.io/kubernetes/test/e2e/framework/log"
  32. customclient "k8s.io/metrics/pkg/client/custom_metrics"
  33. externalclient "k8s.io/metrics/pkg/client/external_metrics"
  34. )
  35. const (
  36. stackdriverExporterPod1 = "stackdriver-exporter-1"
  37. stackdriverExporterPod2 = "stackdriver-exporter-2"
  38. stackdriverExporterLabel = "stackdriver-exporter"
  39. )
  40. var _ = instrumentation.SIGDescribe("Stackdriver Monitoring", func() {
  41. ginkgo.BeforeEach(func() {
  42. framework.SkipUnlessProviderIs("gce", "gke")
  43. })
  44. f := framework.NewDefaultFramework("stackdriver-monitoring")
  45. ginkgo.It("should run Custom Metrics - Stackdriver Adapter for old resource model [Feature:StackdriverCustomMetrics]", func() {
  46. kubeClient := f.ClientSet
  47. config, err := framework.LoadConfig()
  48. if err != nil {
  49. framework.Failf("Failed to load config: %s", err)
  50. }
  51. discoveryClient := discovery.NewDiscoveryClientForConfigOrDie(config)
  52. cachedDiscoClient := cacheddiscovery.NewMemCacheClient(discoveryClient)
  53. restMapper := restmapper.NewDeferredDiscoveryRESTMapper(cachedDiscoClient)
  54. restMapper.Reset()
  55. apiVersionsGetter := customclient.NewAvailableAPIsGetter(discoveryClient)
  56. customMetricsClient := customclient.NewForConfig(config, restMapper, apiVersionsGetter)
  57. testCustomMetrics(f, kubeClient, customMetricsClient, discoveryClient, AdapterForOldResourceModel)
  58. })
  59. ginkgo.It("should run Custom Metrics - Stackdriver Adapter for new resource model [Feature:StackdriverCustomMetrics]", func() {
  60. kubeClient := f.ClientSet
  61. config, err := framework.LoadConfig()
  62. if err != nil {
  63. framework.Failf("Failed to load config: %s", err)
  64. }
  65. discoveryClient := discovery.NewDiscoveryClientForConfigOrDie(config)
  66. cachedDiscoClient := cacheddiscovery.NewMemCacheClient(discoveryClient)
  67. restMapper := restmapper.NewDeferredDiscoveryRESTMapper(cachedDiscoClient)
  68. restMapper.Reset()
  69. apiVersionsGetter := customclient.NewAvailableAPIsGetter(discoveryClient)
  70. customMetricsClient := customclient.NewForConfig(config, restMapper, apiVersionsGetter)
  71. testCustomMetrics(f, kubeClient, customMetricsClient, discoveryClient, AdapterForNewResourceModel)
  72. })
  73. ginkgo.It("should run Custom Metrics - Stackdriver Adapter for external metrics [Feature:StackdriverExternalMetrics]", func() {
  74. kubeClient := f.ClientSet
  75. config, err := framework.LoadConfig()
  76. if err != nil {
  77. framework.Failf("Failed to load config: %s", err)
  78. }
  79. externalMetricsClient := externalclient.NewForConfigOrDie(config)
  80. testExternalMetrics(f, kubeClient, externalMetricsClient)
  81. })
  82. })
  83. func testCustomMetrics(f *framework.Framework, kubeClient clientset.Interface, customMetricsClient customclient.CustomMetricsClient, discoveryClient *discovery.DiscoveryClient, adapterDeployment string) {
  84. projectID := framework.TestContext.CloudConfig.ProjectID
  85. ctx := context.Background()
  86. client, err := google.DefaultClient(ctx, gcm.CloudPlatformScope)
  87. gcmService, err := gcm.New(client)
  88. if err != nil {
  89. framework.Failf("Failed to create gcm service, %v", err)
  90. }
  91. // Set up a cluster: create a custom metric and set up k8s-sd adapter
  92. err = CreateDescriptors(gcmService, projectID)
  93. if err != nil {
  94. framework.Failf("Failed to create metric descriptor: %s", err)
  95. }
  96. defer CleanupDescriptors(gcmService, projectID)
  97. err = CreateAdapter(adapterDeployment)
  98. if err != nil {
  99. framework.Failf("Failed to set up: %s", err)
  100. }
  101. defer CleanupAdapter(adapterDeployment)
  102. _, err = kubeClient.RbacV1().ClusterRoleBindings().Create(HPAPermissions)
  103. if err != nil {
  104. framework.Failf("Failed to create ClusterRoleBindings: %v", err)
  105. }
  106. defer kubeClient.RbacV1().ClusterRoleBindings().Delete(HPAPermissions.Name, &metav1.DeleteOptions{})
  107. // Run application that exports the metric
  108. _, err = createSDExporterPods(f, kubeClient)
  109. if err != nil {
  110. framework.Failf("Failed to create stackdriver-exporter pod: %s", err)
  111. }
  112. defer cleanupSDExporterPod(f, kubeClient)
  113. // Wait a short amount of time to create a pod and export some metrics
  114. // TODO: add some events to wait for instead of fixed amount of time
  115. // i.e. pod creation, first time series exported
  116. time.Sleep(60 * time.Second)
  117. verifyResponsesFromCustomMetricsAPI(f, customMetricsClient, discoveryClient)
  118. }
  119. // TODO(kawych): migrate this test to new resource model
  120. func testExternalMetrics(f *framework.Framework, kubeClient clientset.Interface, externalMetricsClient externalclient.ExternalMetricsClient) {
  121. projectID := framework.TestContext.CloudConfig.ProjectID
  122. ctx := context.Background()
  123. client, err := google.DefaultClient(ctx, gcm.CloudPlatformScope)
  124. gcmService, err := gcm.New(client)
  125. if err != nil {
  126. framework.Failf("Failed to create gcm service, %v", err)
  127. }
  128. // Set up a cluster: create a custom metric and set up k8s-sd adapter
  129. err = CreateDescriptors(gcmService, projectID)
  130. if err != nil {
  131. framework.Failf("Failed to create metric descriptor: %s", err)
  132. }
  133. defer CleanupDescriptors(gcmService, projectID)
  134. // Both deployments - for old and new resource model - expose External Metrics API.
  135. err = CreateAdapter(AdapterForOldResourceModel)
  136. if err != nil {
  137. framework.Failf("Failed to set up: %s", err)
  138. }
  139. defer CleanupAdapter(AdapterForOldResourceModel)
  140. _, err = kubeClient.RbacV1().ClusterRoleBindings().Create(HPAPermissions)
  141. if err != nil {
  142. framework.Failf("Failed to create ClusterRoleBindings: %v", err)
  143. }
  144. defer kubeClient.RbacV1().ClusterRoleBindings().Delete(HPAPermissions.Name, &metav1.DeleteOptions{})
  145. // Run application that exports the metric
  146. pod, err := createSDExporterPods(f, kubeClient)
  147. if err != nil {
  148. framework.Failf("Failed to create stackdriver-exporter pod: %s", err)
  149. }
  150. defer cleanupSDExporterPod(f, kubeClient)
  151. // Wait a short amount of time to create a pod and export some metrics
  152. // TODO: add some events to wait for instead of fixed amount of time
  153. // i.e. pod creation, first time series exported
  154. time.Sleep(60 * time.Second)
  155. verifyResponseFromExternalMetricsAPI(f, externalMetricsClient, pod)
  156. }
  157. func verifyResponsesFromCustomMetricsAPI(f *framework.Framework, customMetricsClient customclient.CustomMetricsClient, discoveryClient *discovery.DiscoveryClient) {
  158. resources, err := discoveryClient.ServerResourcesForGroupVersion("custom.metrics.k8s.io/v1beta1")
  159. if err != nil {
  160. framework.Failf("Failed to retrieve a list of supported metrics: %s", err)
  161. }
  162. if !containsResource(resources.APIResources, "*/custom.googleapis.com|"+CustomMetricName) {
  163. framework.Failf("Metric '%s' expected but not received", CustomMetricName)
  164. }
  165. if !containsResource(resources.APIResources, "*/custom.googleapis.com|"+UnusedMetricName) {
  166. framework.Failf("Metric '%s' expected but not received", UnusedMetricName)
  167. }
  168. value, err := customMetricsClient.NamespacedMetrics(f.Namespace.Name).GetForObject(schema.GroupKind{Group: "", Kind: "Pod"}, stackdriverExporterPod1, CustomMetricName, labels.NewSelector())
  169. if err != nil {
  170. framework.Failf("Failed query: %s", err)
  171. }
  172. if value.Value.Value() != CustomMetricValue {
  173. framework.Failf("Unexpected metric value for metric %s: expected %v but received %v", CustomMetricName, CustomMetricValue, value.Value)
  174. }
  175. filter, err := labels.NewRequirement("name", selection.Equals, []string{stackdriverExporterLabel})
  176. if err != nil {
  177. framework.Failf("Couldn't create a label filter")
  178. }
  179. values, err := customMetricsClient.NamespacedMetrics(f.Namespace.Name).GetForObjects(schema.GroupKind{Group: "", Kind: "Pod"}, labels.NewSelector().Add(*filter), CustomMetricName, labels.NewSelector())
  180. if err != nil {
  181. framework.Failf("Failed query: %s", err)
  182. }
  183. if len(values.Items) != 1 {
  184. framework.Failf("Expected results for exactly 1 pod, but %v results received", len(values.Items))
  185. }
  186. if values.Items[0].DescribedObject.Name != stackdriverExporterPod1 || values.Items[0].Value.Value() != CustomMetricValue {
  187. framework.Failf("Unexpected metric value for metric %s and pod %s: %v", CustomMetricName, values.Items[0].DescribedObject.Name, values.Items[0].Value.Value())
  188. }
  189. }
  190. func containsResource(resourcesList []metav1.APIResource, resourceName string) bool {
  191. for _, resource := range resourcesList {
  192. if resource.Name == resourceName {
  193. return true
  194. }
  195. }
  196. return false
  197. }
  198. func verifyResponseFromExternalMetricsAPI(f *framework.Framework, externalMetricsClient externalclient.ExternalMetricsClient, pod *v1.Pod) {
  199. req1, _ := labels.NewRequirement("resource.type", selection.Equals, []string{"gke_container"})
  200. // It's important to filter out only metrics from the right namespace, since multiple e2e tests
  201. // may run in the same project concurrently. "dummy" is added to test
  202. req2, _ := labels.NewRequirement("resource.labels.pod_id", selection.In, []string{string(pod.UID), "dummy"})
  203. req3, _ := labels.NewRequirement("resource.labels.namespace_id", selection.Exists, []string{})
  204. req4, _ := labels.NewRequirement("resource.labels.zone", selection.NotEquals, []string{"dummy"})
  205. req5, _ := labels.NewRequirement("resource.labels.cluster_name", selection.NotIn, []string{"foo", "bar"})
  206. values, err := externalMetricsClient.
  207. NamespacedMetrics("dummy").
  208. List("custom.googleapis.com|"+CustomMetricName, labels.NewSelector().Add(*req1, *req2, *req3, *req4, *req5))
  209. if err != nil {
  210. framework.Failf("Failed query: %s", err)
  211. }
  212. if len(values.Items) != 1 {
  213. framework.Failf("Expected exactly one external metric value, but % values received", len(values.Items))
  214. }
  215. if values.Items[0].MetricName != "custom.googleapis.com|"+CustomMetricName ||
  216. values.Items[0].Value.Value() != CustomMetricValue ||
  217. // Check one label just to make sure labels are included
  218. values.Items[0].MetricLabels["resource.labels.pod_id"] != string(pod.UID) {
  219. framework.Failf("Unexpected result for metric %s: %v", CustomMetricName, values.Items[0])
  220. }
  221. }
  222. func cleanupSDExporterPod(f *framework.Framework, cs clientset.Interface) {
  223. err := cs.CoreV1().Pods(f.Namespace.Name).Delete(stackdriverExporterPod1, &metav1.DeleteOptions{})
  224. if err != nil {
  225. e2elog.Logf("Failed to delete %s pod: %v", stackdriverExporterPod1, err)
  226. }
  227. err = cs.CoreV1().Pods(f.Namespace.Name).Delete(stackdriverExporterPod2, &metav1.DeleteOptions{})
  228. if err != nil {
  229. e2elog.Logf("Failed to delete %s pod: %v", stackdriverExporterPod2, err)
  230. }
  231. }
  232. func createSDExporterPods(f *framework.Framework, cs clientset.Interface) (*v1.Pod, error) {
  233. pod, err := cs.CoreV1().Pods(f.Namespace.Name).Create(StackdriverExporterPod(stackdriverExporterPod1, f.Namespace.Name, stackdriverExporterLabel, CustomMetricName, CustomMetricValue))
  234. if err != nil {
  235. return nil, err
  236. }
  237. _, err = cs.CoreV1().Pods(f.Namespace.Name).Create(StackdriverExporterPod(stackdriverExporterPod2, f.Namespace.Name, stackdriverExporterLabel, UnusedMetricName, UnusedMetricValue))
  238. return pod, err
  239. }