mirror of
https://github.com/google/nomulus.git
synced 2025-05-06 15:07:55 +02:00
This originally started as a small change, but quickly grew into a major refactor as I realized the original parameter structure wasn't conducive to a cron task and manual re-runs. The changes are as follows: 1. Adds DNS metrics to activity reports, thanks to Nick's work with the Zoneman Dremel -> #plx workflow. 2. Surrounds registrar names in transactions reports with quotes, to escape possible commas. 3. Factors out the report generation logic into IcannReportingStager. 4. Assigns default values to the three main parameters - yearMonth defaults to the previous month - subdir defaults to "icann/monthly/yearMonth", i.e. "gs://domain-registry-reporting/icann/monthly/yyyy-MM" - reportType defaults to both reports 5. Adds "Total" row generation logic to transactions reports - This was a previously overlooked requirement. 6. Adds "MANIFEST.txt" generation and upload logic. - The MANIFEST lists out which files need to be uploaded in the subdirectory. 7. Increases urlfetch timeout from 5s to 10s in backend tasks. - Backend tasks should be more latency tolerant anyway, and this reduces the number of incorrect timeouts we see for services like Bigquery which might take some time to respond. TESTED=Extensive testing in alpha, and ran FOSS test. TODO: send out an e-mail for report generation and upload, and add reporting to cron.xml ------------- Created by MOE: https://github.com/google/moe MOE_MIGRATED_REVID=172738344
73 lines
2.9 KiB
SQL
73 lines
2.9 KiB
SQL
#standardSQL
|
|
-- Copyright 2017 The Nomulus Authors. All Rights Reserved.
|
|
--
|
|
-- Licensed under the Apache License, Version 2.0 (the "License");
|
|
-- you may not use this file except in compliance with the License.
|
|
-- You may obtain a copy of the License at
|
|
--
|
|
-- http://www.apache.org/licenses/LICENSE-2.0
|
|
--
|
|
-- Unless required by applicable law or agreed to in writing, software
|
|
-- distributed under the License is distributed on an "AS IS" BASIS,
|
|
-- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
-- See the License for the specific language governing permissions and
|
|
-- limitations under the License.
|
|
|
|
-- Determine the number of attempted adds each registrar made.
|
|
|
|
-- Since the specification requests all 'attempted' adds, we regex the
|
|
-- monthly App Engine logs, searching for all create commands and associating
|
|
-- them with their corresponding registrars.
|
|
|
|
-- Example log generated by FlowReporter in App Engine logs:
|
|
--google.registry.flows.FlowReporter
|
|
-- recordToLogs: FLOW-LOG-SIGNATURE-METADATA:
|
|
--{"serverTrid":"oNwL2J2eRya7bh7c9oHIzg==-2360a","clientId":"ipmirror"
|
|
-- ,"commandType":"hello", "resourceType":"","flowClassName":"HelloFlow"
|
|
-- ,"targetId":"","targetIds":[],"tld":"",
|
|
-- "tlds":[],"icannActivityReportField":""}
|
|
|
|
-- Pipeline overview (each step is a named CTE, read top to bottom):
--   1. monthly_request_logs   - request path plus the log messages of every
--                               request in the month's App Engine log tables.
--   2. domain_create_metadata - the JSON metadata payload of each FlowReporter
--                               log line that records a non-prober domain create.
--   3. attempted_adds         - number of such payloads per (tld, clientId).
-- The final SELECT only translates each clientId into its registrar name.
WITH monthly_request_logs AS (
  -- One row per logged request; log_lines collects the logMessage field of
  -- every entry in protoPayload.line.
  SELECT
    protoPayload.resource AS request_path,
    ARRAY(
      SELECT logMessage
      FROM UNNEST(protoPayload.line)
    ) AS log_lines
  FROM
    `domain-registry-alpha.appengine_logs.appengine_googleapis_com_request_log_*`
  -- Both suffix bounds are inclusive.
  WHERE _TABLE_SUFFIX BETWEEN '20170901' AND '20170930'
),

domain_create_metadata AS (
  -- Flatten to one row per log message and keep only the JSON that follows
  -- the FLOW-LOG-SIGNATURE-METADATA marker.
  SELECT
    REGEXP_EXTRACT(log_line, r'FLOW-LOG-SIGNATURE-METADATA: (.*)\n?$')
      AS metadata_json
  FROM monthly_request_logs
  CROSS JOIN UNNEST(log_lines) AS log_line
  WHERE
    -- Only epp and registrar console requests carry the metadata we want.
    request_path IN ('/_dr/epp', '/_dr/epptool', '/registrar-xhr')
    AND STARTS_WITH(log_line, "google.registry.flows.FlowReporter recordToLogs: FLOW-LOG-SIGNATURE-METADATA")
    -- Domain creates only.
    AND REGEXP_CONTAINS(
      log_line, r'"commandType":"create","resourceType":"domain"')
    -- Exclude prober traffic.
    AND NOT REGEXP_CONTAINS(
      log_line, r'"prober-[a-z]{2}-((any)|(canary))"')
),

attempted_adds AS (
  -- COUNT(metadata_json) counts only rows where the payload was extracted
  -- (non-NULL).
  SELECT
    JSON_EXTRACT_SCALAR(metadata_json, '$.tld') AS tld,
    JSON_EXTRACT_SCALAR(metadata_json, '$.clientId') AS client_id,
    COUNT(metadata_json) AS attempt_count
  FROM domain_create_metadata
  GROUP BY tld, client_id
)

-- Inner join: a clientId with no matching Registrar key produces no row.
SELECT
  attempted_adds.tld,
  registrar.registrarName AS registrar_name,
  'ATTEMPTED_ADDS' AS metricName,
  attempted_adds.attempt_count AS metricValue
FROM attempted_adds
INNER JOIN
  `domain-registry-alpha.latest_datastore_export.Registrar` AS registrar
  ON attempted_adds.client_id = registrar.__key__.name
ORDER BY tld, registrar_name
|
|
|