pebble/tools/crash_stats.py

241 lines
9.1 KiB
Python
Raw Permalink Normal View History

#!/usr/bin/env python
# Copyright 2024 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import argparse
import csv
import logging
import os
import requests
import requests_oauthlib
import subprocess
from collections import OrderedDict
from triage import download_path, load_user_settings, download_elf_by_sw_hw_version
def crash_analytic_path(fw_version):
    """Return the local cache directory for reboot-reason data for *fw_version*."""
    folder_name = "%s_reboot_reasons" % fw_version
    return os.path.join(download_path(), folder_name)
def run_td_query_on_event_analytics(fw_version, error_code):
    """Query Treasure Data event analytics for crash link-registers.

    Groups the last 30 days of crash events for the given firmware version and
    crash code by link register and hardware revision, writing the result to a
    CSV file under the crash-analytics cache directory.

    Returns a (retval, output_csv_file) tuple, where retval is the exit status
    of the `td` command (0 on success).
    """
    # Consistency fix: perform the same td-toolbelt availability check as
    # run_td_query_on_hourly_analytics so both entry points fail the same way.
    if (subprocess.call("type td", shell=True,
                        stdout=subprocess.PIPE, stderr=subprocess.PIPE) != 0):
        logging.error("You need to install the td toolbelt for this query to work!\n"
                      "Please see http://docs.treasuredata.com/articles/command-"
                      "line#step-1-installation-amp-update")
        exit(0)
    query = """
    SELECT
      data_0_device_event_0_crash_report_0_link_register AS data_0_remote_device_0_system_crash_lr,
      device_0_remote_device_0_hw_version,
      COUNT(data_0_device_event_0_crash_report_0_crash_code) AS crash_count,
      device_0_remote_device_0_firmware_description_0_version_0_firmware_0_fw_version
    FROM
      remote_device_events
    WHERE
      device_0_remote_device_0_firmware_description_0_version_0_firmware_0_fw_version = '%s'
      AND data_0_device_event_0_event_enum = 10
      AND data_0_device_event_0_crash_report_0_crash_code = %d
      AND TD_TIME_RANGE(time, TD_TIME_ADD(TD_SCHEDULED_TIME(), '-30d'), TD_SCHEDULED_TIME())
    GROUP BY
      data_0_device_event_0_crash_report_0_crash_code,
      data_0_device_event_0_crash_report_0_link_register,
      device_0_remote_device_0_hw_version,
      device_0_remote_device_0_firmware_description_0_version_0_firmware_0_fw_version
    ORDER BY
      COUNT(data_0_device_event_0_crash_report_0_link_register) DESC,
      device_0_remote_device_0_hw_version
    """ % (fw_version, error_code)
    logging.debug(query)
    logging.info("Running TD query!")
    path = crash_analytic_path(fw_version)
    if not os.path.exists(path):
        os.makedirs(path)
    output_csv_file = crash_analytic_path(fw_version) + "/0x%x-crashcodes.csv" % error_code
    # NOTE(review): fw_version/output path are interpolated into a shell string;
    # acceptable for a developer tool fed from argv, but not for untrusted input.
    cmd = 'td query -d pebble_restricted -P 2 -T presto -c -f csv -w -o %s "%s"' % (output_csv_file, query)
    p = subprocess.Popen(cmd, shell=True, stdout=subprocess.PIPE, stderr=subprocess.STDOUT)
    retval = p.wait()
    logging.info("Query Complete, Result = %d" % retval)
    # BUG FIX: previously hard-coded `return 0, ...`, so callers checking
    # `retval != 0` could never detect a failed query. Propagate the real status.
    return retval, output_csv_file
def run_td_query_on_hourly_analytics(fw_version, error_code):
    """Query Treasure Data hourly analytics for crash link-registers.

    Groups the last 30 days of system crash samples for the given firmware
    version and crash code by link register and hardware revision, writing the
    result to a CSV file under the crash-analytics cache directory.

    Returns a (retval, output_csv_file) tuple, where retval is the exit status
    of the `td` command (0 on success).
    """
    if (subprocess.call("type td", shell=True,
                        stdout=subprocess.PIPE, stderr=subprocess.PIPE) != 0):
        logging.error("You need to install the td toolbelt for this query to work!\n"
                      "Please see http://docs.treasuredata.com/articles/command-"
                      "line#step-1-installation-amp-update")
        exit(0)
    query = """
    SELECT
      data_0_remote_device_0_system_crash_lr,
      device_0_remote_device_0_hw_version,
      COUNT(data_0_remote_device_0_system_crashed_code) AS crash_count,
      device_0_remote_device_0_firmware_description_0_version_0_firmware_0_fw_version
    FROM
      remote_device_system_metrics
    WHERE
      device_0_remote_device_0_firmware_description_0_version_0_firmware_0_fw_version = '%s'
      AND data_0_remote_device_0_system_crashed_code=%d
      AND TD_TIME_RANGE(time, TD_TIME_ADD(TD_SCHEDULED_TIME(), '-30d'), TD_SCHEDULED_TIME())
    GROUP BY
      data_0_remote_device_0_system_crashed_code,
      data_0_remote_device_0_system_crash_lr,
      device_0_remote_device_0_hw_version,
      device_0_remote_device_0_firmware_description_0_version_0_firmware_0_fw_version
    ORDER BY
      COUNT(data_0_remote_device_0_system_crash_lr) DESC,
      device_0_remote_device_0_hw_version DESC
    """ % (fw_version, error_code)
    logging.debug(query)
    logging.info("Running TD query!")
    path = crash_analytic_path(fw_version)
    if not os.path.exists(path):
        os.makedirs(path)
    output_csv_file = crash_analytic_path(fw_version) + "/0x%x-crashcodes.csv" % error_code
    cmd = 'td query -d pebble_restricted -P 2 -T presto -c -f csv -w -o %s "%s"' % (output_csv_file, query)
    p = subprocess.Popen(cmd, shell=True, stdout=subprocess.PIPE, stderr=subprocess.STDOUT)
    retval = p.wait()
    logging.info("Query Complete, Result = %d" % retval)
    # BUG FIX: previously hard-coded `return 0, ...`, so callers checking
    # `retval != 0` could never detect a failed query. Propagate the real status.
    return retval, output_csv_file
def gather_analytic_crash_stats(fw_version, error_code, error_code_name, use_events):
    """Produce a per-source-line crash report for one crash code.

    Downloads the ELF for each known hardware model, runs the appropriate TD
    query, then symbolicates each crash link register with
    arm-none-eabi-addr2line and tallies crash counts per source line.

    Returns a human-readable report string, or "" if the query failed.
    """
    elf_dict = dict()
    symbol_name_to_hw_model_lookup = {
        "v2_0": [ "102V1" ],
        "v1_5": [ "V3R1", "V3R2", "V3R3" ],
        "ev2_4": [ "V2R2" ],
        "snowy_evt2": [ "snowy20" ],
        "snowy_dvt": [ "snowy21", "snowy22", "snowy23" ],
        "snowy_s3": ["smiles10", "smiles11", "smiles12", "smiles13"],
        "spalding_evt" : [ "spauld10", "spauld11", "spauld12" ],
        "spalding" : [ "spauld13" ],
    }
    # Download the .elf associated with the core dump.
    # FIX: iterate the dict directly instead of the Python-2-only iterkeys().
    for elf_name in symbol_name_to_hw_model_lookup:
        try:
            elf_dict[elf_name] = download_elf_by_sw_hw_version(fw_version, elf_name)
        except requests.exceptions.HTTPError as http_error:
            logging.debug("Could not find ELF file: %s (%s)" % (fw_version, http_error))
    if use_events:
        retval, res_file = run_td_query_on_event_analytics(fw_version, error_code)
    else:
        retval, res_file = run_td_query_on_hourly_analytics(fw_version, error_code)
    if retval != 0:
        return ""
    line_dict = dict()
    # FIX: use a context manager so the CSV file handle is always closed.
    with open(res_file) as csv_file:
        reader = csv.reader(csv_file)
        next(reader, None)  # skip the CSV header row
        for line in reader:
            if len(line) < 3:
                continue
            # it looks like the LR need to be in hex for arm-none-eabi-addr2line to work
            try:
                lr = hex(int(line[0]))
            except ValueError:
                continue  # Analytic is empty for some reason
            hw_rev = line[1]
            found = False
            fw_symbols_name = None
            # FIX: .items() instead of the Python-2-only iteritems().
            for elf_name, hw_model_list in symbol_name_to_hw_model_lookup.items():
                for hw_model in hw_model_list:
                    if hw_rev.lower() == hw_model.lower():
                        # FIX: narrow the bare except to the KeyError raised
                        # when the ELF download above failed for this model.
                        try:
                            fw_symbols_name = elf_dict[elf_name]
                            found = True
                        except KeyError:
                            logging.debug("No dict for elf %s" % elf_name)
                        break
            if not found:
                # FIX: print() call form works on both Python 2 and 3.
                print("Unhandled HW Version %s" % hw_rev)
                continue
            cmd = 'arm-none-eabi-addr2line --exe=%s %s' % (fw_symbols_name, str(lr))
            p = subprocess.Popen(cmd, shell=True, stdout=subprocess.PIPE, stderr=subprocess.STDOUT)
            result = p.stdout.readlines()
            retval = p.wait()
            if retval == 0 and len(result) >= 1:
                line_info = result[0].strip("\n")
                logging.debug("%s %s" % (lr, line_info))
                # Try to pretty print the path but if its not something in our build directory
                # just print the whole path
                idx = line_info.find('build/..')
                if (idx != -1):
                    line_info = line_info[idx:]
                if line_info in line_dict:
                    line_dict[line_info] += int(line[2])
                else:
                    line_dict[line_info] = int(line[2])
    line_dict_sorted = OrderedDict(sorted(line_dict.items(), key=lambda x: x[1], reverse=True))
    result_text = "Results for %s:\n" % error_code_name
    asserts_analyzed = 0
    for k, v in line_dict_sorted.items():
        asserts_analyzed += v
        result_text += '%6d: %s\n' % (v, k)
    result_text += "%d %s analyzed\n" % (asserts_analyzed, error_code_name)
    return result_text
def analyze_analytics(fw_version, use_events):
if use_events:
ASSERT_CRASH_CODE = 0x11
HARDFAULT_CRASH_CODE = 0x13
else:
ASSERT_CRASH_CODE = 0xDEAD0011
HARDFAULT_CRASH_CODE = 0xDEAD0013
result = "=======\n"
result = gather_analytic_crash_stats(fw_version, ASSERT_CRASH_CODE, "Asserts", use_events)
result += "\n"
result += gather_analytic_crash_stats(fw_version, HARDFAULT_CRASH_CODE, "Hard Faults", use_events)
print result
if __name__ == '__main__':
    # Command-line entry point: symbolicate field crashes for one firmware tag.
    arg_parser = argparse.ArgumentParser()
    arg_parser.add_argument('fw_tag', type=str, help="Analyzes "
                            "crashes seen in the field by line for the specified "
                            "build, for example v2.9-beta6")
    arg_parser.add_argument('--debug', action='store_true',
                            help="Turn on debug logging")
    arg_parser.add_argument('--use_event', action='store_true', help="Look at crash information "
                            "using event analytics instead of the default hourly analytics")
    args = arg_parser.parse_args()

    load_user_settings()

    # Debug flag raises verbosity from the default INFO level.
    logging.basicConfig(level=logging.DEBUG if args.debug else logging.INFO)
    logging.info("Analyzing crash stats for %s" % args.fw_tag)

    if args.fw_tag:
        analyze_analytics(args.fw_tag, args.use_event)