mysql56/pfs__digest_8cc_source.html

/* Copyright (c) 2008, 2013, Oracle and/or its affiliates. All rights reserved.


  This program is free software; you can redistribute it and/or modify

  it under the terms of the GNU General Public License as published by

  the Free Software Foundation; version 2 of the License.


  This program is distributed in the hope that it will be useful,

  but WITHOUT ANY WARRANTY; without even the implied warranty of

  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  GNU General Public License for more details.


  You should have received a copy of the GNU General Public License

  along with this program; if not, write to the Free Software Foundation,

  51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA */


/*

  This code needs extra visibility in the lexer structures

*/


#include "my_global.h"

#include "my_sys.h"

#include "pfs_instr.h"

#include "pfs_digest.h"

#include "pfs_global.h"

#include "table_helper.h"

#include "my_md5.h"

#include "sql_lex.h"

#include "sql_get_diagnostics.h"

#include "sql_string.h"

#include <string.h>


/* Generated code */

#include "../sql/sql_yacc.h"

#include "../storage/perfschema/pfs_lex_token.h"


/* Name pollution from sql/sql_lex.h */

#ifdef LEX_YYSTYPE

#undef LEX_YYSTYPE

#endif


#define LEX_YYSTYPE YYSTYPE


ulong digest_max= 0;

ulong digest_lost= 0;


PFS_statements_digest_stat *statements_digest_stat_array= NULL;

bool flag_statements_digest= true;

volatile uint32 digest_index= 1;


LF_HASH digest_hash;

static bool digest_hash_inited= false;


int init_digest(const PFS_global_param *param)

{

  unsigned int index;


  /*

    Allocate memory for statements_digest_stat_array based on

    performance_schema_digests_size values

  */

  digest_max= param->m_digest_sizing;

  digest_lost= 0;


  if (digest_max == 0)

    return 0;


  statements_digest_stat_array=

    PFS_MALLOC_ARRAY(digest_max, PFS_statements_digest_stat,

                     MYF(MY_ZEROFILL));

  if (unlikely(statements_digest_stat_array == NULL))

    return 1;


  for (index= 0; index < digest_max; index++)

  {

    statements_digest_stat_array[index].reset_data();

  }


  return 0;

}


void cleanup_digest(void)

{

  /*  Free memory allocated to statements_digest_stat_array. */

  pfs_free(statements_digest_stat_array);

  statements_digest_stat_array= NULL;

}


C_MODE_START

static uchar *digest_hash_get_key(const uchar *entry, size_t *length,

                                  my_bool)

{

  const PFS_statements_digest_stat * const *typed_entry;

  const PFS_statements_digest_stat *digest;

  const void *result;

  typed_entry= reinterpret_cast<const PFS_statements_digest_stat*const*>(entry);

  DBUG_ASSERT(typed_entry != NULL);

  digest= *typed_entry;

  DBUG_ASSERT(digest != NULL);

  *length= sizeof (PFS_digest_key);

  result= & digest->m_digest_key;

  return const_cast<uchar*> (reinterpret_cast<const uchar*> (result));

}

C_MODE_END


int init_digest_hash(void)

{

  if ((! digest_hash_inited) && (digest_max > 0))

  {

    lf_hash_init(&digest_hash, sizeof(PFS_statements_digest_stat*),

                 LF_HASH_UNIQUE, 0, 0, digest_hash_get_key,

                 &my_charset_bin);

    digest_hash.size= digest_max;

    digest_hash_inited= true;

  }

  return 0;

}


void cleanup_digest_hash(void)

{

  if (digest_hash_inited)

  {

    lf_hash_destroy(&digest_hash);

    digest_hash_inited= false;

  }

}


static LF_PINS* get_digest_hash_pins(PFS_thread *thread)

{

  if (unlikely(thread->m_digest_hash_pins == NULL))

  {

    if (!digest_hash_inited)

      return NULL;

    thread->m_digest_hash_pins= lf_hash_get_pins(&digest_hash);

  }

  return thread->m_digest_hash_pins;

}


PFS_statement_stat*

find_or_create_digest(PFS_thread *thread,

                      PSI_digest_storage *digest_storage,

                      const char *schema_name,

                      uint schema_name_length)

{

  if (statements_digest_stat_array == NULL)

    return NULL;


  if (digest_storage->m_byte_count <= 0)

    return NULL;


  LF_PINS *pins= get_digest_hash_pins(thread);

  if (unlikely(pins == NULL))

    return NULL;


  /*

    Note: the LF_HASH key is a block of memory,

    make sure to clean unused bytes,

    so that memcmp() can compare keys.

  */

  PFS_digest_key hash_key;

  memset(& hash_key, 0, sizeof(hash_key));

  /* Compute MD5 Hash of the tokens received. */

  compute_md5_hash((char *) hash_key.m_md5,

                   (char *) digest_storage->m_token_array,

                   digest_storage->m_byte_count);

  /* Add the current schema to the key */

  hash_key.m_schema_name_length= schema_name_length;

  if (schema_name_length > 0)

    memcpy(hash_key.m_schema_name, schema_name, schema_name_length);


  int res;

  ulong safe_index;

  uint retry_count= 0;

  const uint retry_max= 3;

  PFS_statements_digest_stat **entry;

  PFS_statements_digest_stat *pfs= NULL;


  ulonglong now= my_micro_time();


search:


  /* Lookup LF_HASH using this new key. */

  entry= reinterpret_cast<PFS_statements_digest_stat**>

    (lf_hash_search(&digest_hash, pins,

                    &hash_key, sizeof(PFS_digest_key)));


  if (entry && (entry != MY_ERRPTR))

  {

    /* If digest already exists, update stats and return. */

    pfs= *entry;

    pfs->m_last_seen= now;

    lf_hash_search_unpin(pins);

    return & pfs->m_stat;

  }


  lf_hash_search_unpin(pins);


  /* Dirty read of digest_index */

  if (digest_index == 0)

  {

    /*  digest_stat array is full. Add stat at index 0 and return. */

    pfs= &statements_digest_stat_array[0];


    if (pfs->m_first_seen == 0)

      pfs->m_first_seen= now;

    pfs->m_last_seen= now;

    return & pfs->m_stat;

  }


  safe_index= PFS_atomic::add_u32(& digest_index, 1);

  if (safe_index >= digest_max)

  {

    /* The digest array is now full. */

    digest_index= 0;

    pfs= &statements_digest_stat_array[0];


    if (pfs->m_first_seen == 0)

      pfs->m_first_seen= now;

    pfs->m_last_seen= now;

    return & pfs->m_stat;

  }


  /* Add a new record in digest stat array. */

  pfs= &statements_digest_stat_array[safe_index];


  /* Copy digest hash/LF Hash search key. */

  memcpy(& pfs->m_digest_key, &hash_key, sizeof(PFS_digest_key));


  /*

    Copy digest storage to statement_digest_stat_array so that it could be

    used later to generate digest text.

  */

  digest_copy(& pfs->m_digest_storage, digest_storage);


  pfs->m_first_seen= now;

  pfs->m_last_seen= now;


  res= lf_hash_insert(&digest_hash, pins, &pfs);

  if (likely(res == 0))

  {

    return & pfs->m_stat;

  }


  if (res > 0)

  {

    /* Duplicate insert by another thread */

    if (++retry_count > retry_max)

    {

      /* Avoid infinite loops */

      digest_lost++;

      return NULL;

    }

    goto search;

  }


  /* OOM in lf_hash_insert */

  digest_lost++;

  return NULL;

}


void purge_digest(PFS_thread* thread, PFS_digest_key *hash_key)

{

  LF_PINS *pins= get_digest_hash_pins(thread);

  if (unlikely(pins == NULL))

    return;


  PFS_statements_digest_stat **entry;


  /* Lookup LF_HASH using this new key. */

  entry= reinterpret_cast<PFS_statements_digest_stat**>

    (lf_hash_search(&digest_hash, pins,

                    hash_key, sizeof(PFS_digest_key)));


  if (entry && (entry != MY_ERRPTR))

  {

    lf_hash_delete(&digest_hash, pins,

                   hash_key, sizeof(PFS_digest_key));

  }

  lf_hash_search_unpin(pins);

  return;

}


void PFS_statements_digest_stat::reset_data()

{

  digest_reset(& m_digest_storage);

  m_stat.reset();

  m_first_seen= 0;

  m_last_seen= 0;

}


void PFS_statements_digest_stat::reset_index(PFS_thread *thread)

{

  /* Only remove entries that exists in the HASH index. */

  if (m_digest_storage.m_byte_count > 0)

  {

    purge_digest(thread, & m_digest_key);

  }

}


void reset_esms_by_digest()

{

  uint index;


  if (statements_digest_stat_array == NULL)

    return;


  PFS_thread *thread= PFS_thread::get_current_thread();

  if (unlikely(thread == NULL))

    return;


  /* Reset statements_digest_stat_array. */

  for (index= 0; index < digest_max; index++)

  {

    statements_digest_stat_array[index].reset_index(thread);

    statements_digest_stat_array[index].reset_data();

  }


  /*

    Reset index which indicates where the next calculated digest information

    to be inserted in statements_digest_stat_array.

  */

  digest_index= 1;

}


/*

  Iterate token array and updates digest_text.

*/

void get_digest_text(char* digest_text, PSI_digest_storage* digest_storage)

{

  DBUG_ASSERT(digest_storage != NULL);

  bool truncated= false;

  int byte_count= digest_storage->m_byte_count;

  char *digest_output= digest_text;

  int bytes_needed= 0;

  uint tok= 0;

  int current_byte= 0;

  lex_token_string *tok_data;

  /* -4 is to make sure extra space for '...' and a '\0' at the end. */

  int bytes_available= COL_DIGEST_TEXT_SIZE - 4;


  if (byte_count <= 0 || byte_count > PSI_MAX_DIGEST_STORAGE_SIZE)

  {

    *digest_text= '\0';

    return;

  }


  /* Convert text to utf8 */

  const CHARSET_INFO *from_cs= get_charset(digest_storage->m_charset_number, MYF(0));

  const CHARSET_INFO *to_cs= &my_charset_utf8_bin;


  if (from_cs == NULL)

  {

    /*

      Can happen, as we do dirty reads on digest_storage,

      which can be written to in another thread.

    */

    *digest_text= '\0';

    return;

  }


  /*

     Max converted size is number of characters * max multibyte length of the

     target charset, which is 4 for UTF8.

   */

  const uint max_converted_size= PSI_MAX_DIGEST_STORAGE_SIZE * 4;

  char id_buffer[max_converted_size];

  char *id_string;

  int  id_length;

  bool convert_text= !my_charset_same(from_cs, to_cs);


  DBUG_ASSERT(byte_count <= PSI_MAX_DIGEST_STORAGE_SIZE);


  while ((current_byte < byte_count) &&

         (bytes_available > 0) &&

         !truncated)

  {

    current_byte= read_token(digest_storage, current_byte, &tok);


    if (tok <= 0 || tok >= array_elements(lex_token_array))

    {

      *digest_text='\0';

      return;

    }


    tok_data= &lex_token_array[tok];


    switch (tok)

    {

    /* All identifiers are printed with their name. */

    case IDENT:

    case IDENT_QUOTED:

      {

        char *id_ptr;

        int id_len;

        uint err_cs= 0;


        /* Get the next identifier from the storage buffer. */

        current_byte= read_identifier(digest_storage, current_byte,

                                      &id_ptr, &id_len);

        if (convert_text)

        {

          /* Verify that the converted text will fit. */

          if (to_cs->mbmaxlen*id_len > max_converted_size)

          {

            truncated= true;

            break;

          }

          /* Convert identifier string into the storage character set. */

          id_length= my_convert(id_buffer, max_converted_size, to_cs,

                                id_ptr, id_len, from_cs, &err_cs);

          id_string= id_buffer;

        }

        else

        {

          id_string= id_ptr;

          id_length= id_len;

        }


        if (id_length == 0 || err_cs != 0)

        {

          truncated= true;

          break;

        }

        /* Copy the converted identifier into the digest string. */

        bytes_needed= id_length + (tok == IDENT ? 1 : 3);

        if (bytes_needed <= bytes_available)

        {

          if (tok == IDENT_QUOTED)

            *digest_output++= '`';

          if (id_length > 0)

          {

            memcpy(digest_output, id_string, id_length);

            digest_output+= id_length;

          }

          if (tok == IDENT_QUOTED)

            *digest_output++= '`';

          *digest_output++= ' ';

          bytes_available-= bytes_needed;

        }

        else

        {

          truncated= true;

        }

      }

      break;


    /* Everything else is printed as is. */

    default:

      /*

        Make sure not to overflow digest_text buffer.

        +1 is to make sure extra space for ' '.

      */

      int tok_length= tok_data->m_token_length;

      bytes_needed= tok_length + 1;


      if (bytes_needed <= bytes_available)

      {

        strncpy(digest_output, tok_data->m_token_string, tok_length);

        digest_output+= tok_length;

        *digest_output++= ' ';

        bytes_available-= bytes_needed;

      }

      else

      {

        truncated= true;

      }

      break;

    }

  }


  /* Truncate digest text in case of long queries. */

  if (digest_storage->m_full || truncated)

  {

    strcpy(digest_output, "...");

    digest_output+= 3;

  }


  *digest_output= '\0';

}


static inline uint peek_token(const PSI_digest_storage *digest, int index)

{

  uint token;

  DBUG_ASSERT(index >= 0);

  DBUG_ASSERT(index + PFS_SIZE_OF_A_TOKEN <= digest->m_byte_count);

  DBUG_ASSERT(digest->m_byte_count <=  PSI_MAX_DIGEST_STORAGE_SIZE);


  token= ((digest->m_token_array[index + 1])<<8) | digest->m_token_array[index];

  return token;

}


static inline void peek_last_two_tokens(const PSI_digest_storage* digest_storage,

                                        int last_id_index, uint *t1, uint *t2)

{

  int byte_count= digest_storage->m_byte_count;

  int peek_index= byte_count - PFS_SIZE_OF_A_TOKEN;


  if (last_id_index <= peek_index)

  {

    /* Take last token. */

    *t1= peek_token(digest_storage, peek_index);


    peek_index-= PFS_SIZE_OF_A_TOKEN;

    if (last_id_index <= peek_index)

    {

      /* Take 2nd token from last. */

      *t2= peek_token(digest_storage, peek_index);

    }

    else

    {

      *t2= TOK_PFS_UNUSED;

    }

  }

  else

  {

    *t1= TOK_PFS_UNUSED;

    *t2= TOK_PFS_UNUSED;

  }

}


struct PSI_digest_locker* pfs_digest_start_v1(PSI_statement_locker *locker)

{

  PSI_statement_locker_state *statement_state;

  statement_state= reinterpret_cast<PSI_statement_locker_state*> (locker);

  DBUG_ASSERT(statement_state != NULL);


  if (statement_state->m_discarded)

    return NULL;


  if (statement_state->m_flags & STATE_FLAG_DIGEST)

  {

    PSI_digest_locker_state *digest_state;

    digest_state= &statement_state->m_digest_state;

    return reinterpret_cast<PSI_digest_locker*> (digest_state);

  }


  return NULL;

}


PSI_digest_locker* pfs_digest_add_token_v1(PSI_digest_locker *locker,

                                           uint token,

                                           OPAQUE_LEX_YYSTYPE *yylval)

{

  PSI_digest_locker_state *state= NULL;

  PSI_digest_storage      *digest_storage= NULL;


  state= reinterpret_cast<PSI_digest_locker_state*> (locker);

  DBUG_ASSERT(state != NULL);


  digest_storage= &state->m_digest_storage;


  /*

    Stop collecting further tokens if digest storage is full or

    if END token is received.

  */

  if (digest_storage->m_full || token == END_OF_INPUT)

    return NULL;


  /*

    Take last_token 2 tokens collected till now. These tokens will be used

    in reduce for normalisation. Make sure not to consider ID tokens in reduce.

  */

  uint last_token;

  uint last_token2;


  switch (token)

  {

    case BIN_NUM:

    case DECIMAL_NUM:

    case FLOAT_NUM:

    case HEX_NUM:

    case LEX_HOSTNAME:

    case LONG_NUM:

    case NUM:

    case TEXT_STRING:

    case NCHAR_STRING:

    case ULONGLONG_NUM:

    {

      /*

        REDUCE:

        TOK_PFS_GENERIC_VALUE := BIN_NUM | DECIMAL_NUM | ... | ULONGLONG_NUM

      */

      token= TOK_PFS_GENERIC_VALUE;

    }

    /* fall through */

    case NULL_SYM:

    {

      peek_last_two_tokens(digest_storage, state->m_last_id_index,

                           &last_token, &last_token2);


      if ((last_token2 == TOK_PFS_GENERIC_VALUE ||

           last_token2 == TOK_PFS_GENERIC_VALUE_LIST ||

           last_token2 == NULL_SYM) &&

          (last_token == ','))

      {

        /*

          REDUCE:

          TOK_PFS_GENERIC_VALUE_LIST :=

            (TOK_PFS_GENERIC_VALUE|NULL_SYM) ',' (TOK_PFS_GENERIC_VALUE|NULL_SYM)


          REDUCE:

          TOK_PFS_GENERIC_VALUE_LIST :=

            TOK_PFS_GENERIC_VALUE_LIST ',' (TOK_PFS_GENERIC_VALUE|NULL_SYM)

        */

        digest_storage->m_byte_count-= 2*PFS_SIZE_OF_A_TOKEN;

        token= TOK_PFS_GENERIC_VALUE_LIST;

      }

      /*

        Add this token or the resulting reduce to digest storage.

      */

      store_token(digest_storage, token);

      break;

    }

    case ')':

    {

      peek_last_two_tokens(digest_storage, state->m_last_id_index,

                           &last_token, &last_token2);


      if (last_token == TOK_PFS_GENERIC_VALUE &&

          last_token2 == '(')

      {

        /*

          REDUCE:

          TOK_PFS_ROW_SINGLE_VALUE :=

            '(' TOK_PFS_GENERIC_VALUE ')'

        */

        digest_storage->m_byte_count-= 2*PFS_SIZE_OF_A_TOKEN;

        token= TOK_PFS_ROW_SINGLE_VALUE;


        /* Read last two tokens again */

        peek_last_two_tokens(digest_storage, state->m_last_id_index,

                             &last_token, &last_token2);


        if ((last_token2 == TOK_PFS_ROW_SINGLE_VALUE ||

             last_token2 == TOK_PFS_ROW_SINGLE_VALUE_LIST) &&

            (last_token == ','))

        {

          /*

            REDUCE:

            TOK_PFS_ROW_SINGLE_VALUE_LIST :=

              TOK_PFS_ROW_SINGLE_VALUE ',' TOK_PFS_ROW_SINGLE_VALUE


            REDUCE:

            TOK_PFS_ROW_SINGLE_VALUE_LIST :=

              TOK_PFS_ROW_SINGLE_VALUE_LIST ',' TOK_PFS_ROW_SINGLE_VALUE

          */

          digest_storage->m_byte_count-= 2*PFS_SIZE_OF_A_TOKEN;

          token= TOK_PFS_ROW_SINGLE_VALUE_LIST;

        }

      }

      else if (last_token == TOK_PFS_GENERIC_VALUE_LIST &&

               last_token2 == '(')

      {

        /*

          REDUCE:

          TOK_PFS_ROW_MULTIPLE_VALUE :=

            '(' TOK_PFS_GENERIC_VALUE_LIST ')'

        */

        digest_storage->m_byte_count-= 2*PFS_SIZE_OF_A_TOKEN;

        token= TOK_PFS_ROW_MULTIPLE_VALUE;


        /* Read last two tokens again */

        peek_last_two_tokens(digest_storage, state->m_last_id_index,

                             &last_token, &last_token2);


        if ((last_token2 == TOK_PFS_ROW_MULTIPLE_VALUE ||

             last_token2 == TOK_PFS_ROW_MULTIPLE_VALUE_LIST) &&

            (last_token == ','))

        {

          /*

            REDUCE:

            TOK_PFS_ROW_MULTIPLE_VALUE_LIST :=

              TOK_PFS_ROW_MULTIPLE_VALUE ',' TOK_PFS_ROW_MULTIPLE_VALUE


            REDUCE:

            TOK_PFS_ROW_MULTIPLE_VALUE_LIST :=

              TOK_PFS_ROW_MULTIPLE_VALUE_LIST ',' TOK_PFS_ROW_MULTIPLE_VALUE

          */

          digest_storage->m_byte_count-= 2*PFS_SIZE_OF_A_TOKEN;

          token= TOK_PFS_ROW_MULTIPLE_VALUE_LIST;

        }

      }

      /*

        Add this token or the resulting reduce to digest storage.

      */

      store_token(digest_storage, token);

      break;

    }

    case IDENT:

    case IDENT_QUOTED:

    {

      LEX_YYSTYPE *lex_token= (LEX_YYSTYPE*) yylval;

      char *yytext= lex_token->lex_str.str;

      int yylen= lex_token->lex_str.length;


      /* Add this token and identifier string to digest storage. */

      store_token_identifier(digest_storage, token, yylen, yytext);


      /* Update the index of last identifier found. */

      state->m_last_id_index= digest_storage->m_byte_count;

      break;

    }

    default:

    {

      /* Add this token to digest storage. */

      store_token(digest_storage, token);

      break;

    }

  }


  return locker;

}