Uploaded image for project: 'Couchbase Server'
  1. Couchbase Server
  2. MB-33536

Data mismatch when we kill the eventing consumer or Erlang with N1QL op and timers

    XMLWordPrintable

Details

    • Bug
    • Resolution: Fixed
    • Major
    • 6.5.0
    • 6.5.0
    • eventing
    • None
    • Untriaged
    • Unknown

    Description

      Build: 6.5.0-2715

      Test: Failure on onDelete

       ./testrunner -i /tmp/testexec.1749.ini -p get-cbcollect-info=True,GROUP=recovery -t eventing.eventing_recovery.EventingRecovery.test_killing_eventing_consumer_when_eventing_is_processing_mutations,nodes_init=4,services_init=kv-eventing-index-n1ql,dataset=default,groups=simple,reset_services=True,skip_cleanup=True,doc-per-day=2,handler_code=n1ql_op_with_timers,GROUP=recovery
       
      Exception: Bucket operations from handler code took lot of time to complete or didn't go through. Current : 4032 Expected : 0  dcp_backlog : 0  TIMERS_IN_PAST : 0 lcb_exceptions : {'172.23.97.67': {}}

      [2019-03-23 13:23:37,258] - [eventing_base:233] INFO - Stats for Node 172.23.97.67 is 
      [
          {
              "dcp_feed_boundary": "everything", 
              "event_processing_stats": {
                  "adhoc_timer_response_received": 274, 
                  "agg_messages_sent_to_worker": 9571, 
                  "agg_queue_memory": 0, 
                  "agg_queue_memory_cap": 53477376, 
                  "agg_queue_size": 0, 
                  "agg_queue_size_cap": 300000, 
                  "agg_timer_feedback_queue_cap": 1500, 
                  "agg_timer_feedback_queue_size": 0, 
                  "dcp_deletion": 4032, 
                  "dcp_deletion_sent_to_worker": 4032, 
                  "dcp_snapshot": 998, 
                  "dcp_stream_req_counter": 1024, 
                  "dcp_streamreq": 1024, 
                  "execution_stats": 900, 
                  "failure_stats": 900, 
                  "latency_stats": 900, 
                  "lcb_exception_stats": 900, 
                  "log_level": 3, 
                  "thr_count": 3, 
                  "thr_map": 3, 
                  "timer_responses_received": 4032, 
                  "v8_init": 3, 
                  "v8_load": 3, 
                  "worker_spawn_counter": 6
              }, 
              "events_remaining": {
                  "dcp_backlog": 0
              }, 
              "execution_stats": {
                  "agg_queue_memory": 0, 
                  "agg_queue_size": 0, 
                  "dcp_delete_msg_counter": 4032, 
                  "dcp_mutation_msg_counter": 0, 
                  "enqueued_dcp_delete_msg_counter": 4032, 
                  "enqueued_dcp_mutation_msg_counter": 0, 
                  "enqueued_timer_msg_counter": 0, 
                  "feedback_queue_size": 0, 
                  "lcb_retry_failure": 0, 
                  "messages_parsed": 9559, 
                  "on_delete_failure": 0, 
                  "on_delete_success": 4032, 
                  "on_update_failure": 0, 
                  "on_update_success": 0, 
                  "timer_create_failure": 0, 
                  "timer_msg_counter": 0, 
                  "timer_responses_sent": 4032, 
                  "timestamp": {
                      "24583": "2019-03-23T20:23:34Z", 
                      "24584": "2019-03-23T20:23:34Z", 
                      "24593": "2019-03-23T20:23:34Z"
                  }, 
                  "uv_try_write_failure_counter": 0
              }, 
              "failure_stats": {
                  "app_worker_setting_events_lost": 0, 
                  "bucket_op_exception_count": 0, 
                  "checkpoint_failure_count": 0, 
                  "dcp_events_lost": 0, 
                  "debugger_events_lost": 0, 
                  "delete_events_lost": 0, 
                  "mutation_events_lost": 0, 
                  "n1ql_op_exception_count": 0, 
                  "timeout_count": 0, 
                  "timer_callback_missing_counter": 0, 
                  "timer_context_size_exceeded_counter": 0, 
                  "timer_events_lost": 0, 
                  "timestamp": {
                      "24583": "2019-03-23T20:23:34Z", 
                      "24584": "2019-03-23T20:23:34Z", 
                      "24593": "2019-03-23T20:23:34Z"
                  }, 
                  "v8worker_events_lost": 0
              }, 
              "function_id": 3034789801, 
              "function_name": "Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations", 
              "gocb_creds_request_counter": 22, 
              "internal_vb_distribution_stats": {
                  "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_0": "[0-341]", 
                  "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_1": "[342-682]", 
                  "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_2": "[683-1023]"
              }, 
              "latency_percentile_stats": {
                  "100": 1800, 
                  "50": 100, 
                  "80": 100, 
                  "90": 100, 
                  "95": 200, 
                  "99": 400
              }, 
              "lcb_creds_request_counter": 36, 
              "lcb_exception_stats": {}, 
              "metastore_stats": {
                  "kvpool_incr": 16128, 
                  "kvpool_insert": 1024, 
                  "kvpool_lookup": 192751, 
                  "kvpool_remove": 14524, 
                  "kvpool_replace": 70152, 
                  "kvpool_upsert": 32256, 
                  "meta_alarm_missing": 0, 
                  "meta_cancel": 0, 
                  "meta_cancel_alarm_missing": 0, 
                  "meta_cancel_context_missing": 0, 
                  "meta_cancel_success": 0, 
                  "meta_context_missing": 0, 
                  "meta_del": 0, 
                  "meta_del_success": 0, 
                  "meta_external_span_change": 0, 
                  "meta_scan_column": 39623, 
                  "meta_scan_column_lookup": 0, 
                  "meta_scan_due": 39623, 
                  "meta_scan_row": 39623, 
                  "meta_scan_row_lookup": 43136, 
                  "meta_set": 4032, 
                  "meta_set_success": 4032, 
                  "meta_span_cas_mismatch": 0, 
                  "meta_span_start_change": 0, 
                  "meta_span_stop_change": 0, 
                  "meta_sync_span": 32510, 
                  "meta_timer_in_future_fired": 0, 
                  "meta_timer_in_past": 0, 
                  "metastore_delete_err": 0, 
                  "metastore_deletes": 0, 
                  "metastore_not_found": 0, 
                  "metastore_scan": 0, 
                  "metastore_scan_due": 39623, 
                  "metastore_scan_err": 0, 
                  "metastore_set": 4032, 
                  "metastore_set_err": 0
              }, 
              "planner_stats": [
                  {
                      "host_name": "172.23.97.67:8096", 
                      "start_vb": 0, 
                      "vb_count": 1024
                  }
              ], 
              "vb_distribution_stats_from_metadata": {
                  "172.23.97.67:8096": {
                      "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_0": "[0-341]", 
                      "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_1": "[342-682]", 
                      "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_2": "[683-1023]"
                  }
              }, 
              "worker_pids": {
                  "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_0": 24593, 
                  "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_1": 24584, 
                  "worker_Function_359590882_test_killing_eventing_consumer_when_eventing_is_processing_mutations_2": 24583
              }
          }
      ] 

       ./testrunner -i /tmp/testexec.1749.ini -p get-cbcollect-info=True,GROUP=recovery -t eventing.eventing_recovery.EventingRecovery.test_killing_erlang_when_eventing_is_processing_mutations,nodes_init=4,services_init=kv-eventing-index-n1ql,dataset=default,groups=simple,reset_services=True,skip_cleanup=True,doc-per-day=2,handler_code=n1ql_op_with_timers,GROUP=recovery
       
      Exception: Bucket operations from handler code took lot of time to complete or didn't go through. Current : 2 Expected : 0  dcp_backlog : 0  TIMERS_IN_PAST : 0 lcb_exceptions : {'172.23.97.67': {u'0': 2}}

      ./testrunner -i /tmp/testexec.1749.ini -p get-cbcollect-info=True,GROUP=recovery -t eventing.eventing_recovery.EventingRecovery.test_time_drift_between_kv_eventing,nodes_init=4,services_init=kv-eventing-index-n1ql,dataset=default,groups=simple,reset_services=True,skip_cleanup=True,doc-per-day=2,handler_code=n1ql_op_with_timers,GROUP=recovery
       
      Exception: Bucket operations from handler code took lot of time to complete or didn't go through. Current : 4032 Expected : 0  dcp_backlog : 0  TIMERS_IN_PAST : 0 lcb_exceptions : {'172.23.97.67': {}} 

      ./testrunner -i /tmp/testexec.1749.ini -p get-cbcollect-info=True,GROUP=recovery -t eventing.eventing_recovery.EventingRecovery.test_eventing_n1ql_in_different_time_zone,nodes_init=4,services_init=kv-eventing-index-n1ql,dataset=default,groups=simple,reset_services=True,skip_cleanup=True,doc-per-day=2,handler_code=n1ql_op_with_timers,GROUP=recovery 

      Attachments

        1. test_22.zip
          45.42 MB
        2. test_25.zip
          55.67 MB
        3. test_28.zip
          64.14 MB

        Issue Links

          No reviews matched the request. Check your Options in the drop-down menu of this section's header.

          Activity

            People

              vikas.chaudhary Vikas Chaudhary
              vikas.chaudhary Vikas Chaudhary
              Votes:
              0 Vote for this issue
              Watchers:
              2 Start watching this issue

              Dates

                Created:
                Updated:
                Resolved:

                Gerrit Reviews

                  There are no open Gerrit changes

                  PagerDuty