Uploaded image for project: 'JGroups'
  1. JGroups
  2. JGRP-1343

JGroups 2.6.2 hangs during JChannel.connect

XMLWordPrintable

    • Icon: Quality Risk Quality Risk
    • Resolution: Won't Do
    • Icon: Major Major
    • None
    • 2.6.2
    • None

      In a two-node cluster (A and B) where A is already up and running, B sometimes hangs in JChannel.connect when it is started for the first time.
      If we bring down A, B resumes and connects. The issue occurs intermittently but frequently.
      Please let us know if we have missed something or if you need more information.
      The JGroups configuration used is:
      <config>
      <!-- Protocol stack configuration quoted from the report. The XML itself is
           reproduced unchanged; the comments are reviewer notes only. -->
      <!-- NOTE(review): in the UDP element below, the fallback written into mcast_addr
           is 224.0.0.0, and mcast_port contains the literal text "$JGroup_port", which
           looks like a template placeholder that was never substituted. Confirm the
           address and port that are actually in effect on nodes A and B. -->
      <!-- NOTE(review): oob_thread_pool.queue_enabled is "false" while
           oob_thread_pool.queue_max_size is still set to "100"; presumably the size is
           ignored when the queue is disabled (to be confirmed). -->
      <UDP
      mcast_addr="${jgroups.udp.mcast_addr:224.0.0.0}"
      mcast_port="${jgroups.udp.mcast_port:$JGroup_port}"
      tos="8"
      ucast_recv_buf_size="20000000"
      ucast_send_buf_size="640000"
      mcast_recv_buf_size="25000000"
      mcast_send_buf_size="640000"
      loopback="false"
      discard_incompatible_packets="true"
      max_bundle_size="64000"
      max_bundle_timeout="30"
      use_incoming_packet_handler="true"
      ip_ttl="${jgroups.udp.ip_ttl:2}"
      enable_bundling="true"
      enable_diagnostics="true"
      thread_naming_pattern="cl"

      use_concurrent_stack="true"

      thread_pool.enabled="true"
      thread_pool.min_threads="2"
      thread_pool.max_threads="8"
      thread_pool.keep_alive_time="5000"
      thread_pool.queue_enabled="true"
      thread_pool.queue_max_size="1000"
      thread_pool.rejection_policy="Run"

      oob_thread_pool.enabled="true"
      oob_thread_pool.min_threads="1"
      oob_thread_pool.max_threads="8"
      oob_thread_pool.keep_alive_time="5000"
      oob_thread_pool.queue_enabled="false"
      oob_thread_pool.queue_max_size="100"
      oob_thread_pool.rejection_policy="Run"/>

      <PING timeout="2000"
      num_initial_members="3"/>
      <MERGE2 max_interval="30000"
      min_interval="10000"/>
      <!-- NOTE(review): FD below is configured with shun="true", whereas pbcast.GMS
           further down has shun="false". Confirm that this difference is intended. -->
      <FD_SOCK/>
      <FD timeout="10000" max_tries="5" shun="true"/>
      <VERIFY_SUSPECT timeout="1500" />
      <BARRIER />
      <pbcast.NAKACK use_stats_for_retransmission="false"
      exponential_backoff="150"
      use_mcast_xmit="true" gc_lag="0"
      retransmit_timeout="50,300,600,1200"
      discard_delivered_msgs="true"/>
      <UNICAST timeout="300,600,1200"/>
      <pbcast.STABLE stability_delay="1000" desired_avg_gossip="50000"
      max_bytes="1000000"/>
      <VIEW_SYNC avg_send_interval="60000" />
      <pbcast.GMS print_local_addr="true" join_timeout="5000"
      shun="false"
      view_bundling="true"/>
      <FC max_credits="500000"
      min_threshold="0.20"/>
      <FRAG2 frag_size="60000" />
      <!-- STREAMING_STATE_TRANSFER is the active state-transfer element; the
           STATE_TRANSFER alternative on the following line is commented out. -->
      <pbcast.STREAMING_STATE_TRANSFER />
      <!-- <pbcast.STATE_TRANSFER />-->
      <!-- NOTE(review): FLUSH is configured with timeout="0". Whether 0 means
           "wait without limit" should be checked against the JGroups 2.6 FLUSH
           documentation, since the report describes connect() blocking until
           node A is stopped. -->
      <pbcast.FLUSH timeout="0"/>
      </config>

            rhn-engineering-bban Bela Ban
            sandeep.th_jira Sandeep T H (Inactive)
            Votes:
            0 Vote for this issue
            Watchers:
            2 Start watching this issue

              Created:
              Updated:
              Resolved: