jjzjj

c - C 中的多线程 TCP 服务器崩溃

coder 2023-09-19 原文

我用 C 编写了一个多线程 TCP 服务器。当我针对它运行多个测试客户端时它崩溃了。我遇到了 2 种类型的崩溃,它们似乎都有相同的根本原因。附加的崩溃发生在 main 中。在另一种情况下,当它想要锁定以关闭套接字时,我在客户端部分崩溃了。 有人可以告诉我崩溃的原因吗?

TCP 服务器代码:

#include <stdio.h>
#include <stdint.h>
#include <stdlib.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <unistd.h>
#include <arpa/inet.h> //inet_addr
#include <pthread.h> //for threading , link with lpthread

#define BUFSIZE     2048 // TODO
#define MAXWORKERS 10

pthread_mutex_t mtx = PTHREAD_MUTEX_INITIALIZER;
const pthread_cond_t condInit = PTHREAD_COND_INITIALIZER;
pthread_cond_t idle = PTHREAD_COND_INITIALIZER;

typedef struct {
    pthread_t       tid;
    int             sd;
    pthread_cond_t  cond;
    uint8_t         num;
    uint8_t         state;
} worker_t;

worker_t     workers[MAXWORKERS]; //  reference to worker

void error(const char *msg)
{
    perror(msg);
    exit(1);
}

/* worker thread */
void *handle_client(void *arg)
{
    worker_t* worker = (worker_t *) arg;
    int n;
    char buf[BUFSIZE];

    /* By default a new thread is joinable, we don't
     really want this (unless we do something special we
     end up with the thread equivalent of zombies). So
     we explicitly change the thread type to detached
     */

    pthread_detach(pthread_self());

    printf("Thread %ld started for client number %d (sd %d)\n", pthread_self(),
            worker->num, worker->sd);

    /* worker thread */
    while (1)
    {
        /* wait for work to do */
        while (worker->state == 0)
        {
            pthread_cond_wait(&worker->cond, &mtx);
        }
        int sd = worker->sd; /* get the updated socket fd */
        pthread_mutex_unlock(&mtx);

         n = read(sd, buf, BUFSIZE);
         if (n < 0)
             error("ERROR reading from socket");

         n = write(sd, "I got your message",18);
         if (n < 0)
             error("ERROR writing to socket");

        /* work done - set itself idle assumes that read returned EOF */
        pthread_mutex_lock(&mtx);
        close(sd);
        worker->state = 0;
        printf("Worker %d has completed work \n", worker->num);
        pthread_cond_signal(&idle); /* notifies dispatcher*/
        pthread_mutex_unlock(&mtx);
    } /* end while */

}

int main() { /* Dispatcher */
    int ld, sd;
    struct sockaddr_in skaddr;
    struct sockaddr_in from;
    int addrlen, length;
    int i;

    if ((ld = socket( AF_INET, SOCK_STREAM, 0)) < 0) {
        perror("Problem creating socket\n");
        exit(1);
    }

    skaddr.sin_family = AF_INET;
    skaddr.sin_addr.s_addr = htonl(INADDR_ANY);

    //skaddr.sin_port = htons(0);
    skaddr.sin_port = htons(41332);

    if (bind(ld, (struct sockaddr *) &skaddr, sizeof(skaddr)) < 0) {
        perror("Problem binding\n");
        exit(0);
    }

    /* find out what port we were assigned and print it out */

    length = sizeof(skaddr);
    if (getsockname(ld, (struct sockaddr *) &skaddr, &length) < 0) {
        perror("Error getsockname\n");
        exit(1);
    }
    in_port_t pport = ntohs(skaddr.sin_port);
    printf("%d\n", pport);

    /* put the socket into passive mode (waiting for connections) */

    if (listen(ld, 5) < 0) {
        perror("Error calling listen\n");
        exit(1);
    }

    /* do some initialization */

    for (i = 0; i < MAXWORKERS; i++) {
        workers[i].state    = 0;
        workers[i].num      = i;
        workers[i].sd       = 0;
        workers[i].cond     = condInit;
        pthread_create(&workers[i].tid, NULL, handle_client, (void *) &workers[i]);
    }

    /* Dispatcher now processes incoming connections forever ... */
    while (1) {
        printf("Ready for a connection...\n");
        addrlen = sizeof(skaddr);

        printf("trying to accept a new connection\n");
        if ((sd = accept(ld, (struct sockaddr*) &from, &addrlen)) < 0) {
            perror("Problem with accept call\n");
            exit(1);
        }
        printf("Got a connection - processing...\n");
        for (i = 0; i < MAXWORKERS; i++) {
            pthread_mutex_lock(&mtx);
            if (workers[i].state == 0) /* worker i is idle – dispatch him to work */
            {
                printf("dispatch to worker number: %d \n", i);
                pthread_mutex_unlock(&mtx);
                break;
            }
            printf("worker number: %d was busy\n", i);

            pthread_mutex_unlock(&mtx);
        }

        if (i == MAXWORKERS) {
            /* all workers busy */
            pthread_mutex_lock(&mtx);
            pthread_cond_wait(&idle, &mtx); /* wait for one idle; */
            pthread_mutex_unlock(&mtx);
        } else { /* dispatch worker */
            pthread_mutex_lock(&mtx);
            workers[i].state = 1;
            workers[i].sd = sd;
            pthread_cond_signal(&workers[i].cond); /* wake up worker */
            pthread_mutex_unlock(&mtx);
        }
    }
}

崩溃:

Thread 11 (Thread 0x7fae90004700 (LWP 16318)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x602408 <workers+648>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae90004700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 10 (Thread 0x7fae90805700 (LWP 16317)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x6023c0 <workers+576>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae90805700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 9 (Thread 0x7fae9400c700 (LWP 16310)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x6021c8 <workers+72>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae9400c700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 8 (Thread 0x7fae91006700 (LWP 16316)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x602378 <workers+504>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae91006700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 7 (Thread 0x7fae91807700 (LWP 16315)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x602330 <workers+432>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae91807700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 6 (Thread 0x7fae9300a700 (LWP 16312)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x602258 <workers+216>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae9300a700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 5 (Thread 0x7fae92008700 (LWP 16314)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x6022e8 <workers+360>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae92008700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 4 (Thread 0x7fae92809700 (LWP 16313)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x6022a0 <workers+288>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae92809700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 3 (Thread 0x7fae9380b700 (LWP 16311)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x602210 <workers+144>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae9380b700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 2 (Thread 0x7fae9480d700 (LWP 16309)):
#0  pthread_cond_wait@@GLIBC_2.3.2 () at ../sysdeps/unix/sysv/linux/x86_64/pthread_cond_wait.S:185
#1  0x0000000000401024 in handle_client (arg=0x602180 <workers>) at main.c:87
#2  0x00007fae94bdf6ba in start_thread (arg=0x7fae9480d700) at pthread_create.c:333
#3  0x00007fae949153dd in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:109

Thread 1 (Thread 0x7fae94ff3700 (LWP 16308)):
#0  0x00007fae94843428 in __GI_raise (sig=sig@entry=6) at ../sysdeps/unix/sysv/linux/raise.c:54
---Type <return> to continue, or q <return> to quit---
#1  0x00007fae9484502a in __GI_abort () at abort.c:89
#2  0x00007fae9483bbd7 in __assert_fail_base (fmt=<optimized out>, assertion=assertion@entry=0x7fae94beb015 "mutex->__data.__owner == 0", file=file@entry=0x7fae94beaff8 "../nptl/pthread_mutex_lock.c", line=line@entry=81, 
    function=function@entry=0x7fae94beb180 <__PRETTY_FUNCTION__.8623> "__pthread_mutex_lock") at assert.c:92
#3  0x00007fae9483bc82 in __GI___assert_fail (assertion=assertion@entry=0x7fae94beb015 "mutex->__data.__owner == 0", file=file@entry=0x7fae94beaff8 "../nptl/pthread_mutex_lock.c", line=line@entry=81, 
    function=function@entry=0x7fae94beb180 <__PRETTY_FUNCTION__.8623> "__pthread_mutex_lock") at assert.c:101
#4  0x00007fae94be1f68 in __GI___pthread_mutex_lock (mutex=mutex@entry=0x602140 <mtx>) at ../nptl/pthread_mutex_lock.c:81
#5  0x0000000000400cfa in main () at main.c:173

最佳答案

在您的工作线程中,首先发生的事情是没有首先锁定互斥量的 pthread_cond_wait 或没有首先锁定互斥量的 pthread_mutex_unlock。在这两种情况下,根据 POSIX 文档,这是未定义的行为。

你的 worker 函数应该这样开始:

    /* worker thread */
while (1)
{
    /* wait for work to do */
    pthread_mutex_lock(&mtx);
    while (worker->state == 0)
    {
        pthread_cond_wait(&worker->cond, &mtx);
    }
    int sd = worker->sd; /* get the updated socket fd */
    pthread_mutex_unlock(&mtx);

关于c - C 中的多线程 TCP 服务器崩溃,我们在Stack Overflow上找到一个类似的问题: https://stackoverflow.com/questions/45034981/

有关c - C 中的多线程 TCP 服务器崩溃的更多相关文章

  1. ruby - 如何从 ruby​​ 中的字符串运行任意对象方法? - 2

    总的来说,我对ruby​​还比较陌生,我正在为我正在创建的对象编写一些rspec测试用例。许多测试用例都非常基础,我只是想确保正确填充和返回值。我想知道是否有办法使用循环结构来执行此操作。不必为我要测试的每个方法都设置一个assertEquals。例如:describeitem,"TestingtheItem"doit"willhaveanullvaluetostart"doitem=Item.new#HereIcoulddotheitem.name.shouldbe_nil#thenIcoulddoitem.category.shouldbe_nilendend但我想要一些方法来使用

  2. ruby - 其他文件中的 Rake 任务 - 2

    我试图在一个项目中使用rake,如果我把所有东西都放到Rakefile中,它会很大并且很难读取/找到东西,所以我试着将每个命名空间放在lib/rake中它自己的文件中,我添加了这个到我的rake文件的顶部:Dir['#{File.dirname(__FILE__)}/lib/rake/*.rake'].map{|f|requiref}它加载文件没问题,但没有任务。我现在只有一个.rake文件作为测试,名为“servers.rake”,它看起来像这样:namespace:serverdotask:testdoputs"test"endend所以当我运行rakeserver:testid时

  3. ruby-on-rails - Ruby net/ldap 模块中的内存泄漏 - 2

    作为我的Rails应用程序的一部分,我编写了一个小导入程序,它从我们的LDAP系统中吸取数据并将其塞入一个用户表中。不幸的是,与LDAP相关的代码在遍历我们的32K用户时泄漏了大量内存,我一直无法弄清楚如何解决这个问题。这个问题似乎在某种程度上与LDAP库有关,因为当我删除对LDAP内容的调用时,内存使用情况会很好地稳定下来。此外,不断增加的对象是Net::BER::BerIdentifiedString和Net::BER::BerIdentifiedArray,它们都是LDAP库的一部分。当我运行导入时,内存使用量最终达到超过1GB的峰值。如果问题存在,我需要找到一些方法来更正我的代

  4. ruby - 使用 ruby​​ 和 savon 的 SOAP 服务 - 2

    我正在尝试使用ruby​​和Savon来使用网络服务。测试服务为http://www.webservicex.net/WS/WSDetails.aspx?WSID=9&CATID=2require'rubygems'require'savon'client=Savon::Client.new"http://www.webservicex.net/stockquote.asmx?WSDL"client.get_quotedo|soap|soap.body={:symbol=>"AAPL"}end返回SOAP异常。检查soap信封,在我看来soap请求没有正确的命名空间。任何人都可以建议我

  5. ruby-on-rails - Rails 3 中的多个路由文件 - 2

    Rails2.3可以选择随时使用RouteSet#add_configuration_file添加更多路由。是否可以在Rails3项目中做同样的事情? 最佳答案 在config/application.rb中:config.paths.config.routes在Rails3.2(也可能是Rails3.1)中,使用:config.paths["config/routes"] 关于ruby-on-rails-Rails3中的多个路由文件,我们在StackOverflow上找到一个类似的问题

  6. ruby - 具有身份验证的私有(private) Ruby Gem 服务器 - 2

    我想安装一个带有一些身份验证的私有(private)Rubygem服务器。我希望能够使用公共(public)Ubuntu服务器托管内部gem。我读到了http://docs.rubygems.org/read/chapter/18.但是那个没有身份验证-如我所见。然后我读到了https://github.com/cwninja/geminabox.但是当我使用基本身份验证(他们在他们的Wiki中有)时,它会提示从我的服务器获取源。所以。如何制作带有身份验证的私有(private)Rubygem服务器?这是不可能的吗?谢谢。编辑:Geminabox问题。我尝试“捆绑”以安装新的gem..

  7. ruby-on-rails - Rails - 一个 View 中的多个模型 - 2

    我需要从一个View访问多个模型。以前,我的links_controller仅用于提供以不同方式排序的链接资源。现在我想包括一个部分(我假设)显示按分数排序的顶级用户(@users=User.all.sort_by(&:score))我知道我可以将此代码插入每个链接操作并从View访问它,但这似乎不是“ruby方式”,我将需要在不久的将来访问更多模型。这可能会变得很脏,是否有针对这种情况的任何技术?注意事项:我认为我的应用程序正朝着单一格式和动态页面内容的方向发展,本质上是一个典型的网络应用程序。我知道before_filter但考虑到我希望应用程序进入的方向,这似乎很麻烦。最终从任何

  8. ruby - 检查 "command"的输出应该包含 NilClass 的意外崩溃 - 2

    为了将Cucumber用于命令行脚本,我按照提供的说明安装了arubagem。它在我的Gemfile中,我可以验证是否安装了正确的版本并且我已经包含了require'aruba/cucumber'在'features/env.rb'中为了确保它能正常工作,我写了以下场景:@announceScenario:Testingcucumber/arubaGivenablankslateThentheoutputfrom"ls-la"shouldcontain"drw"假设事情应该失败。它确实失败了,但失败的原因是错误的:@announceScenario:Testingcucumber/ar

  9. ruby-on-rails - Rails 3.2.1 中 ActionMailer 中的未定义方法 'default_content_type=' - 2

    我在我的项目中添加了一个系统来重置用户密码并通过电子邮件将密码发送给他,以防他忘记密码。昨天它运行良好(当我实现它时)。当我今天尝试启动服务器时,出现以下错误。=>BootingWEBrick=>Rails3.2.1applicationstartingindevelopmentonhttp://0.0.0.0:3000=>Callwith-dtodetach=>Ctrl-CtoshutdownserverExiting/Users/vinayshenoy/.rvm/gems/ruby-1.9.3-p0/gems/actionmailer-3.2.1/lib/action_mailer

  10. ruby-on-rails - Rails 应用程序中的 Rails : How are you using application_controller. rb 是新手吗? - 2

    刚入门rails,开始慢慢理解。有人可以解释或给我一些关于在application_controller中编码的好处或时间和原因的想法吗?有哪些用例。您如何为Rails应用程序使用应用程序Controller?我不想在那里放太多代码,因为据我了解,每个请求都会调用此Controller。这是真的? 最佳答案 ApplicationController实际上是您应用程序中的每个其他Controller都将从中继承的类(尽管这不是强制性的)。我同意不要用太多代码弄乱它并保持干净整洁的态度,尽管在某些情况下ApplicationContr

随机推荐