字符串中单词的比较？

如何解决字符串中单词的比较？

是否有一个函数可以用来比较单词的位置无关紧要的字符串？我的意思是“Aaron Jack Brussels”与“Brussels Aaron Jack”等相同。

解决方法

没有标准函数可以做任何接近您目标的事情。您需要编写特定的代码。您可以遍历一个字符串并搜索另一个字符串中的每个单词，反之亦然。

这是一个不修改字符串也不分配任何内存的简单实现：

#include <stdio.h>
#include <string.h>

int countword(const char *w,size_t len,const char *str) {
    size_t i;
    int count = 0;

    for (;;) {
        while (*str == ' ')
            str++;
        if (!*str)
            return count;
        for (i = 1; str[i] && str[i] != ' '; i++)
            continue;
        if (i == len && !memcmp(w,str,len))
            count++;
        str += i;
    }
}

int samewords(const char *s1,const char *s2) {
    const char *p0,*p;

    for (p = s1;;) {
        while (*p == ' ')
            p++;
        if (!*p)
            return 1;
        for (p0 = p++; *p && *p != ' '; p++)
            continue;
        if (countword(p0,p - p0,s1) != countword(p0,s2))
            return 0;
    }
}

int main() {
    if (samewords("Aaron  Jack  Brussels","Brussels Aaron Jack"))
        printf("OK\n");
    if (samewords("Aaron  Jack  Brussels","AaronJackBrussels"))
        printf("Not OK\n");
    if (samewords("Aaron Jack","Aaron Jack Jack"))
        printf("Not OK\n");
    if (samewords("Aaron Jack Brussels","Aaron Jack"))
        printf("Not OK\n");
    if (samewords("John John Doe","John Doe Doe"))
        printf("Not OK\n");    return 0;
}

您可以使用 strspn() 中的 strcspn() 和 <string.h> 将其扩展为处理多个分隔符，例如空格、制表符和换行符：

int countword(const char *w,const char *str) {
    const char *separators = " \t\r\n";
    size_t i;
    int count = 0;

    for (;;) {
        str += strspn(str,separators);
        if (!*str)
            return count;
        i = strcspn(str,separators);
        if (i == len && !memcmp(w,const char *s2) {
    const char *separators = " \t\r\n";
    const char *p0,*p;

    for (p = s1;;) {
        p += strspn(p,separators);
        if (!*p)
            return 1;
        p += strcspn(p0 = p,separators);
        if (countword(p0,s2))
            return 0;
    }
}

注意：我用更通用的版本更新了答案，该版本可以处理重复的单词，例如 "John John Doe" "John Doe Doe"，以前的版本会错误地将其视为等效。

您真正要做的是创建两组（数学上的）字符串，并尝试比较这些组。不幸的是，未排序的数组（如字符串）不利于这种比较。在 github 上寻找实现集合的 C 库可能是一个更好的起点（我认为 https://github.com/barrust/set 会满足您的需求）。

如果你真的需要一个简单的实现，这应该可以工作并避免分配或字符串修改：

from django.db import models
from django.contrib.auth.models import User
# Create your models here.

class Category(models.Model):
    name = models.CharField(max_length=100)

    def __str__(self):
        return self.name

    class Meta:
        verbose_name = 'Category'
        verbose_name_plural = 'Categories'


class Book(models.Model):
    name = models.CharField(max_length=200)
    description = models.TextField()
    image = models.ImageField()
    price = models.IntegerField()
    category = models.ForeignKey(Category,on_delete=models.SET_NULL,null=True)

    def __str__(self):
        return self.name

class OrderItem(models.Model):
    order_id = models.CharField(max_length=10)
    user = models.ForeignKey(User,null=True)
    book = models.ForeignKey(Book,null=True)

    def __str__(self):
        return self.user.username

class CartItem(models.Model):
    user = models.ForeignKey(User,null=True)

    def __str__(self):
        return self.user.username

不是直接的，但是您可以使用 strtok()（或其更有用的可重入表亲 strtok_r()）的组合通过“”分隔符分割您的字符串，并使用 strcmp() 来比较每个substring 针对所有其他子字符串。

我的例子非常粗糙（它假设两个字符串集中的子字符串数量相同，并且只检查一个集合与另一个集合），但应该有助于让您走上正确的轨道。

#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <stdbool.h>

int main() {
  char stringA[] = "Aaron Jack Brussels";
  char stringB[] = "Brussels Aaron Jack";                                                           
  int numSubStrings = 3;

  char **stringSetA,**stringSetB;
  char *saveStrA,*saveStrB;

  stringSetA = malloc(numSubStrings*sizeof(*stringSetA));
  stringSetB = malloc(numSubStrings*sizeof(*stringSetB));

  // extract first token of each to initialize strtok
  stringSetA[0] = strtok_r(stringA," ",&saveStrA);
  stringSetB[0] = strtok_r(stringB,&saveStrB);

  // loop through the string to extract all other tokens                                            
  for (int i = 1; i < numSubStrings; ++i) {
    stringSetA[i] = strtok_r(NULL,&saveStrA);
    stringSetB[i] = strtok_r(NULL,&saveStrB);
  }

  for (int i = 0; i < numSubStrings; ++i) {
    bool found = false;
    for (int j = 0; j < numSubStrings; ++j) {
      // strcmp == 0 if both strings are equal                                                      
      if (!strcmp(stringSetA[i],stringSetB[j])) {
        found = true;
        break;
      }
    }
    if (!found) printf("Both sets of strings aren't equal!\n");
    else printf("Found %s!\n",stringSetA[i]);
  }
  return 0;
}

字符串中单词的比较？

如何解决字符串中单词的比较？

解决方法

相关推荐