static void Testj2269() { UErrorCode status = U_ZERO_ERROR; UChar a[4] = { 0x61, 0x62, 0x63, 0 }; USet *s = uset_open(1, 0); uset_addString(s, a, 3); a[0] = 0x63; a[1] = 0x63; expect(s, "{abc}", "{ccc}", &status); uset_close(s); }
/** * Basic API test for uset.x */ static void TestAPI() { USet* set; USet* set2; UErrorCode ec; /* [] */ set = uset_openEmpty(); expect(set, "", "abc{ab}", NULL); uset_close(set); set = uset_open(1, 0); expect(set, "", "abc{ab}", NULL); uset_close(set); set = uset_open(1, 1); uset_clear(set); expect(set, "", "abc{ab}", NULL); uset_close(set); /* [ABC] */ set = uset_open(0x0041, 0x0043); expect(set, "ABC", "DEF{ab}", NULL); uset_close(set); /* [a-c{ab}] */ ec = U_ZERO_ERROR; set = uset_openPattern(PAT, PAT_LEN, &ec); if(U_FAILURE(ec)) { log_err("uset_openPattern([a-c{ab}]) failed - %s\n", u_errorName(ec)); return; } if(!uset_resemblesPattern(PAT, PAT_LEN, 0)) { log_err("uset_resemblesPattern of PAT failed\n"); } expect(set, "abc{ab}", "def{bc}", &ec); /* [a-d{ab}] */ uset_add(set, 0x64); expect(set, "abcd{ab}", "ef{bc}", NULL); /* [acd{ab}{bc}] */ uset_remove(set, 0x62); uset_addString(set, STR_bc, STR_bc_LEN); expect(set, "acd{ab}{bc}", "bef{cd}", NULL); /* [acd{bc}] */ uset_removeString(set, STR_ab, STR_ab_LEN); expect(set, "acd{bc}", "bfg{ab}", NULL); /* [^acd{bc}] */ uset_complement(set); expect(set, "bef{bc}", "acd{ac}", NULL); /* [a-e{bc}] */ uset_complement(set); uset_addRange(set, 0x0062, 0x0065); expect(set, "abcde{bc}", "fg{ab}", NULL); /* [de{bc}] */ uset_removeRange(set, 0x0050, 0x0063); expect(set, "de{bc}", "bcfg{ab}", NULL); /* [g-l] */ uset_set(set, 0x0067, 0x006C); expect(set, "ghijkl", "de{bc}", NULL); if (uset_indexOf(set, 0x0067) != 0) { log_err("uset_indexOf failed finding correct index of 'g'\n"); } if (uset_charAt(set, 0) != 0x0067) { log_err("uset_charAt failed finding correct char 'g' at index 0\n"); } /* How to test this one...? */ uset_compact(set); /* [g-i] */ uset_retain(set, 0x0067, 0x0069); expect(set, "ghi", "dejkl{bc}", NULL); /* UCHAR_ASCII_HEX_DIGIT */ uset_applyIntPropertyValue(set, UCHAR_ASCII_HEX_DIGIT, 1, &ec); if(U_FAILURE(ec)) { log_err("uset_applyIntPropertyValue([UCHAR_ASCII_HEX_DIGIT]) failed - %s\n", u_errorName(ec)); return; } expect(set, "0123456789ABCDEFabcdef", "GHIjkl{bc}", NULL); /* [ab] */ uset_clear(set); uset_addAllCodePoints(set, STR_ab, STR_ab_LEN); expect(set, "ab", "def{ab}", NULL); if (uset_containsAllCodePoints(set, STR_bc, STR_bc_LEN)){ log_err("set should not conatin all characters of \"bc\" \n"); } /* [] */ set2 = uset_open(1, 1); uset_clear(set2); /* space */ uset_applyPropertyAlias(set2, PAT_lb, PAT_lb_LEN, VAL_SP, VAL_SP_LEN, &ec); expect(set2, " ", "abcdefghi{bc}", NULL); /* [a-c] */ uset_set(set2, 0x0061, 0x0063); /* [g-i] */ uset_set(set, 0x0067, 0x0069); /* [a-c g-i] */ if (uset_containsSome(set, set2)) { log_err("set should not contain some of set2 yet\n"); } uset_complementAll(set, set2); if (!uset_containsSome(set, set2)) { log_err("set should contain some of set2\n"); } expect(set, "abcghi", "def{bc}", NULL); /* [g-i] */ uset_removeAll(set, set2); expect(set, "ghi", "abcdef{bc}", NULL); /* [a-c g-i] */ uset_addAll(set2, set); expect(set2, "abcghi", "def{bc}", NULL); /* [g-i] */ uset_retainAll(set2, set); expect(set2, "ghi", "abcdef{bc}", NULL); uset_close(set); uset_close(set2); }
static void addSpecial(contContext *context, UChar *buffer, int32_t bufLen, uint32_t CE, int32_t leftIndex, int32_t rightIndex, UErrorCode *status) { const UCollator *coll = context->coll; USet *contractions = context->conts; USet *expansions = context->expansions; UBool addPrefixes = context->addPrefixes; const UChar *UCharOffset = (UChar *)coll->image+getContractOffset(CE); uint32_t newCE = *(coll->contractionCEs + (UCharOffset - coll->contractionIndex)); // we might have a contraction that ends from previous level if(newCE != UCOL_NOT_FOUND) { if(isSpecial(CE) && getCETag(CE) == CONTRACTION_TAG && isSpecial(newCE) && getCETag(newCE) == SPEC_PROC_TAG && addPrefixes) { addSpecial(context, buffer, bufLen, newCE, leftIndex, rightIndex, status); } if(contractions && rightIndex-leftIndex > 1) { uset_addString(contractions, buffer+leftIndex, rightIndex-leftIndex); if(expansions && isSpecial(CE) && getCETag(CE) == EXPANSION_TAG) { uset_addString(expansions, buffer+leftIndex, rightIndex-leftIndex); } } } UCharOffset++; // check whether we're doing contraction or prefix if(getCETag(CE) == SPEC_PROC_TAG && addPrefixes) { if(leftIndex == 0) { *status = U_INTERNAL_PROGRAM_ERROR; return; } --leftIndex; while(*UCharOffset != 0xFFFF) { newCE = *(coll->contractionCEs + (UCharOffset - coll->contractionIndex)); buffer[leftIndex] = *UCharOffset; if(isSpecial(newCE) && (getCETag(newCE) == CONTRACTION_TAG || getCETag(newCE) == SPEC_PROC_TAG)) { addSpecial(context, buffer, bufLen, newCE, leftIndex, rightIndex, status); } else { if(contractions) { uset_addString(contractions, buffer+leftIndex, rightIndex-leftIndex); } if(expansions && isSpecial(newCE) && getCETag(newCE) == EXPANSION_TAG) { uset_addString(expansions, buffer+leftIndex, rightIndex-leftIndex); } } UCharOffset++; } } else if(getCETag(CE) == CONTRACTION_TAG) { if(rightIndex == bufLen-1) { *status = U_INTERNAL_PROGRAM_ERROR; return; } while(*UCharOffset != 0xFFFF) { newCE = *(coll->contractionCEs + (UCharOffset - coll->contractionIndex)); buffer[rightIndex] = *UCharOffset; if(isSpecial(newCE) && (getCETag(newCE) == CONTRACTION_TAG || getCETag(newCE) == SPEC_PROC_TAG)) { addSpecial(context, buffer, bufLen, newCE, leftIndex, rightIndex+1, status); } else { if(contractions) { uset_addString(contractions, buffer+leftIndex, rightIndex+1-leftIndex); } if(expansions && isSpecial(newCE) && getCETag(newCE) == EXPANSION_TAG) { uset_addString(expansions, buffer+leftIndex, rightIndex+1-leftIndex); } } UCharOffset++; } } }