Function: `string-lessp`

string-lessp is a function defined in fns.c.

Signature

(string-lessp STRING1 STRING2)

Documentation

Return non-nil if STRING1 is less than STRING2 in lexicographic order.

Case is significant. Symbols are also allowed; their print names are used instead.

Other relevant functions are documented in the comparison and string groups.

Probably introduced at or before Emacs version 20.4.

Shortdoc

;; string
(string-lessp "abc" "def")
    => t
(string-lessp "pic4.png" "pic32.png")
    => nil
(string-lessp "1.1" "1.2")
    => t
;; comparison
(string-lessp "abc" "abd")
    => t
(string-lessp "abc" "abc")
    => nil
(string-lessp "pic4.png" "pic32.png")
    => nil

Aliases

Source Code

// Defined in /usr/src/emacs/src/fns.c
{
  /* Body of `string-lessp': return Qt when STRING1 sorts before
     STRING2 in lexicographic order, Qnil otherwise.  A symbol
     argument is replaced by its SYMBOL_NAME; any other argument is
     passed through CHECK_STRING.  */
  if (SYMBOLP (string1))
    string1 = SYMBOL_NAME (string1);
  else
    CHECK_STRING (string1);
  if (SYMBOLP (string2))
    string2 = SYMBOL_NAME (string2);
  else
    CHECK_STRING (string2);

  /* Number of characters both strings are guaranteed to have.  */
  ptrdiff_t n = min (SCHARS (string1), SCHARS (string2));

  if ((!STRING_MULTIBYTE (string1) || SCHARS (string1) == SBYTES (string1))
      && (!STRING_MULTIBYTE (string2) || SCHARS (string2) == SBYTES (string2)))
    {
      /* Each argument is either unibyte or all-ASCII multibyte:
	 we can compare bytewise.  */
      int d = memcmp (SSDATA (string1), SSDATA (string2), n);
      /* Equal over the common length: STRING1 is less only when
	 STRING2 has something left, i.e. STRING1 is a proper prefix.  */
      return d < 0 || (d == 0 && n < SCHARS (string2)) ? Qt : Qnil;
    }
  else if (STRING_MULTIBYTE (string1) && STRING_MULTIBYTE (string2))
    {
      /* Two arbitrary multibyte strings: we cannot use memcmp because
	 the encoding for raw bytes would sort those between U+007F and U+0080
	 which isn't where we want them.
	 Instead, we skip the longest common prefix and look at
	 what follows.  */
      ptrdiff_t nb1 = SBYTES (string1);
      ptrdiff_t nb2 = SBYTES (string2);
      ptrdiff_t nb = min (nb1, nb2);
      ptrdiff_t b = 0;

      /* String data is normally allocated with word alignment, but
	 there are exceptions (notably pure strings) so we restrict the
	 wordwise skipping to safe architectures.  */
      if (HAVE_FAST_UNALIGNED_ACCESS)
	{
	  /* First compare entire machine words.  The chunks are
	     compared with memcmp instead of being read through a
	     `size_t *' cast: dereferencing such a pointer is undefined
	     behavior in C when the data is unaligned or is not a size_t
	     object, even where the hardware tolerates it.  A memcmp of
	     a constant word size expresses the same comparison.  */
	  int ws = sizeof (size_t);
	  const char *p1 = SSDATA (string1);
	  const char *p2 = SSDATA (string2);
	  while (b < nb - ws + 1 && memcmp (p1 + b, p2 + b, ws) == 0)
	    b += ws;
	}

      /* Scan forward to the differing byte.  */
      while (b < nb && SREF (string1, b) == SREF (string2, b))
	b++;

      if (b >= nb)
	/* One string is a prefix of the other.  */
	return b < nb2 ? Qt : Qnil;

      /* Now back up to the start of the differing characters:
	 it's the last byte not having the bit pattern 10xxxxxx.  */
      while ((SREF (string1, b) & 0xc0) == 0x80)
	b--;

      /* Compare the differing characters.  Both fetches start at byte
	 offset B; the character indices I1 and I2 are scratch values
	 that are not used afterwards.  */
      ptrdiff_t i1 = 0, i2 = 0;
      ptrdiff_t i1_byte = b, i2_byte = b;
      int c1 = fetch_string_char_advance_no_check (string1, &i1, &i1_byte);
      int c2 = fetch_string_char_advance_no_check (string2, &i2, &i2_byte);
      return c1 < c2 ? Qt : Qnil;
    }
  else if (STRING_MULTIBYTE (string1))
    {
      /* string1 multibyte, string2 unibyte: fetch one character from
	 STRING1 and one byte from STRING2 per step, and stop at the
	 first pair that differs.  */
      ptrdiff_t i1 = 0, i1_byte = 0, i2 = 0;
      while (i1 < n)
	{
	  int c1 = fetch_string_char_advance_no_check (string1, &i1, &i1_byte);
	  int c2 = SREF (string2, i2++);
	  if (c1 != c2)
	    return c1 < c2 ? Qt : Qnil;
	}
      /* The first N characters agree; STRING1 is less only if STRING2
	 is longer.  */
      return i1 < SCHARS (string2) ? Qt : Qnil;
    }
  else
    {
      /* string1 unibyte, string2 multibyte: mirror image of the
	 previous case.  */
      ptrdiff_t i1 = 0, i2 = 0, i2_byte = 0;
      while (i1 < n)
	{
	  int c1 = SREF (string1, i1++);
	  int c2 = fetch_string_char_advance_no_check (string2, &i2, &i2_byte);
	  if (c1 != c2)
	    return c1 < c2 ? Qt : Qnil;
	}
      /* The first N characters agree; STRING1 is less only if STRING2
	 is longer.  */
      return i1 < SCHARS (string2) ? Qt : Qnil;
    }
}