You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
			
				
					293 lines
				
				12 KiB
			
		
		
			
		
	
	
					293 lines
				
				12 KiB
			| 
											6 years ago
										 | '\" t
 | ||
|  | .\"     Title: ztrie
 | ||
|  | .\"    Author: [see the "AUTHORS" section]
 | ||
|  | .\" Generator: DocBook XSL Stylesheets v1.76.1 <http://docbook.sf.net/>
 | ||
|  | .\"      Date: 12/31/2016
 | ||
|  | .\"    Manual: CZMQ Manual
 | ||
|  | .\"    Source: CZMQ 4.0.2
 | ||
|  | .\"  Language: English
 | ||
|  | .\"
 | ||
|  | .TH "ZTRIE" "3" "12/31/2016" "CZMQ 4\&.0\&.2" "CZMQ Manual"
 | ||
|  | .\" -----------------------------------------------------------------
 | ||
|  | .\" * Define some portability stuff
 | ||
|  | .\" -----------------------------------------------------------------
 | ||
|  | .\" ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 | ||
|  | .\" http://bugs.debian.org/507673
 | ||
|  | .\" http://lists.gnu.org/archive/html/groff/2009-02/msg00013.html
 | ||
|  | .\" ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 | ||
|  | .ie \n(.g .ds Aq \(aq
 | ||
|  | .el       .ds Aq '
 | ||
|  | .\" -----------------------------------------------------------------
 | ||
|  | .\" * set default formatting
 | ||
|  | .\" -----------------------------------------------------------------
 | ||
|  | .\" disable hyphenation
 | ||
|  | .nh
 | ||
|  | .\" disable justification (adjust text to left margin only)
 | ||
|  | .ad l
 | ||
|  | .\" -----------------------------------------------------------------
 | ||
|  | .\" * MAIN CONTENT STARTS HERE *
 | ||
|  | .\" -----------------------------------------------------------------
 | ||
|  | .SH "NAME"
 | ||
|  | ztrie \- simple trie for tokenizable strings
 | ||
|  | .SH "SYNOPSIS"
 | ||
|  | .sp
 | ||
|  | .nf
 | ||
|  | //  This is a draft class, and may change without notice\&. It is disabled in
 | ||
|  | //  stable builds by default\&. If you use this in applications, please ask
 | ||
|  | //  for it to be pushed to stable state\&. Use \-\-enable\-drafts to enable\&.
 | ||
|  | #ifdef CZMQ_BUILD_DRAFT_API
 | ||
|  | // Callback function for ztrie_node to destroy node data\&.
 | ||
|  | typedef void (ztrie_destroy_data_fn) (
 | ||
|  |     void **data);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Creates a new ztrie\&.
 | ||
|  | CZMQ_EXPORT ztrie_t *
 | ||
|  |     ztrie_new (char delimiter);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Destroy the ztrie\&.
 | ||
|  | CZMQ_EXPORT void
 | ||
|  |     ztrie_destroy (ztrie_t **self_p);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Inserts a new route into the tree and attaches the data\&. Returns \-1
 | ||
|  | //  if the route already exists, otherwise 0\&. This method takes ownership of
 | ||
|  | //  the provided data if a destroy_data_fn is provided\&.
 | ||
|  | CZMQ_EXPORT int
 | ||
|  |     ztrie_insert_route (ztrie_t *self, const char *path, void *data, ztrie_destroy_data_fn destroy_data_fn);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Removes a route from the trie and destroys its data\&. Returns \-1 if the
 | ||
|  | //  route does not exist, otherwise 0\&.
 | ||
|  | //  the start of the list call zlist_first ()\&. Advances the cursor\&.
 | ||
|  | CZMQ_EXPORT int
 | ||
|  |     ztrie_remove_route (ztrie_t *self, const char *path);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Returns true if the path matches a route in the tree, otherwise false\&.
 | ||
|  | CZMQ_EXPORT bool
 | ||
|  |     ztrie_matches (ztrie_t *self, const char *path);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Returns the data of a matched route from last ztrie_matches\&. If the path
 | ||
|  | //  did not match, returns NULL\&. Do not delete the data as it\*(Aqs owned by
 | ||
|  | //  ztrie\&.
 | ||
|  | CZMQ_EXPORT void *
 | ||
|  |     ztrie_hit_data (ztrie_t *self);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Returns the count of parameters that a matched route has\&.
 | ||
|  | CZMQ_EXPORT size_t
 | ||
|  |     ztrie_hit_parameter_count (ztrie_t *self);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Returns the parameters of a matched route with named regexes from last
 | ||
|  | //  ztrie_matches\&. If the path did not match or the route did not contain any
 | ||
|  | //  named regexes, returns NULL\&.
 | ||
|  | CZMQ_EXPORT zhashx_t *
 | ||
|  |     ztrie_hit_parameters (ztrie_t *self);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Returns the asterisk matched part of a route, if there has been no match
 | ||
|  | //  or no asterisk match, returns NULL\&.
 | ||
|  | CZMQ_EXPORT const char *
 | ||
|  |     ztrie_hit_asterisk_match (ztrie_t *self);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Print the trie
 | ||
|  | CZMQ_EXPORT void
 | ||
|  |     ztrie_print (ztrie_t *self);
 | ||
|  | 
 | ||
|  | //  *** Draft method, for development use, may change without warning ***
 | ||
|  | //  Self test of this class\&.
 | ||
|  | CZMQ_EXPORT void
 | ||
|  |     ztrie_test (bool verbose);
 | ||
|  | 
 | ||
|  | #endif // CZMQ_BUILD_DRAFT_API
 | ||
|  | Please add \*(Aq@interface\*(Aq section in \*(Aq\&./\&.\&./src/ztrie\&.c\*(Aq\&.
 | ||
|  | .fi
 | ||
|  | .SH "DESCRIPTION"
 | ||
|  | .sp
 | ||
|  | This is a variant of a trie or prefix tree where all the descendants of a node have a common prefix of the string associated with that node\&. This implementation is specialized for strings that can be tokenized by a delimiter like a URL, URI or URN\&. Routes in the tree can be matched by regular expressions and by using capturing groups parts of a matched route can be easily obtained\&.
 | ||
|  | .sp
 | ||
|  | Note that the performance for pure string based matching is okay but on short strings zhash and zhashx are 3\-4 times faster\&.
 | ||
|  | .SH "EXAMPLE"
 | ||
|  | .PP
 | ||
|  | \fBFrom ztrie_test method\fR. 
 | ||
|  | .sp
 | ||
|  | .if n \{\
 | ||
|  | .RS 4
 | ||
|  | .\}
 | ||
|  | .nf
 | ||
|  | //  Create a new trie for matching strings that can be tokenized by a slash
 | ||
|  | //  (e\&.g\&. URLs minus the protocol, address and port)\&.
 | ||
|  | ztrie_t *self = ztrie_new (\*(Aq/\*(Aq);
 | ||
|  | assert (self);
 | ||
|  | 
 | ||
|  | int ret = 0;
 | ||
|  | 
 | ||
|  | //  Let\*(Aqs start by inserting a couple of routes into the trie\&.
 | ||
|  | //  This one is for the route \*(Aq/foo/bar\*(Aq the slash at the beginning of the
 | ||
|  | //  route is important because everything before the first delimiter will be
 | ||
|  | //  discarded\&. A slash at the end of a route is optional though\&. The data
 | ||
|  | //  associated with this node is passed without destroy function which means
 | ||
|  | //  it must be destroyed by the caller\&.
 | ||
|  | int foo_bar_data = 10;
 | ||
|  | ret = ztrie_insert_route (self, "/foo/bar", &foo_bar_data, NULL);
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  Now suppose we like to match all routes with two tokens that start with
 | ||
|  | //  \*(Aq/foo/\*(Aq but aren\*(Aqt \*(Aq/foo/bar\*(Aq\&. This is possible by using regular
 | ||
|  | //  expressions which are enclosed in an opening and closing curly bracket\&.
 | ||
|  | //  Tokens that contain regular expressions are always matched after string
 | ||
|  | //  based tokens\&.
 | ||
|  | //  Note: There is no order in which regular expressions are sorted thus
 | ||
|  | //  if you enter multiple expressions for a route you will have to make
 | ||
|  | //  sure they don\*(Aqt have overlapping results\&. For example \*(Aq/foo/{[^/]+}\*(Aq
 | ||
|  | //  and \*(Aq/foo/{\ed+}\*(Aq together could turn out badly\&.
 | ||
|  | int foo_other_data = 100;
 | ||
|  | ret = ztrie_insert_route (self, "/foo/{[^/]+}", &foo_other_data, NULL);
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  Regular expressions are only matched against tokens of the same level\&.
 | ||
|  | //  This allows us to append to a route with a regular expression as if
 | ||
|  | //  it were a string\&.
 | ||
|  | ret = ztrie_insert_route (self, "/foo/{[^/]+}/gulp", NULL, NULL);
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  Routes are identified by their endpoint, which is the last token of the route\&.
 | ||
|  | //  It is possible to insert routes for a node that already exists but isn\*(Aqt an
 | ||
|  | //  endpoint yet\&. The delimiter at the end of a route is optional and has no effect\&.
 | ||
|  | ret = ztrie_insert_route (self, "/foo/", NULL, NULL);
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  If you try to insert a route which already exists the method will return \-1\&.
 | ||
|  | ret = ztrie_insert_route (self, "/foo", NULL, NULL);
 | ||
|  | assert (ret == \-1);
 | ||
|  | 
 | ||
|  | //  It is not allowed to insert routes with empty tokens\&.
 | ||
|  | ret = ztrie_insert_route (self, "//foo", NULL, NULL);
 | ||
|  | assert (ret == \-1);
 | ||
|  | 
 | ||
|  | //  Everything before the first delimiter is ignored so \*(Aqfoo/bar/baz\*(Aq is equivalent
 | ||
|  | //  to \*(Aq/bar/baz\*(Aq\&.
 | ||
|  | ret = ztrie_insert_route (self, "foo/bar/baz", NULL, NULL);
 | ||
|  | assert (ret == 0);
 | ||
|  | ret = ztrie_insert_route (self, "/bar/baz", NULL, NULL);
 | ||
|  | assert (ret == \-1);
 | ||
|  | 
 | ||
|  | //  Of course you are allowed to remove routes, in case there is data associated with a
 | ||
|  | //  route and a destroy data function has been supplied that data will be destroyed\&.
 | ||
|  | ret = ztrie_remove_route (self, "/foo");
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  Removing a non\-existent route will return \-1 as well\&.
 | ||
|  | ret = ztrie_remove_route (self, "/foo");
 | ||
|  | assert (ret == \-1);
 | ||
|  | 
 | ||
|  | //  Removing a route with a regular expression must exactly match the entered one\&.
 | ||
|  | ret = ztrie_remove_route (self, "/foo/{[^/]+}");
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  Next we like to match a path by regular expressions and also extract matched
 | ||
|  | //  parts of a route\&. This can be done by naming the regular expression\&. The name of a
 | ||
|  | //  regular expression is entered at the beginning of the curly brackets and separated
 | ||
|  | //  by a colon from the regular expression\&. The first one in this example is named
 | ||
|  | //  \*(Aqname\*(Aq and names the expression \*(Aq[^/]+\*(Aq\&. If there is no capturing group defined in
 | ||
|  | //  the expression the whole matched string will be associated with this parameter\&. In
 | ||
|  | //  case you don\*(Aqt like to get the whole matched string use a capturing group, like
 | ||
|  | //  it has been done for the \*(Aqid\*(Aq parameter\&. This is nice but you can even match as
 | ||
|  | //  many parameters for a token as you like\&. Therefore simply put the parameter names
 | ||
|  | //  separated by colons in front of the regular expression and make sure to add a
 | ||
|  | //  capturing group for each parameter\&. The first parameter will be associated with
 | ||
|  | //  the first capturing group and so on\&.
 | ||
|  | char *data = (char *) malloc (80);
 | ||
|  | sprintf (data, "%s", "Hello World!");
 | ||
|  | ret = ztrie_insert_route (self, "/baz/{name:[^/]+}/{id:\-\-(\e\ed+)}/{street:nr:(\e\ea+)(\e\ed+)}", data, NULL);
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  There is a lot you can do with regular expression but matching routes
 | ||
|  | //  of arbitrary length won\*(Aqt work\&. Therefore we make use of the asterisk
 | ||
|  | //  operator\&. Just place it at the end of your route, e\&.g\&. \*(Aq/config/bar/*\*(Aq\&.
 | ||
|  | ret = ztrie_insert_route (self, "/config/bar/*", NULL, NULL);
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  Appending to an asterisk as you would do with a regular expression
 | ||
|  | //  isn\*(Aqt valid\&.
 | ||
|  | ret = ztrie_insert_route (self, "/config/bar/*/bar", NULL, NULL);
 | ||
|  | assert (ret == \-1);
 | ||
|  | 
 | ||
|  | //  The asterisk operator will only work as a leaf in the tree\&. If you
 | ||
|  | //  enter an asterisk in the middle of your route it will simply be
 | ||
|  | //  interpreted as a string\&.
 | ||
|  | ret = ztrie_insert_route (self, "/test/*/bar", NULL, NULL);
 | ||
|  | assert (ret == 0);
 | ||
|  | 
 | ||
|  | //  If a parent has an asterisk as child it is not allowed to have
 | ||
|  | //  other siblings\&.
 | ||
|  | ret = ztrie_insert_route (self, "/config/bar/foo/glup", NULL, NULL);
 | ||
|  | assert (ret != 0);
 | ||
|  | 
 | ||
|  | //  Test matches
 | ||
|  | bool hasMatch = false;
 | ||
|  | 
 | ||
|  | //  The route \*(Aq/bar/foo\*(Aq will fail to match as this route has never been inserted\&.
 | ||
|  | hasMatch = ztrie_matches (self, "/bar/foo");
 | ||
|  | assert (!hasMatch);
 | ||
|  | 
 | ||
|  | //  The route \*(Aq/foo/bar\*(Aq will match and we can obtain the data associated with it\&.
 | ||
|  | hasMatch = ztrie_matches (self, "/foo/bar");
 | ||
|  | assert (hasMatch);
 | ||
|  | int foo_bar_hit_data = *((int *) ztrie_hit_data (self));
 | ||
|  | assert (foo_bar_data == foo_bar_hit_data);
 | ||
|  | 
 | ||
|  | //  This route is part of another but is no endpoint itself thus the matches will fail\&.
 | ||
|  | hasMatch = ztrie_matches (self, "/baz/blub");
 | ||
|  | assert (!hasMatch);
 | ||
|  | 
 | ||
|  | //  This route will match our named regular expressions route\&. Thus we can extract data
 | ||
|  | //  from the route by their names\&.
 | ||
|  | hasMatch = ztrie_matches (self, "/baz/blub/\-\-11/abc23");
 | ||
|  | assert (hasMatch);
 | ||
|  | char *match_data = (char *) ztrie_hit_data (self);
 | ||
|  | assert (streq ("Hello World!", match_data));
 | ||
|  | zhashx_t *parameters = ztrie_hit_parameters (self);
 | ||
|  | assert (zhashx_size (parameters) == 4);
 | ||
|  | assert (streq ("blub", (char *) zhashx_lookup (parameters, "name")));
 | ||
|  | assert (streq ("11", (char *) zhashx_lookup (parameters, "id")));
 | ||
|  | assert (streq ("abc", (char *) zhashx_lookup (parameters, "street")));
 | ||
|  | assert (streq ("23", (char *) zhashx_lookup (parameters, "nr")));
 | ||
|  | zhashx_destroy (&parameters);
 | ||
|  | 
 | ||
|  | //  This will match our asterisk route \*(Aq/config/bar/*\*(Aq\&. As the result we
 | ||
|  | //  can obtain the asterisk matched part of the route\&.
 | ||
|  | hasMatch = ztrie_matches (self, "/config/bar/foo/bar");
 | ||
|  | assert (hasMatch);
 | ||
|  | assert (streq (ztrie_hit_asterisk_match (self), "foo/bar"));
 | ||
|  | 
 | ||
|  | zstr_free (&data);
 | ||
|  | ztrie_destroy (&self);
 | ||
|  | .fi
 | ||
|  | .if n \{\
 | ||
|  | .RE
 | ||
|  | .\}
 | ||
|  | .sp
 | ||
|  | .SH "AUTHORS"
 | ||
|  | .sp
 | ||
|  | The czmq manual was written by the authors in the AUTHORS file\&.
 | ||
|  | .SH "RESOURCES"
 | ||
|  | .sp
 | ||
|  | Main web site: \m[blue]\fB\%http://czmq\&.zeromq\&.org\fR\m[]
 | ||
|  | .sp
 | ||
|  | Report bugs to the email <\m[blue]\fBzeromq\-dev@lists\&.zeromq\&.org\fR\m[]\&\s-2\u[1]\d\s+2>
 | ||
|  | .SH "COPYRIGHT"
 | ||
|  | .sp
 | ||
|  | Copyright (c) the Contributors as noted in the AUTHORS file\&. This file is part of CZMQ, the high\-level C binding for 0MQ: http://czmq\&.zeromq\&.org\&. This Source Code Form is subject to the terms of the Mozilla Public License, v\&. 2\&.0\&. If a copy of the MPL was not distributed with this file, You can obtain one at http://mozilla\&.org/MPL/2\&.0/\&. LICENSE included with the czmq distribution\&.
 | ||
|  | .SH "NOTES"
 | ||
|  | .IP " 1." 4
 | ||
|  | zeromq-dev@lists.zeromq.org
 | ||
|  | .RS 4
 | ||
|  | \%mailto:zeromq-dev@lists.zeromq.org
 | ||
|  | .RE
 |