mirror of
https://github.com/rust-lang/book.git
synced 2026-05-19 00:00:04 -04:00
Merge pull request #1297 from rust-lang/2018-edition
Fork the second edition into the 2018 edition
This commit is contained in:
142
2018-edition/Cargo.lock
generated
Normal file
142
2018-edition/Cargo.lock
generated
Normal file
@@ -0,0 +1,142 @@
|
||||
[[package]]
|
||||
name = "aho-corasick"
|
||||
version = "0.5.3"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
dependencies = [
|
||||
"memchr 0.1.11 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "docopt"
|
||||
version = "0.6.86"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
dependencies = [
|
||||
"lazy_static 0.2.10 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"regex 0.1.80 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"rustc-serialize 0.3.24 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"strsim 0.5.2 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "kernel32-sys"
|
||||
version = "0.2.2"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
dependencies = [
|
||||
"winapi 0.2.8 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"winapi-build 0.1.1 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "lazy_static"
|
||||
version = "0.2.10"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
|
||||
[[package]]
|
||||
name = "libc"
|
||||
version = "0.2.33"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
|
||||
[[package]]
|
||||
name = "memchr"
|
||||
version = "0.1.11"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
dependencies = [
|
||||
"libc 0.2.33 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "regex"
|
||||
version = "0.1.80"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
dependencies = [
|
||||
"aho-corasick 0.5.3 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"memchr 0.1.11 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"regex-syntax 0.3.9 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"thread_local 0.2.7 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"utf8-ranges 0.1.3 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "regex-syntax"
|
||||
version = "0.3.9"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
|
||||
[[package]]
|
||||
name = "rust-book"
|
||||
version = "0.0.1"
|
||||
dependencies = [
|
||||
"docopt 0.6.86 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"lazy_static 0.2.10 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"regex 0.1.80 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"rustc-serialize 0.3.24 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"walkdir 0.1.8 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "rustc-serialize"
|
||||
version = "0.3.24"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
|
||||
[[package]]
|
||||
name = "strsim"
|
||||
version = "0.5.2"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
|
||||
[[package]]
|
||||
name = "thread-id"
|
||||
version = "2.0.0"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
dependencies = [
|
||||
"kernel32-sys 0.2.2 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"libc 0.2.33 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "thread_local"
|
||||
version = "0.2.7"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
dependencies = [
|
||||
"thread-id 2.0.0 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "utf8-ranges"
|
||||
version = "0.1.3"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
|
||||
[[package]]
|
||||
name = "walkdir"
|
||||
version = "0.1.8"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
dependencies = [
|
||||
"kernel32-sys 0.2.2 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
"winapi 0.2.8 (registry+https://github.com/rust-lang/crates.io-index)",
|
||||
]
|
||||
|
||||
[[package]]
|
||||
name = "winapi"
|
||||
version = "0.2.8"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
|
||||
[[package]]
|
||||
name = "winapi-build"
|
||||
version = "0.1.1"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
|
||||
[metadata]
|
||||
"checksum aho-corasick 0.5.3 (registry+https://github.com/rust-lang/crates.io-index)" = "ca972c2ea5f742bfce5687b9aef75506a764f61d37f8f649047846a9686ddb66"
|
||||
"checksum docopt 0.6.86 (registry+https://github.com/rust-lang/crates.io-index)" = "4a7ef30445607f6fc8720f0a0a2c7442284b629cf0d049286860fae23e71c4d9"
|
||||
"checksum kernel32-sys 0.2.2 (registry+https://github.com/rust-lang/crates.io-index)" = "7507624b29483431c0ba2d82aece8ca6cdba9382bff4ddd0f7490560c056098d"
|
||||
"checksum lazy_static 0.2.10 (registry+https://github.com/rust-lang/crates.io-index)" = "236eb37a62591d4a41a89b7763d7de3e06ca02d5ab2815446a8bae5d2f8c2d57"
|
||||
"checksum libc 0.2.33 (registry+https://github.com/rust-lang/crates.io-index)" = "5ba3df4dcb460b9dfbd070d41c94c19209620c191b0340b929ce748a2bcd42d2"
|
||||
"checksum memchr 0.1.11 (registry+https://github.com/rust-lang/crates.io-index)" = "d8b629fb514376c675b98c1421e80b151d3817ac42d7c667717d282761418d20"
|
||||
"checksum regex 0.1.80 (registry+https://github.com/rust-lang/crates.io-index)" = "4fd4ace6a8cf7860714a2c2280d6c1f7e6a413486c13298bbc86fd3da019402f"
|
||||
"checksum regex-syntax 0.3.9 (registry+https://github.com/rust-lang/crates.io-index)" = "f9ec002c35e86791825ed294b50008eea9ddfc8def4420124fbc6b08db834957"
|
||||
"checksum rustc-serialize 0.3.24 (registry+https://github.com/rust-lang/crates.io-index)" = "dcf128d1287d2ea9d80910b5f1120d0b8eede3fbf1abe91c40d39ea7d51e6fda"
|
||||
"checksum strsim 0.5.2 (registry+https://github.com/rust-lang/crates.io-index)" = "67f84c44fbb2f91db7fef94554e6b2ac05909c9c0b0bc23bb98d3a1aebfe7f7c"
|
||||
"checksum thread-id 2.0.0 (registry+https://github.com/rust-lang/crates.io-index)" = "a9539db560102d1cef46b8b78ce737ff0bb64e7e18d35b2a5688f7d097d0ff03"
|
||||
"checksum thread_local 0.2.7 (registry+https://github.com/rust-lang/crates.io-index)" = "8576dbbfcaef9641452d5cf0df9b0e7eeab7694956dd33bb61515fb8f18cfdd5"
|
||||
"checksum utf8-ranges 0.1.3 (registry+https://github.com/rust-lang/crates.io-index)" = "a1ca13c08c41c9c3e04224ed9ff80461d97e121589ff27c753a16cb10830ae0f"
|
||||
"checksum walkdir 0.1.8 (registry+https://github.com/rust-lang/crates.io-index)" = "c66c0b9792f0a765345452775f3adbd28dde9d33f30d13e5dcc5ae17cf6f3780"
|
||||
"checksum winapi 0.2.8 (registry+https://github.com/rust-lang/crates.io-index)" = "167dc9d6949a9b857f3451275e911c3f44255842c1f7a76f33c55103a909087a"
|
||||
"checksum winapi-build 0.1.1 (registry+https://github.com/rust-lang/crates.io-index)" = "2d315eee3b34aca4797b2da6b13ed88266e6d612562a0c46390af8299fc699bc"
|
||||
36
2018-edition/Cargo.toml
Normal file
36
2018-edition/Cargo.toml
Normal file
@@ -0,0 +1,36 @@
|
||||
[package]
|
||||
name = "rust-book"
|
||||
version = "0.0.1"
|
||||
authors = ["Steve Klabnik <steve@steveklabnik.com>"]
|
||||
description = "The Rust Book"
|
||||
|
||||
[[bin]]
|
||||
name = "concat_chapters"
|
||||
path = "tools/src/bin/concat_chapters.rs"
|
||||
|
||||
[[bin]]
|
||||
name = "lfp"
|
||||
path = "tools/src/bin/lfp.rs"
|
||||
|
||||
[[bin]]
|
||||
name = "link2print"
|
||||
path = "tools/src/bin/link2print.rs"
|
||||
|
||||
[[bin]]
|
||||
name = "remove_links"
|
||||
path = "tools/src/bin/remove_links.rs"
|
||||
|
||||
[[bin]]
|
||||
name = "remove_markup"
|
||||
path = "tools/src/bin/remove_markup.rs"
|
||||
|
||||
[[bin]]
|
||||
name = "convert_quotes"
|
||||
path = "tools/src/bin/convert_quotes.rs"
|
||||
|
||||
[dependencies]
|
||||
walkdir = "0.1.5"
|
||||
docopt = "0.6.82"
|
||||
rustc-serialize = "0.3.19"
|
||||
regex = "0.1.73"
|
||||
lazy_static = "0.2.1"
|
||||
201
2018-edition/LICENSE-APACHE
Normal file
201
2018-edition/LICENSE-APACHE
Normal file
@@ -0,0 +1,201 @@
|
||||
Apache License
|
||||
Version 2.0, January 2004
|
||||
http://www.apache.org/licenses/
|
||||
|
||||
TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
|
||||
|
||||
1. Definitions.
|
||||
|
||||
"License" shall mean the terms and conditions for use, reproduction,
|
||||
and distribution as defined by Sections 1 through 9 of this document.
|
||||
|
||||
"Licensor" shall mean the copyright owner or entity authorized by
|
||||
the copyright owner that is granting the License.
|
||||
|
||||
"Legal Entity" shall mean the union of the acting entity and all
|
||||
other entities that control, are controlled by, or are under common
|
||||
control with that entity. For the purposes of this definition,
|
||||
"control" means (i) the power, direct or indirect, to cause the
|
||||
direction or management of such entity, whether by contract or
|
||||
otherwise, or (ii) ownership of fifty percent (50%) or more of the
|
||||
outstanding shares, or (iii) beneficial ownership of such entity.
|
||||
|
||||
"You" (or "Your") shall mean an individual or Legal Entity
|
||||
exercising permissions granted by this License.
|
||||
|
||||
"Source" form shall mean the preferred form for making modifications,
|
||||
including but not limited to software source code, documentation
|
||||
source, and configuration files.
|
||||
|
||||
"Object" form shall mean any form resulting from mechanical
|
||||
transformation or translation of a Source form, including but
|
||||
not limited to compiled object code, generated documentation,
|
||||
and conversions to other media types.
|
||||
|
||||
"Work" shall mean the work of authorship, whether in Source or
|
||||
Object form, made available under the License, as indicated by a
|
||||
copyright notice that is included in or attached to the work
|
||||
(an example is provided in the Appendix below).
|
||||
|
||||
"Derivative Works" shall mean any work, whether in Source or Object
|
||||
form, that is based on (or derived from) the Work and for which the
|
||||
editorial revisions, annotations, elaborations, or other modifications
|
||||
represent, as a whole, an original work of authorship. For the purposes
|
||||
of this License, Derivative Works shall not include works that remain
|
||||
separable from, or merely link (or bind by name) to the interfaces of,
|
||||
the Work and Derivative Works thereof.
|
||||
|
||||
"Contribution" shall mean any work of authorship, including
|
||||
the original version of the Work and any modifications or additions
|
||||
to that Work or Derivative Works thereof, that is intentionally
|
||||
submitted to Licensor for inclusion in the Work by the copyright owner
|
||||
or by an individual or Legal Entity authorized to submit on behalf of
|
||||
the copyright owner. For the purposes of this definition, "submitted"
|
||||
means any form of electronic, verbal, or written communication sent
|
||||
to the Licensor or its representatives, including but not limited to
|
||||
communication on electronic mailing lists, source code control systems,
|
||||
and issue tracking systems that are managed by, or on behalf of, the
|
||||
Licensor for the purpose of discussing and improving the Work, but
|
||||
excluding communication that is conspicuously marked or otherwise
|
||||
designated in writing by the copyright owner as "Not a Contribution."
|
||||
|
||||
"Contributor" shall mean Licensor and any individual or Legal Entity
|
||||
on behalf of whom a Contribution has been received by Licensor and
|
||||
subsequently incorporated within the Work.
|
||||
|
||||
2. Grant of Copyright License. Subject to the terms and conditions of
|
||||
this License, each Contributor hereby grants to You a perpetual,
|
||||
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
|
||||
copyright license to reproduce, prepare Derivative Works of,
|
||||
publicly display, publicly perform, sublicense, and distribute the
|
||||
Work and such Derivative Works in Source or Object form.
|
||||
|
||||
3. Grant of Patent License. Subject to the terms and conditions of
|
||||
this License, each Contributor hereby grants to You a perpetual,
|
||||
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
|
||||
(except as stated in this section) patent license to make, have made,
|
||||
use, offer to sell, sell, import, and otherwise transfer the Work,
|
||||
where such license applies only to those patent claims licensable
|
||||
by such Contributor that are necessarily infringed by their
|
||||
Contribution(s) alone or by combination of their Contribution(s)
|
||||
with the Work to which such Contribution(s) was submitted. If You
|
||||
institute patent litigation against any entity (including a
|
||||
cross-claim or counterclaim in a lawsuit) alleging that the Work
|
||||
or a Contribution incorporated within the Work constitutes direct
|
||||
or contributory patent infringement, then any patent licenses
|
||||
granted to You under this License for that Work shall terminate
|
||||
as of the date such litigation is filed.
|
||||
|
||||
4. Redistribution. You may reproduce and distribute copies of the
|
||||
Work or Derivative Works thereof in any medium, with or without
|
||||
modifications, and in Source or Object form, provided that You
|
||||
meet the following conditions:
|
||||
|
||||
(a) You must give any other recipients of the Work or
|
||||
Derivative Works a copy of this License; and
|
||||
|
||||
(b) You must cause any modified files to carry prominent notices
|
||||
stating that You changed the files; and
|
||||
|
||||
(c) You must retain, in the Source form of any Derivative Works
|
||||
that You distribute, all copyright, patent, trademark, and
|
||||
attribution notices from the Source form of the Work,
|
||||
excluding those notices that do not pertain to any part of
|
||||
the Derivative Works; and
|
||||
|
||||
(d) If the Work includes a "NOTICE" text file as part of its
|
||||
distribution, then any Derivative Works that You distribute must
|
||||
include a readable copy of the attribution notices contained
|
||||
within such NOTICE file, excluding those notices that do not
|
||||
pertain to any part of the Derivative Works, in at least one
|
||||
of the following places: within a NOTICE text file distributed
|
||||
as part of the Derivative Works; within the Source form or
|
||||
documentation, if provided along with the Derivative Works; or,
|
||||
within a display generated by the Derivative Works, if and
|
||||
wherever such third-party notices normally appear. The contents
|
||||
of the NOTICE file are for informational purposes only and
|
||||
do not modify the License. You may add Your own attribution
|
||||
notices within Derivative Works that You distribute, alongside
|
||||
or as an addendum to the NOTICE text from the Work, provided
|
||||
that such additional attribution notices cannot be construed
|
||||
as modifying the License.
|
||||
|
||||
You may add Your own copyright statement to Your modifications and
|
||||
may provide additional or different license terms and conditions
|
||||
for use, reproduction, or distribution of Your modifications, or
|
||||
for any such Derivative Works as a whole, provided Your use,
|
||||
reproduction, and distribution of the Work otherwise complies with
|
||||
the conditions stated in this License.
|
||||
|
||||
5. Submission of Contributions. Unless You explicitly state otherwise,
|
||||
any Contribution intentionally submitted for inclusion in the Work
|
||||
by You to the Licensor shall be under the terms and conditions of
|
||||
this License, without any additional terms or conditions.
|
||||
Notwithstanding the above, nothing herein shall supersede or modify
|
||||
the terms of any separate license agreement you may have executed
|
||||
with Licensor regarding such Contributions.
|
||||
|
||||
6. Trademarks. This License does not grant permission to use the trade
|
||||
names, trademarks, service marks, or product names of the Licensor,
|
||||
except as required for reasonable and customary use in describing the
|
||||
origin of the Work and reproducing the content of the NOTICE file.
|
||||
|
||||
7. Disclaimer of Warranty. Unless required by applicable law or
|
||||
agreed to in writing, Licensor provides the Work (and each
|
||||
Contributor provides its Contributions) on an "AS IS" BASIS,
|
||||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
|
||||
implied, including, without limitation, any warranties or conditions
|
||||
of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
|
||||
PARTICULAR PURPOSE. You are solely responsible for determining the
|
||||
appropriateness of using or redistributing the Work and assume any
|
||||
risks associated with Your exercise of permissions under this License.
|
||||
|
||||
8. Limitation of Liability. In no event and under no legal theory,
|
||||
whether in tort (including negligence), contract, or otherwise,
|
||||
unless required by applicable law (such as deliberate and grossly
|
||||
negligent acts) or agreed to in writing, shall any Contributor be
|
||||
liable to You for damages, including any direct, indirect, special,
|
||||
incidental, or consequential damages of any character arising as a
|
||||
result of this License or out of the use or inability to use the
|
||||
Work (including but not limited to damages for loss of goodwill,
|
||||
work stoppage, computer failure or malfunction, or any and all
|
||||
other commercial damages or losses), even if such Contributor
|
||||
has been advised of the possibility of such damages.
|
||||
|
||||
9. Accepting Warranty or Additional Liability. While redistributing
|
||||
the Work or Derivative Works thereof, You may choose to offer,
|
||||
and charge a fee for, acceptance of support, warranty, indemnity,
|
||||
or other liability obligations and/or rights consistent with this
|
||||
License. However, in accepting such obligations, You may act only
|
||||
on Your own behalf and on Your sole responsibility, not on behalf
|
||||
of any other Contributor, and only if You agree to indemnify,
|
||||
defend, and hold each Contributor harmless for any liability
|
||||
incurred by, or claims asserted against, such Contributor by reason
|
||||
of your accepting any such warranty or additional liability.
|
||||
|
||||
END OF TERMS AND CONDITIONS
|
||||
|
||||
APPENDIX: How to apply the Apache License to your work.
|
||||
|
||||
To apply the Apache License to your work, attach the following
|
||||
boilerplate notice, with the fields enclosed by brackets "[]"
|
||||
replaced with your own identifying information. (Don't include
|
||||
the brackets!) The text should be enclosed in the appropriate
|
||||
comment syntax for the file format. We also recommend that a
|
||||
file or class name and description of purpose be included on the
|
||||
same "printed page" as the copyright notice for easier
|
||||
identification within third-party archives.
|
||||
|
||||
Copyright 2010-2017 The Rust Project Developers
|
||||
|
||||
Licensed under the Apache License, Version 2.0 (the "License");
|
||||
you may not use this file except in compliance with the License.
|
||||
You may obtain a copy of the License at
|
||||
|
||||
http://www.apache.org/licenses/LICENSE-2.0
|
||||
|
||||
Unless required by applicable law or agreed to in writing, software
|
||||
distributed under the License is distributed on an "AS IS" BASIS,
|
||||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
See the License for the specific language governing permissions and
|
||||
limitations under the License.
|
||||
25
2018-edition/LICENSE-MIT
Normal file
25
2018-edition/LICENSE-MIT
Normal file
@@ -0,0 +1,25 @@
|
||||
Copyright (c) 2010-2017 The Rust Project Developers
|
||||
|
||||
Permission is hereby granted, free of charge, to any
|
||||
person obtaining a copy of this software and associated
|
||||
documentation files (the "Software"), to deal in the
|
||||
Software without restriction, including without
|
||||
limitation the rights to use, copy, modify, merge,
|
||||
publish, distribute, sublicense, and/or sell copies of
|
||||
the Software, and to permit persons to whom the Software
|
||||
is furnished to do so, subject to the following
|
||||
conditions:
|
||||
|
||||
The above copyright notice and this permission notice
|
||||
shall be included in all copies or substantial portions
|
||||
of the Software.
|
||||
|
||||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF
|
||||
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
|
||||
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
|
||||
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
|
||||
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
|
||||
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
|
||||
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
|
||||
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
||||
DEALINGS IN THE SOFTWARE.
|
||||
3
2018-edition/book.toml
Normal file
3
2018-edition/book.toml
Normal file
@@ -0,0 +1,3 @@
|
||||
[book]
|
||||
title = "The Rust Programming Language"
|
||||
author = "Steve Klabnik and Carol Nichols, with Contributions from the Rust Community"
|
||||
22
2018-edition/convert-quotes.sh
Normal file
22
2018-edition/convert-quotes.sh
Normal file
@@ -0,0 +1,22 @@
|
||||
#!/bin/bash
|
||||
# Copyright 2017 The Rust Project Developers. See the COPYRIGHT
|
||||
# file at the top-level directory of this distribution and at
|
||||
# http://rust-lang.org/COPYRIGHT.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||
# http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||
# <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||
# option. This file may not be copied, modified, or distributed
|
||||
# except according to those terms.
|
||||
|
||||
set -eu
|
||||
|
||||
dir=$1
|
||||
|
||||
mkdir -p "tmp/$dir"
|
||||
|
||||
for f in $dir/*.md
|
||||
do
|
||||
cat "$f" | cargo run --bin convert_quotes > "tmp/$f"
|
||||
mv "tmp/$f" "$f"
|
||||
done
|
||||
502
2018-edition/dictionary.txt
Normal file
502
2018-edition/dictionary.txt
Normal file
@@ -0,0 +1,502 @@
|
||||
personal_ws-1.1 en 0 utf-8
|
||||
abcabcabc
|
||||
abcd
|
||||
abcdefghijklmnopqrstuvwxyz
|
||||
adaptor
|
||||
adaptors
|
||||
AddAssign
|
||||
Addr
|
||||
aggregator
|
||||
AGraph
|
||||
aliasability
|
||||
alignof
|
||||
alloc
|
||||
allocator
|
||||
Amir
|
||||
anotherusername
|
||||
APIs
|
||||
app's
|
||||
aren
|
||||
args
|
||||
associativity
|
||||
async
|
||||
atomics
|
||||
AveragedCollection
|
||||
backend
|
||||
backported
|
||||
backtrace
|
||||
backtraces
|
||||
BACKTRACE
|
||||
Backtraces
|
||||
Baz’s
|
||||
benchmarking
|
||||
bioinformatics
|
||||
bitand
|
||||
BitAnd
|
||||
BitAndAssign
|
||||
bitor
|
||||
BitOr
|
||||
BitOrAssign
|
||||
bitwise
|
||||
Bitwise
|
||||
bitxor
|
||||
BitXor
|
||||
BitXorAssign
|
||||
Bjarne
|
||||
Boehm
|
||||
bool
|
||||
Boolean
|
||||
Booleans
|
||||
Bors
|
||||
BorrowMutError
|
||||
BTreeSet
|
||||
BuildHasher
|
||||
Cacher
|
||||
Cagain
|
||||
callsite
|
||||
CamelCase
|
||||
cargodoc
|
||||
ChangeColor
|
||||
ChangeColorMessage
|
||||
charset
|
||||
choo
|
||||
chXX
|
||||
chYY
|
||||
coercions
|
||||
combinator
|
||||
ConcreteType
|
||||
config
|
||||
Config
|
||||
const
|
||||
constant's
|
||||
copyeditor
|
||||
couldn
|
||||
CPUs
|
||||
cratesio
|
||||
CRLF
|
||||
cryptocurrencies
|
||||
cryptographic
|
||||
cryptographically
|
||||
CStr
|
||||
CString
|
||||
ctrl
|
||||
Ctrl
|
||||
customizable
|
||||
CustomSmartPointer
|
||||
CustomSmartPointers
|
||||
data’s
|
||||
deallocate
|
||||
deallocated
|
||||
deallocating
|
||||
deallocation
|
||||
debuginfo
|
||||
decrementing
|
||||
deps
|
||||
deref
|
||||
Deref
|
||||
dereference
|
||||
Dereference
|
||||
dereferenced
|
||||
dereferences
|
||||
dereferencing
|
||||
DerefMut
|
||||
DeriveInput
|
||||
destructor
|
||||
destructure
|
||||
destructured
|
||||
destructures
|
||||
destructuring
|
||||
Destructuring
|
||||
deterministically
|
||||
DevOps
|
||||
didn
|
||||
Dobrý
|
||||
doccargo
|
||||
doccratesio
|
||||
DOCTYPE
|
||||
doesn
|
||||
disambiguating
|
||||
DivAssign
|
||||
DraftPost
|
||||
DSTs
|
||||
ebooks
|
||||
Edsger
|
||||
egular
|
||||
else's
|
||||
emoji
|
||||
encodings
|
||||
enum
|
||||
Enum
|
||||
enums
|
||||
enum's
|
||||
Enums
|
||||
eprintln
|
||||
Erlang
|
||||
ErrorKind
|
||||
Executables
|
||||
expr
|
||||
extern
|
||||
favicon
|
||||
FFFD
|
||||
FFFF
|
||||
figcaption
|
||||
fieldname
|
||||
filename
|
||||
Filename
|
||||
filesystem
|
||||
Filesystem
|
||||
filesystems
|
||||
Firefox
|
||||
FnBox
|
||||
FnMut
|
||||
FnOnce
|
||||
formatter
|
||||
formatters
|
||||
FrenchToast
|
||||
FromIterator
|
||||
frontend
|
||||
getter
|
||||
GGraph
|
||||
GitHub
|
||||
gitignore
|
||||
grapheme
|
||||
Grapheme
|
||||
growable
|
||||
gzip
|
||||
hardcode
|
||||
hardcoded
|
||||
hardcoding
|
||||
hasher
|
||||
hashers
|
||||
HashMap
|
||||
HashSet
|
||||
Haskell
|
||||
hasn
|
||||
HelloMacro
|
||||
helloworld
|
||||
HelloWorld
|
||||
HelloWorldName
|
||||
Hmmm
|
||||
Hoare
|
||||
Hola
|
||||
homogenous
|
||||
html
|
||||
hyperoptimize
|
||||
Iceburgh
|
||||
ident
|
||||
IDE
|
||||
IDEs
|
||||
IDE's
|
||||
IEEE
|
||||
impl
|
||||
implementor
|
||||
implementors
|
||||
ImportantExcerpt
|
||||
incrementing
|
||||
IndexMut
|
||||
indices
|
||||
init
|
||||
initializer
|
||||
inline
|
||||
instantiation
|
||||
internet
|
||||
IntoIterator
|
||||
InvalidDigit
|
||||
invariants
|
||||
ioerror
|
||||
iokind
|
||||
ioresult
|
||||
iostdin
|
||||
IpAddr
|
||||
IpAddrKind
|
||||
irst
|
||||
isize
|
||||
iter
|
||||
iterator's
|
||||
JavaScript
|
||||
JoinHandle
|
||||
Kay's
|
||||
kinded
|
||||
lang
|
||||
latin
|
||||
liballoc
|
||||
libc
|
||||
libcollections
|
||||
libcore
|
||||
libpanic
|
||||
librarys
|
||||
libreoffice
|
||||
libstd
|
||||
lifecycle
|
||||
LimitTracker
|
||||
LLVM
|
||||
lobally
|
||||
locators
|
||||
LockResult
|
||||
login
|
||||
lookup
|
||||
loopback
|
||||
lossy
|
||||
lval
|
||||
macOS
|
||||
Matsakis
|
||||
mathematic
|
||||
memoization
|
||||
metadata
|
||||
Metadata
|
||||
metaprogramming
|
||||
mibbit
|
||||
Mibbit
|
||||
millis
|
||||
minigrep
|
||||
mixup
|
||||
mkdir
|
||||
MockMessenger
|
||||
modifiability
|
||||
modularity
|
||||
monomorphization
|
||||
Monomorphization
|
||||
monomorphized
|
||||
MoveMessage
|
||||
Mozilla
|
||||
mpsc
|
||||
msvc
|
||||
MulAssign
|
||||
multibyte
|
||||
multithreaded
|
||||
mutex
|
||||
mutex's
|
||||
Mutex
|
||||
mutexes
|
||||
Mutexes
|
||||
MutexGuard
|
||||
MyBox
|
||||
namespace
|
||||
namespaced
|
||||
namespaces
|
||||
namespacing
|
||||
natively
|
||||
newfound
|
||||
NewJob
|
||||
NewsArticle
|
||||
NewThread
|
||||
newtype
|
||||
newtypes
|
||||
nitty
|
||||
nocapture
|
||||
nomicon
|
||||
nondeterministic
|
||||
nonequality
|
||||
nongeneric
|
||||
NotFound
|
||||
null's
|
||||
OCaml
|
||||
offsetof
|
||||
online
|
||||
OpenGL
|
||||
optimizations
|
||||
OptionalFloatingPointNumber
|
||||
OptionalNumber
|
||||
OsStr
|
||||
OsString
|
||||
other's
|
||||
OutlinePrint
|
||||
overloadable
|
||||
overread
|
||||
param
|
||||
parameterize
|
||||
ParseIntError
|
||||
PartialEq
|
||||
PartialOrd
|
||||
PendingReview
|
||||
PendingReviewPost
|
||||
PlaceholderType
|
||||
polymorphism
|
||||
PoolCreationError
|
||||
portia
|
||||
powershell
|
||||
PowerShell
|
||||
powi
|
||||
preprocessing
|
||||
Preprocessing
|
||||
preprocessor
|
||||
PrimaryColor
|
||||
println
|
||||
priv
|
||||
proc
|
||||
pthreads
|
||||
pushups
|
||||
QuitMessage
|
||||
quux
|
||||
RAII
|
||||
randcrate
|
||||
RangeFrom
|
||||
RangeTo
|
||||
RangeFull
|
||||
README
|
||||
READMEs
|
||||
rect
|
||||
recurse
|
||||
recv
|
||||
redeclaring
|
||||
Refactoring
|
||||
refactor
|
||||
refactoring
|
||||
refcell
|
||||
RefCell
|
||||
RefMut
|
||||
refutability
|
||||
reimplement
|
||||
RemAssign
|
||||
repr
|
||||
representable
|
||||
request's
|
||||
resizes
|
||||
resizing
|
||||
retweet
|
||||
rewordings
|
||||
rint
|
||||
ripgrep
|
||||
runnable
|
||||
runtime
|
||||
runtimes
|
||||
Rustacean
|
||||
Rustaceans
|
||||
rUsT
|
||||
rustc
|
||||
rustdoc
|
||||
Rustonomicon
|
||||
rustfmt
|
||||
rustup
|
||||
screenshot
|
||||
searchstring
|
||||
SecondaryColor
|
||||
SelectBox
|
||||
semver
|
||||
SemVer
|
||||
serde
|
||||
ShlAssign
|
||||
ShrAssign
|
||||
shouldn
|
||||
Simula
|
||||
situps
|
||||
sizeof
|
||||
Smalltalk
|
||||
snuck
|
||||
someproject
|
||||
someusername
|
||||
SPDX
|
||||
spdx
|
||||
SpreadsheetCell
|
||||
sqrt
|
||||
stackoverflow
|
||||
startup
|
||||
StaticRef
|
||||
stderr
|
||||
stdin
|
||||
Stdin
|
||||
stdlib
|
||||
stdout
|
||||
steveklabnik's
|
||||
stringify
|
||||
Stroustrup
|
||||
Stroustrup's
|
||||
struct
|
||||
Struct
|
||||
structs
|
||||
struct's
|
||||
Structs
|
||||
SubAssign
|
||||
subclasses
|
||||
subcommand
|
||||
subcommands
|
||||
subdirectories
|
||||
subdirectory
|
||||
submodule
|
||||
submodules
|
||||
Submodules
|
||||
suboptimal
|
||||
substring
|
||||
subteams
|
||||
subtree
|
||||
subtyping
|
||||
supertrait
|
||||
supertraits
|
||||
TcpListener
|
||||
TcpStream
|
||||
templating
|
||||
test's
|
||||
TextField
|
||||
That'd
|
||||
there'd
|
||||
ThreadPool
|
||||
timestamp
|
||||
Tiếng
|
||||
timeline
|
||||
tlborm
|
||||
TODO
|
||||
TokenStream
|
||||
toml
|
||||
TOML
|
||||
toolchain
|
||||
toolchains
|
||||
ToString
|
||||
tradeoff
|
||||
tradeoffs
|
||||
TrafficLight
|
||||
transcoding
|
||||
trpl
|
||||
tuesday
|
||||
tuple
|
||||
tuples
|
||||
turbofish
|
||||
Turon
|
||||
typeof
|
||||
TypeName
|
||||
UFCS
|
||||
unary
|
||||
Unary
|
||||
uncomment
|
||||
Uncomment
|
||||
unevaluated
|
||||
Uninstalling
|
||||
uninstall
|
||||
unix
|
||||
unpopulated
|
||||
unoptimized
|
||||
UnsafeCell
|
||||
unsafety
|
||||
unsized
|
||||
unsynchronized
|
||||
URIs
|
||||
UsefulType
|
||||
username
|
||||
USERPROFILE
|
||||
usize
|
||||
UsState
|
||||
utils
|
||||
vals
|
||||
variable's
|
||||
variant's
|
||||
vers
|
||||
versa
|
||||
Versioning
|
||||
visualstudio
|
||||
Vlissides
|
||||
vtable
|
||||
wasn
|
||||
WeatherForecast
|
||||
WebSocket
|
||||
whitespace
|
||||
wildcard
|
||||
wildcards
|
||||
workflow
|
||||
workspace
|
||||
workspaces
|
||||
Workspaces
|
||||
wouldn
|
||||
writeln
|
||||
WriteMessage
|
||||
xpression
|
||||
yyyy
|
||||
ZipImpl
|
||||
26
2018-edition/dot/trpl04-01.dot
Normal file
26
2018-edition/dot/trpl04-01.dot
Normal file
@@ -0,0 +1,26 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table0[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s1</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
table1[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD>index</TD><TD>value</TD></TR>
|
||||
<TR><TD PORT="pointee">0</TD><TD>h</TD></TR>
|
||||
<TR><TD>1</TD><TD>e</TD></TR>
|
||||
<TR><TD>2</TD><TD>l</TD></TR>
|
||||
<TR><TD>3</TD><TD>l</TD></TR>
|
||||
<TR><TD>4</TD><TD>o</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
edge[tailclip="false"];
|
||||
table0:pointer:c -> table1:pointee;
|
||||
}
|
||||
|
||||
35
2018-edition/dot/trpl04-02.dot
Normal file
35
2018-edition/dot/trpl04-02.dot
Normal file
@@ -0,0 +1,35 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table0[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s1</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
table3[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s2</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table1[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD>index</TD><TD>value</TD></TR>
|
||||
<TR><TD PORT="pointee">0</TD><TD>h</TD></TR>
|
||||
<TR><TD>1</TD><TD>e</TD></TR>
|
||||
<TR><TD>2</TD><TD>l</TD></TR>
|
||||
<TR><TD>3</TD><TD>l</TD></TR>
|
||||
<TR><TD>4</TD><TD>o</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
edge[tailclip="false"];
|
||||
table0:pointer:c -> table1:pointee;
|
||||
table3:pointer:c -> table1:pointee;
|
||||
}
|
||||
|
||||
44
2018-edition/dot/trpl04-03.dot
Normal file
44
2018-edition/dot/trpl04-03.dot
Normal file
@@ -0,0 +1,44 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table0[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s2</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
table1[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD>index</TD><TD>value</TD></TR>
|
||||
<TR><TD PORT="pointee">0</TD><TD>h</TD></TR>
|
||||
<TR><TD>1</TD><TD>e</TD></TR>
|
||||
<TR><TD>2</TD><TD>l</TD></TR>
|
||||
<TR><TD>3</TD><TD>l</TD></TR>
|
||||
<TR><TD>4</TD><TD>o</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table3[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s1</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
table4[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD>index</TD><TD>value</TD></TR>
|
||||
<TR><TD PORT="pointee">0</TD><TD>h</TD></TR>
|
||||
<TR><TD>1</TD><TD>e</TD></TR>
|
||||
<TR><TD>2</TD><TD>l</TD></TR>
|
||||
<TR><TD>3</TD><TD>l</TD></TR>
|
||||
<TR><TD>4</TD><TD>o</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
|
||||
edge[tailclip="false"];
|
||||
table0:pointer:c -> table1:pointee;
|
||||
table3:pointer:c -> table4:pointee;
|
||||
}
|
||||
|
||||
35
2018-edition/dot/trpl04-04.dot
Normal file
35
2018-edition/dot/trpl04-04.dot
Normal file
@@ -0,0 +1,35 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table0[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0" BGCOLOR="gray">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s1</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
table3[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s2</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table1[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD>index</TD><TD>value</TD></TR>
|
||||
<TR><TD PORT="pointee">0</TD><TD>h</TD></TR>
|
||||
<TR><TD>1</TD><TD>e</TD></TR>
|
||||
<TR><TD>2</TD><TD>l</TD></TR>
|
||||
<TR><TD>3</TD><TD>l</TD></TR>
|
||||
<TR><TD>4</TD><TD>o</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
edge[tailclip="false"];
|
||||
table0:pointer:c -> table1:pointee;
|
||||
table3:pointer:c -> table1:pointee;
|
||||
}
|
||||
|
||||
32
2018-edition/dot/trpl04-05.dot
Normal file
32
2018-edition/dot/trpl04-05.dot
Normal file
@@ -0,0 +1,32 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table0[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="borrower"></TD></TR>
|
||||
</TABLE>>];
|
||||
table1[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s1</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD PORT="borrowee">ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
table2[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD>index</TD><TD>value</TD></TR>
|
||||
<TR><TD PORT="pointee">0</TD><TD>h</TD></TR>
|
||||
<TR><TD>1</TD><TD>e</TD></TR>
|
||||
<TR><TD>2</TD><TD>l</TD></TR>
|
||||
<TR><TD>3</TD><TD>l</TD></TR>
|
||||
<TR><TD>4</TD><TD>o</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
edge[tailclip="false"];
|
||||
table1:pointer:c -> table2:pointee;
|
||||
table0:borrower:c -> table1:borrowee;
|
||||
}
|
||||
|
||||
41
2018-edition/dot/trpl04-06.dot
Normal file
41
2018-edition/dot/trpl04-06.dot
Normal file
@@ -0,0 +1,41 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table0[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">world</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer2"></TD></TR>
|
||||
<TR><TD>len</TD><TD>5</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table3[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">s</TD></TR>
|
||||
<TR><TD>name</TD><TD>value</TD></TR>
|
||||
<TR><TD>ptr</TD><TD PORT="pointer"></TD></TR>
|
||||
<TR><TD>len</TD><TD>11</TD></TR>
|
||||
<TR><TD>capacity</TD><TD>11</TD></TR>
|
||||
</TABLE>>];
|
||||
table4[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD>index</TD><TD>value</TD></TR>
|
||||
<TR><TD PORT="pointee">0</TD><TD>h</TD></TR>
|
||||
<TR><TD>1</TD><TD>e</TD></TR>
|
||||
<TR><TD>2</TD><TD>l</TD></TR>
|
||||
<TR><TD>3</TD><TD>l</TD></TR>
|
||||
<TR><TD>4</TD><TD>o</TD></TR>
|
||||
<TR><TD>5</TD><TD> </TD></TR>
|
||||
<TR><TD PORT="pointee2">6</TD><TD>w</TD></TR>
|
||||
<TR><TD>7</TD><TD>o</TD></TR>
|
||||
<TR><TD>8</TD><TD>r</TD></TR>
|
||||
<TR><TD>9</TD><TD>l</TD></TR>
|
||||
<TR><TD>10</TD><TD>d</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
|
||||
edge[tailclip="false"];
|
||||
table0:pointer2:c -> table4:pointee2;
|
||||
table3:pointer:c -> table4:pointee;
|
||||
}
|
||||
|
||||
24
2018-edition/dot/trpl15-01.dot
Normal file
24
2018-edition/dot/trpl15-01.dot
Normal file
@@ -0,0 +1,24 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table0[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">Cons</TD></TR>
|
||||
<TR><TD>i32</TD><TD><TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">Cons</TD></TR>
|
||||
<TR><TD>i32</TD><TD><TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">Cons</TD></TR>
|
||||
<TR><TD>i32</TD><TD><TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">Cons</TD></TR>
|
||||
<TR><TD>i32</TD><TD><TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">Cons</TD></TR>
|
||||
<TR><TD>i32</TD><TD>∞</TD></TR>
|
||||
</TABLE></TD></TR>
|
||||
</TABLE></TD></TR>
|
||||
</TABLE></TD></TR>
|
||||
</TABLE></TD></TR>
|
||||
</TABLE>>];
|
||||
}
|
||||
|
||||
18
2018-edition/dot/trpl15-02.dot
Normal file
18
2018-edition/dot/trpl15-02.dot
Normal file
@@ -0,0 +1,18 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table0[label=<
|
||||
<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD COLSPAN="2" SIDES="B">Cons</TD></TR>
|
||||
<TR><TD>i32</TD><TD>
|
||||
<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD SIDES="B">Box</TD></TR>
|
||||
<TR><TD>usize</TD></TR>
|
||||
</TABLE>
|
||||
</TD></TR>
|
||||
</TABLE>>];
|
||||
}
|
||||
|
||||
51
2018-edition/dot/trpl15-03.dot
Normal file
51
2018-edition/dot/trpl15-03.dot
Normal file
@@ -0,0 +1,51 @@
|
||||
digraph {
|
||||
rankdir=LR;
|
||||
overlap=false;
|
||||
dpi=300.0;
|
||||
node [shape="plaintext"];
|
||||
|
||||
table4[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD SIDES="B">b</TD><TD SIDES="B" PORT="ptr4"></TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table5[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD PORT="pte4">3</TD><TD PORT="ptr5"> </TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
|
||||
table0[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD SIDES="B">a</TD><TD SIDES="B" PORT="ptr0"></TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table1[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD PORT="pte0">5</TD><TD PORT="ptr1"> </TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table2[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD PORT="pte1">10</TD><TD PORT="ptr2"> </TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table3[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD PORT="pte2">Nil</TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
|
||||
table6[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD SIDES="B">c</TD><TD SIDES="B" PORT="ptr6"></TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
table7[label=<<TABLE BORDER="0" CELLBORDER="1" CELLSPACING="0">
|
||||
<TR><TD PORT="pte6">4</TD><TD PORT="ptr7"> </TD></TR>
|
||||
</TABLE>>];
|
||||
|
||||
|
||||
edge[tailclip="false"];
|
||||
table0:ptr0:c -> table1:pte0;
|
||||
table1:ptr1:c -> table2:pte1;
|
||||
table2:ptr2:c -> table3:pte2;
|
||||
table4:ptr4:c -> table5:pte4;
|
||||
table5:ptr5:c -> table1:pte0;
|
||||
table6:ptr6:c -> table7:pte6;
|
||||
table7:ptr7:c -> table1:pte0;
|
||||
}
|
||||
|
||||
101
2018-edition/spellcheck.sh
Normal file
101
2018-edition/spellcheck.sh
Normal file
@@ -0,0 +1,101 @@
|
||||
#!/bin/bash
|
||||
# Copyright 2016 The Rust Project Developers. See the COPYRIGHT
|
||||
# file at the top-level directory of this distribution and at
|
||||
# http://rust-lang.org/COPYRIGHT.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||
# http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||
# <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||
# option. This file may not be copied, modified, or distributed
|
||||
# except according to those terms.
|
||||
|
||||
aspell --version
|
||||
|
||||
# Checks project markdown files for spell errors
|
||||
|
||||
# Notes:
|
||||
|
||||
# This script needs dictionary file ($dict_filename) with project-specific
|
||||
# valid words. If this file is missing, first invocation of a script generates
|
||||
# a file of words considered typos at the moment. User should remove real typos
|
||||
# from this file and leave only valid words. When script generates false
|
||||
# positive after source modification, new valid word should be added
|
||||
# to dictionary file.
|
||||
|
||||
# Default mode of this script is interactive. Each source file is scanned for
|
||||
# typos. aspell opens window, suggesting fixes for each found typo. Original
|
||||
# files with errors will be backed up to files with format "filename.md.bak".
|
||||
|
||||
# When running in CI, this script should be run in "list" mode (pass "list"
|
||||
# as first argument). In this mode script scans all files and reports found
|
||||
# errors. Exit code in this case depends on scan result:
|
||||
# 1 if any errors found,
|
||||
# 0 if all is clear.
|
||||
|
||||
# Script skips words with length less than or equal to 3. This helps to avoid
|
||||
# some false positives.
|
||||
|
||||
# We can consider skipping source code in markdown files (```code```) to reduce
|
||||
# rate of false positives, but then we lose ability to detect typos in code
|
||||
# comments/strings etc.
|
||||
|
||||
shopt -s nullglob
|
||||
|
||||
dict_filename=./dictionary.txt
|
||||
markdown_sources=(./src/*.md)
|
||||
mode="check"
|
||||
|
||||
# aspell repeatedly modifies personal dictionary for some purpose,
|
||||
# so we should use a copy of our dictionary
|
||||
dict_path="/tmp/$dict_filename"
|
||||
|
||||
if [[ "$1" == "list" ]]; then
|
||||
mode="list"
|
||||
fi
|
||||
|
||||
if [[ ! -f "$dict_filename" ]]; then
|
||||
# Pre-check mode: generates dictionary of words aspell consider typos.
|
||||
# After user validates that this file contains only valid words, we can
|
||||
# look for typos using this dictionary and some default aspell dictionary.
|
||||
echo "Scanning files to generate dictionary file '$dict_filename'."
|
||||
echo "Please check that it doesn't contain any misspellings."
|
||||
|
||||
echo "personal_ws-1.1 en 0 utf-8" > "$dict_filename"
|
||||
cat "${markdown_sources[@]}" | aspell --ignore 3 list | sort -u >> "$dict_filename"
|
||||
elif [[ "$mode" == "list" ]]; then
|
||||
# List (default) mode: scan all files, report errors
|
||||
declare -i retval=0
|
||||
|
||||
cp "$dict_filename" "$dict_path"
|
||||
|
||||
if [ ! -f $dict_path ]; then
|
||||
retval=1
|
||||
exit "$retval"
|
||||
fi
|
||||
|
||||
for fname in "${markdown_sources[@]}"; do
|
||||
command=$(aspell --ignore 3 --personal="$dict_path" "$mode" < "$fname")
|
||||
if [[ -n "$command" ]]; then
|
||||
for error in $command; do
|
||||
# FIXME: Find more correct way to get line number
|
||||
# (ideally from aspell). Now it can make some false positives,
|
||||
# because it is just a grep
|
||||
grep --with-filename --line-number --color=always "$error" "$fname"
|
||||
done
|
||||
retval=1
|
||||
fi
|
||||
done
|
||||
exit "$retval"
|
||||
elif [[ "$mode" == "check" ]]; then
|
||||
# Interactive mode: fix typos
|
||||
cp "$dict_filename" "$dict_path"
|
||||
|
||||
if [ ! -f $dict_path ]; then
|
||||
retval=1
|
||||
exit "$retval"
|
||||
fi
|
||||
|
||||
for fname in "${markdown_sources[@]}"; do
|
||||
aspell --ignore 3 --dont-backup --personal="$dict_path" "$mode" "$fname"
|
||||
done
|
||||
fi
|
||||
132
2018-edition/src/SUMMARY.md
Normal file
132
2018-edition/src/SUMMARY.md
Normal file
@@ -0,0 +1,132 @@
|
||||
# The Rust Programming Language
|
||||
|
||||
[Foreword](foreword.md)
|
||||
[Introduction](ch00-00-introduction.md)
|
||||
|
||||
## Getting started
|
||||
|
||||
- [Getting Started](ch01-00-getting-started.md)
|
||||
- [Installation](ch01-01-installation.md)
|
||||
- [Hello, World!](ch01-02-hello-world.md)
|
||||
- [Hello, Cargo!](ch01-03-hello-cargo.md)
|
||||
|
||||
- [Programming a Guessing Game](ch02-00-guessing-game-tutorial.md)
|
||||
|
||||
- [Common Programming Concepts](ch03-00-common-programming-concepts.md)
|
||||
- [Variables and Mutability](ch03-01-variables-and-mutability.md)
|
||||
- [Data Types](ch03-02-data-types.md)
|
||||
- [How Functions Work](ch03-03-how-functions-work.md)
|
||||
- [Comments](ch03-04-comments.md)
|
||||
- [Control Flow](ch03-05-control-flow.md)
|
||||
|
||||
- [Understanding Ownership](ch04-00-understanding-ownership.md)
|
||||
- [What is Ownership?](ch04-01-what-is-ownership.md)
|
||||
- [References & Borrowing](ch04-02-references-and-borrowing.md)
|
||||
- [Slices](ch04-03-slices.md)
|
||||
|
||||
- [Using Structs to Structure Related Data](ch05-00-structs.md)
|
||||
- [Defining and Instantiating Structs](ch05-01-defining-structs.md)
|
||||
- [An Example Program Using Structs](ch05-02-example-structs.md)
|
||||
- [Method Syntax](ch05-03-method-syntax.md)
|
||||
|
||||
- [Enums and Pattern Matching](ch06-00-enums.md)
|
||||
- [Defining an Enum](ch06-01-defining-an-enum.md)
|
||||
- [The `match` Control Flow Operator](ch06-02-match.md)
|
||||
- [Concise Control Flow with `if let`](ch06-03-if-let.md)
|
||||
|
||||
## Basic Rust Literacy
|
||||
|
||||
- [Modules](ch07-00-modules.md)
|
||||
- [`mod` and the Filesystem](ch07-01-mod-and-the-filesystem.md)
|
||||
- [Controlling Visibility with `pub`](ch07-02-controlling-visibility-with-pub.md)
|
||||
- [Referring to Names in Different Modules](ch07-03-importing-names-with-use.md)
|
||||
|
||||
- [Common Collections](ch08-00-common-collections.md)
|
||||
- [Vectors](ch08-01-vectors.md)
|
||||
- [Strings](ch08-02-strings.md)
|
||||
- [Hash Maps](ch08-03-hash-maps.md)
|
||||
|
||||
- [Error Handling](ch09-00-error-handling.md)
|
||||
- [Unrecoverable Errors with `panic!`](ch09-01-unrecoverable-errors-with-panic.md)
|
||||
- [Recoverable Errors with `Result`](ch09-02-recoverable-errors-with-result.md)
|
||||
- [To `panic!` or Not To `panic!`](ch09-03-to-panic-or-not-to-panic.md)
|
||||
|
||||
- [Generic Types, Traits, and Lifetimes](ch10-00-generics.md)
|
||||
- [Generic Data Types](ch10-01-syntax.md)
|
||||
- [Traits: Defining Shared Behavior](ch10-02-traits.md)
|
||||
- [Validating References with Lifetimes](ch10-03-lifetime-syntax.md)
|
||||
|
||||
- [Testing](ch11-00-testing.md)
|
||||
- [Writing tests](ch11-01-writing-tests.md)
|
||||
- [Running tests](ch11-02-running-tests.md)
|
||||
- [Test Organization](ch11-03-test-organization.md)
|
||||
|
||||
- [An I/O Project: Building a Command Line Program](ch12-00-an-io-project.md)
|
||||
- [Accepting Command Line Arguments](ch12-01-accepting-command-line-arguments.md)
|
||||
- [Reading a File](ch12-02-reading-a-file.md)
|
||||
- [Refactoring to Improve Modularity and Error Handling](ch12-03-improving-error-handling-and-modularity.md)
|
||||
- [Developing the Library’s Functionality with Test Driven Development](ch12-04-testing-the-librarys-functionality.md)
|
||||
- [Working with Environment Variables](ch12-05-working-with-environment-variables.md)
|
||||
- [Writing Error Messages to Standard Error Instead of Standard Output](ch12-06-writing-to-stderr-instead-of-stdout.md)
|
||||
|
||||
## Thinking in Rust
|
||||
|
||||
- [Functional Language Features: Iterators and Closures](ch13-00-functional-features.md)
|
||||
- [Closures: Anonymous Functions that Can Capture Their Environment](ch13-01-closures.md)
|
||||
- [Processing a Series of Items with Iterators](ch13-02-iterators.md)
|
||||
- [Improving Our I/O Project](ch13-03-improving-our-io-project.md)
|
||||
- [Comparing Performance: Loops vs. Iterators](ch13-04-performance.md)
|
||||
|
||||
- [More about Cargo and Crates.io](ch14-00-more-about-cargo.md)
|
||||
- [Customizing Builds with Release Profiles](ch14-01-release-profiles.md)
|
||||
- [Publishing a Crate to Crates.io](ch14-02-publishing-to-crates-io.md)
|
||||
- [Cargo Workspaces](ch14-03-cargo-workspaces.md)
|
||||
- [Installing Binaries from Crates.io with `cargo install`](ch14-04-installing-binaries.md)
|
||||
- [Extending Cargo with Custom Commands](ch14-05-extending-cargo.md)
|
||||
|
||||
- [Smart Pointers](ch15-00-smart-pointers.md)
|
||||
- [`Box<T>` Points to Data on the Heap and Has a Known Size](ch15-01-box.md)
|
||||
- [The `Deref` Trait Allows Access to the Data Through a Reference](ch15-02-deref.md)
|
||||
- [The `Drop` Trait Runs Code on Cleanup](ch15-03-drop.md)
|
||||
- [`Rc<T>`, the Reference Counted Smart Pointer](ch15-04-rc.md)
|
||||
- [`RefCell<T>` and the Interior Mutability Pattern](ch15-05-interior-mutability.md)
|
||||
- [Creating Reference Cycles and Leaking Memory is Safe](ch15-06-reference-cycles.md)
|
||||
|
||||
- [Fearless Concurrency](ch16-00-concurrency.md)
|
||||
- [Threads](ch16-01-threads.md)
|
||||
- [Message Passing](ch16-02-message-passing.md)
|
||||
- [Shared State](ch16-03-shared-state.md)
|
||||
- [Extensible Concurrency: `Sync` and `Send`](ch16-04-extensible-concurrency-sync-and-send.md)
|
||||
|
||||
- [Object Oriented Programming Features of Rust](ch17-00-oop.md)
|
||||
- [Characteristics of Object-Oriented Languages](ch17-01-what-is-oo.md)
|
||||
- [Using Trait Objects that Allow for Values of Different Types](ch17-02-trait-objects.md)
|
||||
- [Implementing an Object-Oriented Design Pattern](ch17-03-oo-design-patterns.md)
|
||||
|
||||
## Advanced Topics
|
||||
|
||||
- [Patterns Match the Structure of Values](ch18-00-patterns.md)
|
||||
- [All the Places Patterns May be Used](ch18-01-all-the-places-for-patterns.md)
|
||||
- [Refutability: Whether a Pattern Might Fail to Match](ch18-02-refutability.md)
|
||||
- [All the Pattern Syntax](ch18-03-pattern-syntax.md)
|
||||
|
||||
- [Advanced Features](ch19-00-advanced-features.md)
|
||||
- [Unsafe Rust](ch19-01-unsafe-rust.md)
|
||||
- [Advanced Lifetimes](ch19-02-advanced-lifetimes.md)
|
||||
- [Advanced Traits](ch19-03-advanced-traits.md)
|
||||
- [Advanced Types](ch19-04-advanced-types.md)
|
||||
- [Advanced Functions & Closures](ch19-05-advanced-functions-and-closures.md)
|
||||
|
||||
- [Final Project: Building a Multithreaded Web Server](ch20-00-final-project-a-web-server.md)
|
||||
- [A Single Threaded Web Server](ch20-01-single-threaded.md)
|
||||
- [Turning our Single Threaded Server into a Multithreaded Server](ch20-02-multithreaded.md)
|
||||
- [Graceful Shutdown and Cleanup](ch20-03-graceful-shutdown-and-cleanup.md)
|
||||
|
||||
- [Appendix](appendix-00.md)
|
||||
- [A - Keywords](appendix-01-keywords.md)
|
||||
- [B - Operators and Symbols](appendix-02-operators.md)
|
||||
- [C - Derivable Traits](appendix-03-derivable-traits.md)
|
||||
- [D - Macros](appendix-04-macros.md)
|
||||
- [E - Translations](appendix-05-translation.md)
|
||||
- [F - Newest Features](appendix-06-newest-features.md)
|
||||
- [G - How Rust is Made and “Nightly Rust”](appendix-07-nightly-rust.md)
|
||||
4
2018-edition/src/appendix-00.md
Normal file
4
2018-edition/src/appendix-00.md
Normal file
@@ -0,0 +1,4 @@
|
||||
# Appendix
|
||||
|
||||
The following sections contain reference material you may find useful in your
|
||||
Rust journey.
|
||||
80
2018-edition/src/appendix-01-keywords.md
Normal file
80
2018-edition/src/appendix-01-keywords.md
Normal file
@@ -0,0 +1,80 @@
|
||||
## Appendix A: Keywords
|
||||
|
||||
The following is a list of keywords that are reserved for current or future use
|
||||
by the Rust language. As such, these may not be used as identifiers, such as
|
||||
names of functions, variables, parameters, struct fields, modules, crates,
|
||||
constants, macros, static values, attributes, types, traits, or lifetimes.
|
||||
|
||||
### Keywords Currently in Use
|
||||
|
||||
* `as` - perform primitive casting, disambiguate the specific trait
|
||||
containing an item, or rename items in `use` and `extern crate` statements
|
||||
* `break` - exit a loop immediately
|
||||
* `const` - define constant items or constant raw pointers
|
||||
* `continue` - continue to the next loop iteration
|
||||
* `crate` - link an external crate or a macro variable representing the crate
|
||||
in which the macro is defined
|
||||
* `else` - fallback for `if` and `if let` control flow constructs
|
||||
* `enum` - define an enumeration
|
||||
* `extern` - link an external crate, function, or variable
|
||||
* `false` - Boolean false literal
|
||||
* `fn` - define a function or the function pointer type
|
||||
* `for` - loop over items from an iterator, implement a trait, or specify a
|
||||
higher-ranked lifetime
|
||||
* `if` - branch based on the result of a conditional expression
|
||||
* `impl` - implement inherent or trait functionality
|
||||
* `in` - part of `for` loop syntax
|
||||
* `let` - bind a variable
|
||||
* `loop` - loop unconditionally
|
||||
* `match` - match a value to patterns
|
||||
* `mod` - define a module
|
||||
* `move` - make a closure take ownership of all its captures
|
||||
* `mut` - denote mutability in references, raw pointers, or pattern bindings
|
||||
* `pub` - denote public visibility in struct fields, `impl` blocks, or modules
|
||||
* `ref` - bind by reference
|
||||
* `return` - return from function
|
||||
* `Self` - a type alias for the type implementing a trait
|
||||
* `self` - method subject or current module
|
||||
* `static` - global variable or lifetime lasting the entire program execution
|
||||
* `struct` - define a structure
|
||||
* `super` - parent module of the current module
|
||||
* `trait` - define a trait
|
||||
* `true` - Boolean true literal
|
||||
* `type` - define a type alias or associated type
|
||||
* `unsafe` - denote unsafe code, functions, traits, or implementations
|
||||
* `use` - import symbols into scope
|
||||
* `where` - denote clauses that constrain a type
|
||||
* `while` - loop conditionally based on the result of an expression
|
||||
|
||||
<!-- we should make sure the definitions for each keyword are consistently
|
||||
phrased, so for example for enum we say "defining an enumeration" but for fn we
|
||||
passively call it a "function definition" -- perhaps a good medium would be
|
||||
"define an enumeration" and "define a function"? Can you go through and make
|
||||
those consistent? I've attempted it for a few, but am wary of changing meaning.
|
||||
Also, you may decide to go the passive definition route, which is fine by me,
|
||||
as long as it's consistent-->
|
||||
<!-- I've tried, I'm not sure how to be active for keywords that are nouns
|
||||
though. Please let me know if any still seem inconsistent /Carol -->
|
||||
|
||||
### Keywords Reserved for Future Use
|
||||
|
||||
These keywords do not have any functionality, but are reserved by Rust for
|
||||
potential future use.
|
||||
|
||||
* `abstract`
|
||||
* `alignof`
|
||||
* `become`
|
||||
* `box`
|
||||
* `do`
|
||||
* `final`
|
||||
* `macro`
|
||||
* `offsetof`
|
||||
* `override`
|
||||
* `priv`
|
||||
* `proc`
|
||||
* `pure`
|
||||
* `sizeof`
|
||||
* `typeof`
|
||||
* `unsized`
|
||||
* `virtual`
|
||||
* `yield`
|
||||
172
2018-edition/src/appendix-02-operators.md
Normal file
172
2018-edition/src/appendix-02-operators.md
Normal file
@@ -0,0 +1,172 @@
|
||||
## Appendix B: Operators and Symbols
|
||||
|
||||
<!-- We try not to stack headings even in the appendix, can you add some intro
|
||||
text about what this appendix contains? Quick example below -->
|
||||
<!-- Done! /Carol -->
|
||||
|
||||
This appendix is a glossary of Rust’s syntax, including operators and other
|
||||
symbols that appear by themselves or in the context of paths, generics, trait
|
||||
bounds, macros, attributes, comments, tuples, and brackets.
|
||||
|
||||
### Operators
|
||||
|
||||
The following lists the operators in Rust, an example of how the operator would
|
||||
appear in context, a short explanation, and whether that operator is
|
||||
overloadable. If an operator is overloadable, the relevant trait to use to
|
||||
overload that operator is listed.
|
||||
|
||||
<!-- PROD: I'm not sure how to handle this, would it be too big for a table? I
|
||||
think some structure with aligned columns would make it a great reference -->
|
||||
|
||||
* `!` (`ident!(…)`, `ident!{…}`, `ident![…]`): denotes macro expansion.
|
||||
* `!` (`!expr`): bitwise or logical complement. Overloadable (`Not`).
|
||||
* `!=` (`var != expr`): nonequality comparison. Overloadable (`PartialEq`).
|
||||
* `%` (`expr % expr`): arithmetic remainder. Overloadable (`Rem`).
|
||||
* `%=` (`var %= expr`): arithmetic remainder and assignment. Overloadable (`RemAssign`).
|
||||
* `&` (`&expr`, `&mut expr`): borrow.
|
||||
* `&` (`&type`, `&mut type`, `&'a type`, `&'a mut type`): borrowed pointer type.
|
||||
* `&` (`expr & expr`): bitwise AND. Overloadable (`BitAnd`).
|
||||
* `&=` (`var &= expr`): bitwise AND and assignment. Overloadable (`BitAndAssign`).
|
||||
* `&&` (`expr && expr`): logical AND.
|
||||
* `*` (`expr * expr`): arithmetic multiplication. Overloadable (`Mul`).
|
||||
* `*` (`*expr`): dereference.
|
||||
* `*` (`*const type`, `*mut type`): raw pointer.
|
||||
* `*=` (`var *= expr`): arithmetic multiplication and assignment. Overloadable (`MulAssign`).
|
||||
* `+` (`trait + trait`, `'a + trait`): compound type constraint.
|
||||
* `+` (`expr + expr`): arithmetic addition. Overloadable (`Add`).
|
||||
* `+=` (`var += expr`): arithmetic addition and assignment. Overloadable (`AddAssign`).
|
||||
* `,`: argument and element separator.
|
||||
* `-` (`- expr`): arithmetic negation. Overloadable (`Neg`).
|
||||
* `-` (`expr - expr`): arithmetic subtraction. Overloadable (`Sub`).
|
||||
* `-=` (`var -= expr`): arithmetic subtraction and assignment. Overloadable (`SubAssign`).
|
||||
* `->` (`fn(…) -> type`, `|…| -> type`): function and closure return type.
|
||||
* `.` (`expr.ident`): member access.
|
||||
* `..` (`..`, `expr..`, `..expr`, `expr..expr`): right-exclusive range literal.
|
||||
* `..` (`..expr`): struct literal update syntax.
|
||||
* `..` (`variant(x, ..)`, `struct_type { x, .. }`): “and the rest” pattern binding.
|
||||
* `...` (`expr...expr`) *in a pattern*: inclusive range pattern.
|
||||
* `/` (`expr / expr`): arithmetic division. Overloadable (`Div`).
|
||||
* `/=` (`var /= expr`): arithmetic division and assignment. Overloadable (`DivAssign`).
|
||||
* `:` (`pat: type`, `ident: type`): constraints.
|
||||
* `:` (`ident: expr`): struct field initializer.
|
||||
* `:` (`'a: loop {…}`): loop label.
|
||||
* `;`: statement and item terminator.
|
||||
* `;` (`[…; len]`): part of fixed-size array syntax
|
||||
* `<<` (`expr << expr`): left-shift. Overloadable (`Shl`).
|
||||
* `<<=` (`var <<= expr`): left-shift and assignment. Overloadable (`ShlAssign`).
|
||||
* `<` (`expr < expr`): less-than comparison. Overloadable (`PartialOrd`).
|
||||
* `<=` (`expr <= expr`): less-than or equal-to comparison. Overloadable (`PartialOrd`).
|
||||
* `=` (`var = expr`, `ident = type`): assignment/equivalence.
|
||||
* `==` (`expr == expr`): equality comparison. Overloadable (`PartialEq`).
|
||||
* `=>` (`pat => expr`): part of match arm syntax.
|
||||
* `>` (`expr > expr`): greater-than comparison. Overloadable (`PartialOrd`).
|
||||
* `>=` (`expr >= expr`): greater-than or equal-to comparison. Overloadable (`PartialOrd`).
|
||||
* `>>` (`expr >> expr`): right-shift. Overloadable (`Shr`).
|
||||
* `>>=` (`var >>= expr`): right-shift and assignment. Overloadable (`ShrAssign`).
|
||||
* `@` (`ident @ pat`): pattern binding.
|
||||
* `^` (`expr ^ expr`): bitwise exclusive OR. Overloadable (`BitXor`).
|
||||
* `^=` (`var ^= expr`): bitwise exclusive OR and assignment. Overloadable (`BitXorAssign`).
|
||||
* `|` (`pat | pat`): pattern alternatives.
|
||||
* `|` (`|…| expr`): closures.
|
||||
* `|` (`expr | expr`): bitwise OR. Overloadable (`BitOr`).
|
||||
* `|=` (`var |= expr`): bitwise OR and assignment. Overloadable (`BitOrAssign`).
|
||||
* `||` (`expr || expr`): logical OR.
|
||||
* `_`: “ignored” pattern binding. Also used to make integer-literals readable.
|
||||
* `?` (`expr?`): Error propagation.
|
||||
|
||||
### Non-operator Symbols
|
||||
|
||||
<!-- And maybe a quick explanation of what you mean by non-operator
|
||||
symbols/what counts as a non-operator symbol? -->
|
||||
<!-- I've tried but it's hard to explain, it's the kind of thing you know when
|
||||
you see it? /Carol -->
|
||||
|
||||
The following lists all non-letters that don’t function as operators; that is,
|
||||
they don’t behave like a function or method call.
|
||||
|
||||
#### Standalone Syntax
|
||||
|
||||
* `'ident`: named lifetime or loop label
|
||||
* `…u8`, `…i32`, `…f64`, `…usize`, *etc.*: numeric literal of specific type.
|
||||
* `"…"`: string literal.
|
||||
* `r"…"`, `r#"…"#`, `r##"…"##`, *etc.*: raw string literal, escape characters are not processed.
|
||||
* `b"…"`: byte string literal, constructs a `[u8]` instead of a string.
|
||||
* `br"…"`, `br#"…"#`, `br##"…"##`, *etc.*: raw byte string literal, combination of raw and byte string literal.
|
||||
* `'…'`: character literal.
|
||||
* `b'…'`: ASCII byte literal.
|
||||
* `|…| expr`: closure.
|
||||
* `!`: always empty bottom type for diverging functions.
|
||||
|
||||
#### Path-related Syntax
|
||||
|
||||
* `ident::ident`: namespace path.
|
||||
* `::path`: path relative to the crate root (*i.e.* an explicitly absolute path).
|
||||
* `self::path`: path relative to the current module (*i.e.* an explicitly relative path).
|
||||
* `super::path`: path relative to the parent of the current module.
|
||||
* `type::ident`, `<type as trait>::ident`: associated constants, functions, and types.
|
||||
* `<type>::…`: associated item for a type which cannot be directly named (*e.g.* `<&T>::…`, `<[T]>::…`, *etc.*).
|
||||
* `trait::method(…)`: disambiguating a method call by naming the trait which defines it.
|
||||
* `type::method(…)`: disambiguating a method call by naming the type for which it’s defined.
|
||||
* `<type as trait>::method(…)`: disambiguating a method call by naming the trait *and* type.
|
||||
|
||||
#### Generics
|
||||
|
||||
* `path<…>` (*e.g.* `Vec<u8>`): specifies parameters to generic type *in a type*.
|
||||
* `path::<…>`, `method::<…>` (*e.g.* `"42".parse::<i32>()`): specifies parameters to generic type, function, or method *in an expression*. Often referred to as *turbofish*.
|
||||
* `fn ident<…> …`: define generic function.
|
||||
* `struct ident<…> …`: define generic structure.
|
||||
* `enum ident<…> …`: define generic enumeration.
|
||||
* `impl<…> …`: define generic implementation.
|
||||
* `for<…> type`: higher-ranked lifetime bounds.
|
||||
* `type<ident=type>` (*e.g.* `Iterator<Item=T>`): a generic type where one or more associated types have specific assignments.
|
||||
|
||||
#### Trait Bound Constraints
|
||||
|
||||
* `T: U`: generic parameter `T` constrained to types that implement `U`.
|
||||
* `T: 'a`: generic type `T` must outlive lifetime `'a`. When we say that a type ‘outlives’ the lifetime, we mean that it cannot transitively contain any references with lifetimes shorter than `'a`.
|
||||
* `T : 'static`: The generic type `T` contains no borrowed references other than `'static` ones.
|
||||
* `'b: 'a`: generic lifetime `'b` must outlive lifetime `'a`.
|
||||
* `T: ?Sized`: allow generic type parameter to be a dynamically-sized type.
|
||||
* `'a + trait`, `trait + trait`: compound type constraint.
|
||||
|
||||
#### Macros and Attributes
|
||||
|
||||
* `#[meta]`: outer attribute.
|
||||
* `#![meta]`: inner attribute.
|
||||
* `$ident`: macro substitution.
|
||||
* `$ident:kind`: macro capture.
|
||||
* `$(…)…`: macro repetition.
|
||||
|
||||
#### Comments
|
||||
|
||||
* `//`: line comment.
|
||||
* `//!`: inner line doc comment.
|
||||
* `///`: outer line doc comment.
|
||||
* `/*…*/`: block comment.
|
||||
* `/*!…*/`: inner block doc comment.
|
||||
* `/**…*/`: outer block doc comment.
|
||||
|
||||
#### Tuples
|
||||
|
||||
* `()`: empty tuple (*a.k.a.* unit), both literal and type.
|
||||
* `(expr)`: parenthesized expression.
|
||||
* `(expr,)`: single-element tuple expression.
|
||||
* `(type,)`: single-element tuple type.
|
||||
* `(expr, …)`: tuple expression.
|
||||
* `(type, …)`: tuple type.
|
||||
* `expr(expr, …)`: function call expression. Also used to initialize tuple `struct`s and tuple `enum` variants.
|
||||
* `ident!(…)`, `ident!{…}`, `ident![…]`: macro invocation.
|
||||
* `expr.0`, `expr.1`, …: tuple indexing.
|
||||
|
||||
#### Curly Brackets
|
||||
|
||||
* `{…}`: block expression.
|
||||
* `Type {…}`: `struct` literal.
|
||||
|
||||
#### Square Brackets
|
||||
|
||||
* `[…]`: array literal.
|
||||
* `[expr; len]`: array literal containing `len` copies of `expr`.
|
||||
* `[type; len]`: array type containing `len` instances of `type`.
|
||||
* `expr[expr]`: collection indexing. Overloadable (`Index`, `IndexMut`).
|
||||
* `expr[..]`, `expr[a..]`, `expr[..b]`, `expr[a..b]`: collection indexing pretending to be collection slicing, using `Range`, `RangeFrom`, `RangeTo`, `RangeFull` as the “index”.
|
||||
230
2018-edition/src/appendix-03-derivable-traits.md
Normal file
230
2018-edition/src/appendix-03-derivable-traits.md
Normal file
@@ -0,0 +1,230 @@
|
||||
## C - Derivable Traits
|
||||
|
||||
In various places in the book, we’ve discussed the `derive` attribute
|
||||
that you can apply to a struct or enum definition.
|
||||
|
||||
<!-- Above -- I wasn't clear throughout whether the derive attribute is
|
||||
something passively applied to structs and enums by Rust, or something the
|
||||
reader applies. I've experimented with making the tone more active, but may
|
||||
have misinterpreted -- can you make it clear here? Should this be "we've
|
||||
discussed the `derive` attribute you can apply to a struct or enum"? -->
|
||||
<!-- Rust never edits your source code file for you. I'm curious to know what
|
||||
parts of the book have given you that impression... I've tried to clarify here
|
||||
but now I'm worried about other places in the book... /Carol -->
|
||||
|
||||
<!-- Below -- Can you lay out what it is we're showing them about derivable
|
||||
traits in this appendix, just showing them some common ones and how to use
|
||||
them? -->
|
||||
<!-- No, we're showing *all* of the derivable traits provided by the standard
|
||||
library. I guess explaining what we mean by "derivable" was too much of a
|
||||
tangent for the beginning of this section? I'm not sure where that would fit
|
||||
instead, so I took it out. So now the text that we had under the "standard
|
||||
library traits that can be derived" section is here where it seems like you
|
||||
were expecting it to be /Carol -->
|
||||
|
||||
The `derive` attribute generates code that will implement a trait with its own
|
||||
default implementation, on the type you have annotated with the `derive`
|
||||
syntax. In this appendix, we provide a reference of all of the traits in the
|
||||
standard library that can be used with `derive`. Each section covers:
|
||||
|
||||
- What operators and methods deriving this trait will enable
|
||||
- What the implementation of the trait provided by `derive` does
|
||||
- What implementing the trait signifies about the type
|
||||
- The conditions in which you’re allowed or not allowed to implement the trait
|
||||
- Examples of operations that require the trait
|
||||
|
||||
If you want different behavior than that provided by the `derive` attribute,
|
||||
consult the standard library documentation for each trait for details of how to
|
||||
manually implement them.
|
||||
|
||||
<!-- Liz: I've incorporated the small sections that were after the list of
|
||||
traits here and then moved the section headings out a level, what do you think?
|
||||
/Carol -->
|
||||
|
||||
The rest of the traits defined in the standard library can’t be implemented on
|
||||
your types using `derive`. These traits don’t have sensible default behavior,
|
||||
so it’s up to you to implement them in the way that makes sense for what you’re
|
||||
trying to accomplish.
|
||||
|
||||
An example of a trait that can’t be derived is `Display`, which handles
|
||||
formatting for end users. You should always put thought into the appropriate
|
||||
way to display a type to an end user: what parts of the type should an end user
|
||||
be allowed to see? What parts would they find relevant? What format of the data
|
||||
would be most relevant to them? The Rust compiler doesn’t have this insight and
|
||||
so can’t provide appropriate default behavior for you.
|
||||
|
||||
The list of derivable traits provided in this appendix is not comprehensive:
|
||||
libraries can implement `derive` for their own traits! In this way, the list of
|
||||
traits you can use `derive` with is truly open-ended. Implementing `derive`
|
||||
involves using a procedural macro, which is covered in Appendix D, “Macros.”
|
||||
|
||||
### `Debug` for Programmer Output
|
||||
|
||||
The `Debug` trait enables debug formatting in format strings, indicated by
|
||||
adding `:?` within `{}` placeholders.
|
||||
|
||||
The `Debug` trait allows you to print instances of a type for debugging
|
||||
purposes, so you and other programmers using your type can inspect an instance
|
||||
at a particular point in a program’s execution.
|
||||
|
||||
`Debug` is required, for example, in use of the `assert_eq!` macro, which
|
||||
prints the values of instances given as arguments if the equality assertion
|
||||
fails so programmers can see why the two instances weren’t equal.
|
||||
|
||||
### `PartialEq` and `Eq` for Equality Comparisons
|
||||
|
||||
<!-- I've tried to phrase these definitions in a more active way, it seems like
|
||||
we're saying using these traits gives us this capabilities --- apologies if
|
||||
I've misunderstood, feel free to change the phrasing back to the "signifies
|
||||
that..." version -->
|
||||
<!-- More active is fine. I feel like it lost a tiny bit of meaning-- not only
|
||||
can we use these capabilities on our own types, but other programmers using our
|
||||
types can use these capabilities too. I've tried to reinsert that sentiment
|
||||
occasionally. /Carol -->
|
||||
|
||||
The `PartialEq` trait allows you to compare instances of a type to check for
|
||||
equality, and enables use of the `==` and `!=` operators.
|
||||
|
||||
Deriving `PartialEq` implements the `eq` method. When `PartialEq` is derived on
|
||||
structs, two instances are equal only if *all* fields are equal, and not equal
|
||||
if any fields are not equal. When derived on enums, each variant is equal to
|
||||
itself and not equal to the other variants.
|
||||
|
||||
`PartialEq` is required, for example, with the use of the `assert_eq!` macro,
|
||||
which needs to be able to compare two instances of a type for equality.
|
||||
|
||||
The `Eq` trait has no methods. Its purpose is to signal that for every value of
|
||||
the annotated type, the value is equal to itself. The `Eq` trait can only be
|
||||
applied to types that also implement `PartialEq`, though not all types that
|
||||
implement `PartialEq` can implement `Eq`. One example of this is floating point
|
||||
number types: the implementation of floating point numbers says that two
|
||||
instances of the not-a-number value, `NaN`, are not equal to each other.
|
||||
|
||||
An example of when `Eq` is required is for keys in a `HashMap` so that the
|
||||
`HashMap` can tell whether two keys are the same.
|
||||
|
||||
### `PartialOrd` and `Ord` for Ordering Comparisons
|
||||
|
||||
The `PartialOrd` trait allows you to compare instances of a type for sorting
|
||||
purposes. A type that implements `PartialOrd` may be used with the `<`, `>`,
|
||||
`<=`, and `>=` operators. The `PartialOrd` trait can only be applied to types
|
||||
that also implement `PartialEq`.
|
||||
|
||||
Deriving `PartialOrd` implements the `partial_cmp` method, which returns an
|
||||
`Option<Ordering>` that will be `None` when the values given do not produce an
|
||||
ordering. An example of a value that doesn’t produce an ordering, even though
|
||||
most values of that type can be compared, is the not-a-number (`NaN`) floating
|
||||
point value. Calling `partial_cmp` with any floating point number and the `NaN`
|
||||
floating point value will return `None`.
|
||||
|
||||
<!-- Above -- you mean when the values cannot be ordered, for example if they
|
||||
are of types that can't be compared? -->
|
||||
<!-- No, if they're *types* that can't be compared, then the PartialOrd trait
|
||||
doesn't apply at all. I've tried to clarify and added an example /Carol-->
|
||||
|
||||
When derived on structs, `PartialOrd` compares two instances by comparing the
|
||||
value in each field in the order in which the fields appear in the struct
|
||||
definition. When derived on enums, variants of the enum declared earlier in the
|
||||
enum definition are considered greater than the variants listed later.
|
||||
|
||||
`PartialOrd` is required, for example, for the `gen_range` method from the
|
||||
`rand` crate that generates a random value in the range specified by a low
|
||||
value and a high value.
|
||||
|
||||
The `Ord` trait allows you to know that for any two values of the annotated
|
||||
type, a valid ordering will exist. The `Ord` trait implements the `cmp` method,
|
||||
which returns an `Ordering` rather than an `Option<Ordering>` because a valid
|
||||
ordering will always be possible. The `Ord` trait can only be applied to types
|
||||
that also implement `PartialOrd` and `Eq` (and `Eq` requires `PartialEq`). When
|
||||
derived on structs and enums, `cmp` behaves the same way as the derived
|
||||
implementation for `partial_cmp` does with `PartialOrd`.
|
||||
|
||||
An example of when `Ord` is required is when storing values in a `BTreeSet<T>`,
|
||||
a data structure that stores data based on the sort order of the values.
|
||||
|
||||
### `Clone` and `Copy` for Duplicating Values
|
||||
|
||||
<!-- Below -- I wasn't clear on the arbitrary code section of this explanation.
|
||||
Are we saying using Clone (as opposed to copy) risks bringing it arbitrary
|
||||
code? Why use Clone over copy? (I think we might have covered this in an
|
||||
earlier chapter, so feel free to cross ref there too if that's an easier
|
||||
explanation) -->
|
||||
<!-- Yes, we covered this in chapter 4 and I've added a cross reference. /Carol
|
||||
-->
|
||||
|
||||
The `Clone` trait allows you to explicitly create a deep copy of a value, and
|
||||
the duplication process might involve running arbitrary code and copying heap
|
||||
data. See the “Ways Variables and Data Interact: Clone” section in Chapter 4
|
||||
for more information on `Clone`.
|
||||
|
||||
Deriving `Clone` implements the `clone` method which, when implemented for the
|
||||
whole type, calls `clone` on each of the parts of the type. This means all of
|
||||
the fields or values in the type must also implement `Clone` to derive `Clone`.
|
||||
|
||||
An example of when `Clone` is required is when calling the `to_vec` method on a
|
||||
slice. The slice doesn’t own the type instances it contains, but the vector
|
||||
returned from `to_vec` will need to own its instances, so `to_vec` calls
|
||||
`clone` on each item. Thus, the type stored in the slice must implement `Clone`.
|
||||
|
||||
The `Copy` trait allows you to duplicate a value by only copying bits stored on
|
||||
the stack; no arbitrary code is necessary. See the “Stack-Only Data: Copy”
|
||||
section in Chapter 4 for more information on `Copy`.
|
||||
|
||||
<!-- I'm not clear on why the clone trait uses arbitrary code but copy doesn't
|
||||
-- is this important to make clear? -->
|
||||
<!-- We discussed this in chapter 4; I've added a cross ref. /Carol -->
|
||||
|
||||
The `Copy` trait does not define any methods to prevent programmers from
|
||||
overloading those methods violating the assumption that no arbitrary code is
|
||||
being run. That way, all programmers can assume that copying a value will be
|
||||
very fast.
|
||||
|
||||
<!-- above -- I couldn't follow this either, what does that mean practically
|
||||
for the programmer? What does overloading methods that violate the assumption
|
||||
mean? -->
|
||||
<!-- I added a sentence at the end of the paragraph, does that clear it up?
|
||||
/Carol -->
|
||||
|
||||
You can derive `Copy` on any type whose parts all implement `Copy`. The `Copy`
|
||||
trait can only be applied to types that also implement `Clone`, as a type that
|
||||
implements `Copy` has a trivial implementation of `Clone`, doing the same thing
|
||||
as `Copy`.
|
||||
|
||||
`Copy` is rarely required; types implement `Copy` have optimizations available
|
||||
mean you don’t have to call `clone`, making the code more concise.
|
||||
|
||||
<!-- By "nicer" do you mean more efficient and understandable? -->
|
||||
<!-- concise, I've changed /Carol -->
|
||||
|
||||
Everything possible with `Copy` can also be accomplished with `Clone`, but the
|
||||
code might be slower or have to use `clone` in places.
|
||||
|
||||
### `Hash` for Mapping a Value to a Value of Fixed Size
|
||||
|
||||
The `Hash` trait allows you to take an instance of a type of arbitrary size and
|
||||
map that instance to a value of fixed size, using a hash function. Deriving
|
||||
`Hash` implements the `hash` method. The derived implementation of the `hash`
|
||||
method combines the result of calling `hash` on each of the parts of the type,
|
||||
meaning all fields or values must also implement `Hash` to derive `Hash`.
|
||||
|
||||
An example of when `Hash` is required is in storing keys in a `HashMap`, in
|
||||
order to store data efficiently.
|
||||
|
||||
### `Default` for Default Values
|
||||
|
||||
The `Default` trait allows you to create a default value for a type. Deriving
|
||||
`Default` implements the `default` method. The derived implementation of the
|
||||
`default` method calls the `default` method on each part of the type, meaning
|
||||
all fields or values in the type must also implement `Default` to derive
|
||||
`Default.`
|
||||
|
||||
`Default::default` is commonly used in combination with the struct update
|
||||
syntax discussed in the “Creating Instances From Other Instances With Struct
|
||||
Update Syntax” section in Chapter 5. You can customize a few fields of a struct
|
||||
and then set and use a default value for the rest of the fields by using
|
||||
`..Default::default()`.
|
||||
|
||||
`Default` is required when, for example, you use the `unwrap_or_default` method
|
||||
on `Option<T>` instances. If the `Option<T>` is `None`, the `unwrap_or_default`
|
||||
method will return the result of `Default::default` for the type `T` stored in
|
||||
the `Option<T>`.
|
||||
504
2018-edition/src/appendix-04-macros.md
Normal file
504
2018-edition/src/appendix-04-macros.md
Normal file
@@ -0,0 +1,504 @@
|
||||
## Appendix D: Macros
|
||||
|
||||
We’ve used macros like `println!` throughout this book, but haven’t fully
|
||||
explored what a macro is and how it works. This appendix will explain:
|
||||
|
||||
- What macros are and how they differ from functions
|
||||
- How to define a declarative macro to do metaprogramming
|
||||
- How to define a procedural macro to create custom `derive` traits
|
||||
|
||||
We’re covering the details of macros in an appendix because they’re still
|
||||
evolving in Rust. Macros have changed and, in the near future, will change at a
|
||||
quicker rate than the rest of the language and standard library since Rust 1.0,
|
||||
so this section is more likely to date than the rest of the book. The code
|
||||
shown here will still continue to work with future versions, due to Rust’s
|
||||
stability guarantees, but there may be additional capabilities or easier ways
|
||||
to write macros that weren’t available at the time of this publication. Bear
|
||||
that in mind if you try to implement anything from this appendix.
|
||||
|
||||
### The Difference Between Macros and Functions
|
||||
|
||||
Fundamentally, macros are a way of writing code that writes other code, known
|
||||
as *metaprogramming*. In Appendix C, we discussed the `derive` attribute, which
|
||||
generates an implementation of various traits for you. We’ve also used the
|
||||
`println!` and `vec!` macros throughout the book. All of these macros *expand*
|
||||
to produce more code than the code you’ve written yourself.
|
||||
|
||||
Metaprogramming is useful for reducing the amount of code you have to write and
|
||||
maintain, which is also one of the roles of functions. However, macros have
|
||||
some additional powers that functions don’t have.
|
||||
|
||||
A function signature has to declare the number and type of parameters the
|
||||
function has. Macros, on the other hand, can take a variable number of
|
||||
parameters: we can call `println!("hello")` with one argument, or
|
||||
`println!("hello {}", name)` with two arguments. Also, macros are expanded
|
||||
before the compiler interprets the meaning of the code, so a macro can, for
|
||||
example, implement a trait on a given type. A function can’t, because it gets
|
||||
called at runtime and a trait needs to be implemented at compile time.
|
||||
|
||||
The downside to implementing a macro over a function is that macro definitions
|
||||
are more complex than function definitions because you’re writing Rust code
|
||||
that writes Rust code. Due to this indirection, macro definitions are generally
|
||||
more difficult to read, understand, and maintain than function definitions.
|
||||
|
||||
Another difference between macros and functions is that macro definitions
|
||||
aren’t namespaced within modules like function definitions are. In order to
|
||||
prevent unexpected name clashes when using external crates, you have to
|
||||
explicitly bring the macros into the scope of your project at the same time as
|
||||
bringing the external crate into scope, using the `#[macro_use]` annotation.
|
||||
The following example would bring all the macros defined in the `serde` crate
|
||||
into the scope of the current crate:
|
||||
|
||||
```rust,ignore
|
||||
#[macro_use]
|
||||
extern crate serde;
|
||||
```
|
||||
|
||||
If `extern crate` was able to bring macros into scope by default without this
|
||||
explicit annotation, you would be prevented from using two crates that happened
|
||||
to define macros with the same name. In practice this conflict doesn’t come up
|
||||
much, but the more crates you use, the more likely it is.
|
||||
|
||||
One last important difference between macros and functions: macros must be
|
||||
defined or brought into scope *before* they’re called in a file, whereas
|
||||
functions can be defined anywhere and called anywhere.
|
||||
|
||||
### Declarative Macros with `macro_rules!` for General Metaprogramming
|
||||
|
||||
The most widely used form of macros in Rust are *declarative macros*. These are
|
||||
also sometimes referred to as *macros by example*, *`macro_rules!` macros*, or
|
||||
just plain *macros*. At their core, declarative macros allow you to write
|
||||
something similar to a Rust `match` expression. As discussed in Chapter 6,
|
||||
`match` expressions are control structures that take an expression, compare the
|
||||
resulting value of the expression to patterns, and then run the code associated
|
||||
with the matching pattern. Macros also compare a value to patterns that have
|
||||
code associated with them, but in this case the value is the literal Rust
|
||||
source code passed to the macro, the patterns are compared with the structure
|
||||
of that source code, and the code associated with each pattern is the code that
|
||||
replaces the code passed to the macro. This all happens during compilation.
|
||||
|
||||
To define a macro, you use the `macro_rules!` construct. Let’s explore how to
|
||||
use `macro_rules!` by taking a look at how the `vec!` macro is defined. Chapter
|
||||
8 covered how we can use the `vec!` macro to create a new vector with
|
||||
particular values. For example, this macro creates a new vector with three
|
||||
integers inside:
|
||||
|
||||
```rust
|
||||
let v: Vec<u32> = vec![1, 2, 3];
|
||||
```
|
||||
|
||||
We could also use the `vec!` macro to make a vector of two integers or a vector
|
||||
of five string slices---we wouldn’t be able to use a function to do the same
|
||||
because we wouldn’t know the number or type of values up front.
|
||||
|
||||
Let’s take a look at a slightly simplified definition of the `vec!` macro in
|
||||
Listing AD-1:
|
||||
|
||||
```rust
|
||||
#[macro_export]
|
||||
macro_rules! vec {
|
||||
( $( $x:expr ),* ) => {
|
||||
{
|
||||
let mut temp_vec = Vec::new();
|
||||
$(
|
||||
temp_vec.push($x);
|
||||
)*
|
||||
temp_vec
|
||||
}
|
||||
};
|
||||
}
|
||||
```
|
||||
|
||||
Listing AD-1: A simplified version of the `vec!` macro definition
|
||||
|
||||
> Note: the actual definition of the `vec!` macro in the standard library
|
||||
> includes code to pre-allocate the correct amount of memory up-front. That
|
||||
> code is an optimization that we’ve chosen not to include here to make the
|
||||
> example simpler.
|
||||
|
||||
The `#[macro_export]` annotation indicates that this macro should be made
|
||||
available whenever the crate in which we’re defining the macro is imported.
|
||||
Without this annotation, even if someone depending on this crate uses the
|
||||
`#[macro_use]` annotation, the macro would not be brought into scope.
|
||||
|
||||
We then start the macro definition with `macro_rules!` and the name of the
|
||||
macro we’re defining *without* the exclamation mark. The name---in this case
|
||||
`vec`---is followed by curly brackets denoting the body of the macro definition.
|
||||
|
||||
The structure in the `vec!` body is similar to the structure of a `match`
|
||||
expression. Here we have one arm with the pattern `( $( $x:expr ),* )`,
|
||||
followed by `=>` and the block of code associated with this pattern. If the
|
||||
pattern matches, the associated block of code will be emitted. Given that this
|
||||
is the only pattern in this macro, there’s only one valid way to match; any
|
||||
other will be an error. More complex macros will have more than one arm.
|
||||
|
||||
Valid pattern syntax in macro definitions is different than the pattern syntax
|
||||
covered in Chapter 18 because macro patterns are matched against Rust code
|
||||
structure rather than values. Let’s walk through what the pieces of the pattern
|
||||
in Listing AD-1 mean; for the full macro pattern syntax, see [the reference].
|
||||
|
||||
[the reference]: ../../reference/macros.html
|
||||
|
||||
First, a set of parentheses encompasses the whole pattern. Next comes a dollar
|
||||
sign (`$`) followed by a set of parentheses, which captures values that match
|
||||
the pattern within the parentheses for use in the replacement code. Within
|
||||
`$()` is `$x:expr`, which matches any Rust expression and gives the expression
|
||||
the name `$x`.
|
||||
|
||||
The comma following `$()` indicates that a literal comma separator character
|
||||
could optionally appear after the code that matches the code captured in `$()`.
|
||||
The `*` following the comma specifies that the pattern matches zero or more of
|
||||
whatever precedes the `*`.
|
||||
|
||||
When we call this macro with `vec![1, 2, 3];`, the `$x` pattern matches three
|
||||
times with the three expressions `1`, `2`, and `3`.
|
||||
|
||||
Now let’s look at the pattern in the body of the code associated with this arm:
|
||||
The `temp_vec.push()` code within the `$()*` part is generated for each part
|
||||
that matches `$()` in the pattern, zero or more times depending on how many
|
||||
times the pattern matches. The `$x` is replaced with each expression matched.
|
||||
When we call this macro with `vec![1, 2, 3];`, the code generated that replaces
|
||||
this macro call will be:
|
||||
|
||||
<!-- Above What about temp_vec.push, do you want to quickly mention that? Or do
|
||||
you mean "The `$()*` part and the content of the parentheses is generated for
|
||||
each part that matches `$()` in the pattern"-->
|
||||
<!-- The latter, I've tried to clarify /Carol -->
|
||||
|
||||
```rust,ignore
|
||||
let mut temp_vec = Vec::new();
|
||||
temp_vec.push(1);
|
||||
temp_vec.push(2);
|
||||
temp_vec.push(3);
|
||||
temp_vec
|
||||
```
|
||||
|
||||
We’ve defined a macro that can take any number of arguments of any type and can
|
||||
generate code to create a vector containing the specified elements.
|
||||
|
||||
Given that most Rust programmers will *use* macros more than *write* macros,
|
||||
that’s all we’ll discuss about `macro_rules!` in this book. To learn more about
|
||||
how to write macros, consult the online documentation or other resources such
|
||||
as [The Little Book of Rust Macros][tlborm].
|
||||
|
||||
[tlborm]: https://danielkeep.github.io/tlborm/book/index.html
|
||||
|
||||
### Procedural Macros for Custom `derive`
|
||||
|
||||
The second form of macros is called *procedural macros* because they’re more
|
||||
like functions (which are a type of procedure). Procedural macros accept some
|
||||
Rust code as an input, operate on that code, and produce some Rust code as an
|
||||
output, rather than matching against patterns and replacing the code with other
|
||||
code as declarative macros do. At the time of writing, you can only really
|
||||
define procedural macros to allow your traits to be implemented on a type by
|
||||
specifying the trait name in a `derive` annotation.
|
||||
|
||||
We’re going to create a crate named `hello_macro` that defines a trait named
|
||||
`HelloMacro` with one associated function named `hello_macro`. Rather than
|
||||
making users of our crate implement the `HelloMacro` trait for each of their
|
||||
types, we’ll provide a procedural macro so users can annotate their type with
|
||||
`#[derive(HelloMacro)]` to get a default implementation of the `hello_macro`
|
||||
function. The default implementation will print `Hello, Macro! My name is
|
||||
TypeName!` where `TypeName` is the name of the type on which this trait has
|
||||
been defined.
|
||||
|
||||
In other words, we’re going to write a crate that enables another programmer to
|
||||
write code like Listing AD-2 using our crate:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate hello_macro;
|
||||
#[macro_use]
|
||||
extern crate hello_macro_derive;
|
||||
|
||||
use hello_macro::HelloMacro;
|
||||
|
||||
#[derive(HelloMacro)]
|
||||
struct Pancakes;
|
||||
|
||||
fn main() {
|
||||
Pancakes::hello_macro();
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing AD-2: The code a user of our crate will be able
|
||||
to write with use of our procedural macro</span>
|
||||
|
||||
This code will print `Hello, Macro! My name is Pancakes!` when we’re done. Let’s
|
||||
get started! First we need to make a new library crate:
|
||||
|
||||
```text
|
||||
$ cargo new hello_macro --lib
|
||||
```
|
||||
|
||||
Now we’ll define the `HelloMacro` trait and its associated function:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub trait HelloMacro {
|
||||
fn hello_macro();
|
||||
}
|
||||
```
|
||||
|
||||
We have a trait and its function. At this point, a user of our crate would be
|
||||
able to implement the trait themselves to achieve the desired functionality,
|
||||
like so:
|
||||
|
||||
```rust,ignore
|
||||
extern crate hello_macro;
|
||||
|
||||
use hello_macro::HelloMacro;
|
||||
|
||||
struct Pancakes;
|
||||
|
||||
impl HelloMacro for Pancakes {
|
||||
fn hello_macro() {
|
||||
println!("Hello, Macro! My name is Pancakes!");
|
||||
}
|
||||
}
|
||||
|
||||
fn main() {
|
||||
Pancakes::hello_macro();
|
||||
}
|
||||
```
|
||||
|
||||
However, they would need to write out the implementation block for each type
|
||||
they wanted to use with `hello_macro`; we’d like to save them this work.
|
||||
|
||||
Additionally, we can’t yet provide a default implementation for the
|
||||
`hello_macro` function that will print out the name of the type the trait is
|
||||
implemented on: Rust doesn’t have reflection capabilities, so can’t look up the
|
||||
type’s name at runtime. We need a macro to generate code at compile time.
|
||||
|
||||
<!--Defining Procedural Macros Requires a Separate Crate--> <!-- Since this is
|
||||
a lone subheading, okay to merge with the general procedural macros section? -->
|
||||
<!-- Sure /Carol -->
|
||||
|
||||
The next step is to define the procedural macro. At the time of writing,
|
||||
procedural macros need to be in their own crate. Eventually, this restriction
|
||||
may be lifted. The convention for structuring crates and macro crates is as
|
||||
such: for a crate named `foo`, a custom derive procedural macro crate is called
|
||||
`foo-derive`. Let’s start a new crate called `hello_macro_derive` inside our
|
||||
`hello_macro` project:
|
||||
|
||||
```text
|
||||
$ cargo new hello_macro_derive --lib
|
||||
```
|
||||
|
||||
Our two crates are tightly related, so we create the procedural macro crate
|
||||
within the directory of our `hello_macro` crate. If we change the trait
|
||||
definition in `hello_macro`, we’ll have to change the implementation of the
|
||||
procedural macro in `hello_macro_derive` as well. The two crates will need to
|
||||
be published separately, though, and programmers using these crates will need
|
||||
to add both as dependencies and bring them both into scope. We could instead
|
||||
have the `hello_macro` crate use `hello_macro_derive` as a dependency and
|
||||
re-export the procedural macro code, but the way we’ve structured the project
|
||||
makes it possible for programmers to use `hello_macro` even if they don’t want
|
||||
the `derive` functionality.
|
||||
|
||||
We need to declare the `hello_macro_derive` crate as a procedural macro crate.
|
||||
We’ll also need functionality from the `syn` and `quote` crates, as we’ll see
|
||||
in a moment, so we need to add them as dependencies. Add the following to the
|
||||
*Cargo.toml* file for `hello_macro_derive`:
|
||||
|
||||
<span class="filename">Filename: hello_macro_derive/Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[lib]
|
||||
proc-macro = true
|
||||
|
||||
[dependencies]
|
||||
syn = "0.11.11"
|
||||
quote = "0.3.15"
|
||||
```
|
||||
|
||||
To start defining the procedural macro, place the code from Listing AD-3 in
|
||||
your *src/lib.rs* for the `hello_macro_derive` crate. Note that this won’t
|
||||
compile until we add a definition for the `impl_hello_macro` function.
|
||||
|
||||
Note the way we’ve split the functions in AD-3; this will be the same for
|
||||
almost every procedural macro crate you see or create, as it makes writing a
|
||||
procedural macro more convenient. What you choose to do in the place where the
|
||||
`impl_hello_macro` function is called will be different depending on the
|
||||
purpose of your procedural macro.
|
||||
|
||||
<span class="filename">Filename: hello_macro_derive/src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate proc_macro;
|
||||
extern crate syn;
|
||||
#[macro_use]
|
||||
extern crate quote;
|
||||
|
||||
use proc_macro::TokenStream;
|
||||
|
||||
#[proc_macro_derive(HelloMacro)]
|
||||
pub fn hello_macro_derive(input: TokenStream) -> TokenStream {
|
||||
// Construct a string representation of the type definition
|
||||
let s = input.to_string();
|
||||
|
||||
// Parse the string representation
|
||||
let ast = syn::parse_derive_input(&s).unwrap();
|
||||
|
||||
// Build the impl
|
||||
let gen = impl_hello_macro(&ast);
|
||||
|
||||
// Return the generated impl
|
||||
gen.parse().unwrap()
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing AD-3: Code that most procedural macro crates will
|
||||
need to have for processing Rust code</span>
|
||||
|
||||
We have introduced three new crates: `proc_macro`, [`syn`], and [`quote`]. The
|
||||
`proc_macro` crate comes with Rust, so we didn’t need to add that to the
|
||||
dependencies in *Cargo.toml*. The `proc_macro` crate allows us to convert Rust
|
||||
code into a string containing that Rust code. The `syn` crate parses Rust code
|
||||
from a string into a data structure that we can perform operations on. The
|
||||
`quote` crate takes `syn` data structures and turns them back into Rust code.
|
||||
These crates make it much simpler to parse any sort of Rust code we might want
|
||||
to handle: writing a full parser for Rust code is no simple task.
|
||||
|
||||
[`syn`]: https://crates.io/crates/syn
|
||||
[`quote`]: https://crates.io/crates/quote
|
||||
|
||||
The `hello_macro_derive` function will get called when a user of our library
|
||||
specifies `#[derive(HelloMacro)]` on a type, because we’ve annotated the
|
||||
`hello_macro_derive` function here with `proc_macro_derive` and specified the
|
||||
name, `HelloMacro`, which matches our trait name; that’s the convention most
|
||||
procedural macros follow.
|
||||
|
||||
This function first converts the `input` from a `TokenStream` to a `String` by
|
||||
calling `to_string`. This `String` is a string representation of the Rust code
|
||||
for which we are deriving `HelloMacro`. In the example in Listing AD-2, `s`
|
||||
will have the `String` value `struct Pancakes;` because that’s the Rust code we
|
||||
added the `#[derive(HelloMacro)]` annotation to.
|
||||
|
||||
<!-- I'm not sure why we convert to a string then to a structure we can use,
|
||||
will that be clear to the reader here? -->
|
||||
<!-- This is just how procedural macros work and what you have to do, which is
|
||||
why we have the next note. /Carol -->
|
||||
|
||||
> Note: At the time of writing, the only thing you can do with a `TokenStream`
|
||||
> is convert it to a string. A richer API will exist in the future.
|
||||
|
||||
Now we need to be able to parse the Rust code `String` into a data structure
|
||||
that we can then interpret and perform operations on. This is where `syn` comes
|
||||
to play. The `parse_derive_input` function in `syn` takes a `String` and
|
||||
returns a `DeriveInput` struct representing the parsed Rust code. The following
|
||||
shows the relevant parts of the `DeriveInput` struct we get from parsing the
|
||||
string `struct Pancakes;`:
|
||||
|
||||
```rust,ignore
|
||||
DeriveInput {
|
||||
// --snip--
|
||||
|
||||
ident: Ident(
|
||||
"Pancakes"
|
||||
),
|
||||
body: Struct(
|
||||
Unit
|
||||
)
|
||||
}
|
||||
```
|
||||
|
||||
The fields of this struct show that the Rust code we’ve parsed is a unit struct
|
||||
with the `ident` (identifier, meaning the name) of `Pancakes`. There are more
|
||||
fields on this struct for describing all sorts of Rust code; check the [`syn`
|
||||
API docs for `DeriveInput`][syn-docs] for more information.
|
||||
|
||||
[syn-docs]: https://docs.rs/syn/0.11.11/syn/struct.DeriveInput.html
|
||||
|
||||
At this point we haven’t defined the `impl_hello_macro` function, which is
|
||||
where we’ll build the new Rust code we want to include. Before we get to that,
|
||||
the last part of this `hello_macro_derive` function is using the `parse`
|
||||
function from the `quote` crate to turn the output of the `impl_hello_macro`
|
||||
function back into a `TokenStream`. The returned `TokenStream` is added to the
|
||||
code that users of our crate write so that when they compile their crate, they
|
||||
get extra functionality we provide.
|
||||
|
||||
You may have noticed that we’re calling `unwrap` to panic if the calls to the
|
||||
`parse_derive_input` or `parse` functions fail here. Panicking on errors is
|
||||
necessary in procedural macro code because `proc_macro_derive` functions must
|
||||
return `TokenStream` rather than `Result` in order to conform to the procedural
|
||||
macro API. We’ve chosen to keep this example simple by using `unwrap`; in
|
||||
production code you should provide more specific error messages about what went
|
||||
wrong by using `expect` or `panic!`.
|
||||
|
||||
Now that we have the code to turn the annotated Rust code from a `TokenStream`
|
||||
into a `String` and a `DeriveInput` instance, let’s generate the code
|
||||
implementing the `HelloMacro` trait on the annotated type:
|
||||
|
||||
<span class="filename">Filename: hello_macro_derive/src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn impl_hello_macro(ast: &syn::DeriveInput) -> quote::Tokens {
|
||||
let name = &ast.ident;
|
||||
quote! {
|
||||
impl HelloMacro for #name {
|
||||
fn hello_macro() {
|
||||
println!("Hello, Macro! My name is {}", stringify!(#name));
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
We get an `Ident` struct instance containing the name (identifier) of the
|
||||
annotated type using `ast.ident`. With the code from Listing AD-2, `name` will
|
||||
be `Ident("Pancakes")`.
|
||||
|
||||
The `quote!` macro lets us write up the Rust code that we want to return and
|
||||
convert it into `quote::Tokens`. This macro also provides some really cool
|
||||
templating mechanics; we can write `#name` and `quote!` will replace it with
|
||||
the value in the variable named `name`. You can even do some repetition similar
|
||||
to the way regular macros work. Check out [the `quote` crate’s
|
||||
docs][quote-docs] for a thorough introduction.
|
||||
|
||||
[quote-docs]: https://docs.rs/quote
|
||||
|
||||
We want our procedural macro to generate an implementation of our `HelloMacro`
|
||||
trait for the type the user annotated, which we can get by using `#name`. The
|
||||
trait implementation has one function, `hello_macro`, whose body contains the
|
||||
functionality we want to provide: printing `Hello, Macro! My name is` and then
|
||||
the name of the annotated type.
|
||||
|
||||
The `stringify!` macro used here is built into Rust. It takes a Rust
|
||||
expression, such as `1 + 2`, and at compile time turns the expression into a
|
||||
string literal, such as `"1 + 2"`. This is different than `format!` or
|
||||
`println!`, which evaluate the expression and then turn the result into a
|
||||
`String`. There’s a possibility that the `#name` input might be an expression
|
||||
to print out literally so we use `stringify!`. Using `stringify!` also saves an
|
||||
allocation by converting `#name` to a string literal at compile time.
|
||||
|
||||
At this point, `cargo build` should complete successfully in both `hello_macro`
|
||||
and `hello_macro_derive`. Let’s hook these crates up to the code in Listing
|
||||
AD-2 to see it in action! Create a new binary project in your `projects`
|
||||
directory with `cargo new --bin pancakes`. We need to add both `hello_macro`
|
||||
and `hello_macro_derive` as dependencies in the `pancakes` crate’s
|
||||
*Cargo.toml*. If you’ve chosen to publish your versions of `hello_macro` and
|
||||
`hello_macro_derive` to *https://crates.io* they would be regular dependencies;
|
||||
if not, you can specify them as `path` dependencies as follows:
|
||||
|
||||
```toml
|
||||
[dependencies]
|
||||
hello_macro = { path = "../hello_macro" }
|
||||
hello_macro_derive = { path = "../hello_macro/hello_macro_derive" }
|
||||
```
|
||||
|
||||
Put the code from Listing AD-2 into *src/main.rs*, and when you run `cargo run`
|
||||
it should print `Hello, Macro! My name is Pancakes!` The implementation of the
|
||||
`HelloMacro` trait from the procedural macro was included without the
|
||||
`pancakes` crate needing to implement it; the `#[derive(HelloMacro)]` took care
|
||||
of adding the trait implementation.
|
||||
|
||||
### The Future of Macros
|
||||
|
||||
In the future, we’ll be expanding both declarative and procedural macros. Rust
|
||||
will use better declarative macro system with the `macro` keyword, and we’ll
|
||||
add more types of procedural macros, for more powerful tasks than just
|
||||
`derive`. These systems are still under development at the time of publication;
|
||||
please consult the online Rust documentation for the latest information.
|
||||
22
2018-edition/src/appendix-05-translation.md
Normal file
22
2018-edition/src/appendix-05-translation.md
Normal file
@@ -0,0 +1,22 @@
|
||||
## Appendix E: Translations of the Book
|
||||
|
||||
For resources in languages other than English. Most are still in progress; see
|
||||
[the Translations label][label] to help or let us know about a new translation!
|
||||
|
||||
[label]: https://github.com/rust-lang/book/issues?q=is%3Aopen+is%3Aissue+label%3ATranslations
|
||||
|
||||
- [Português](https://github.com/rust-br/rust-book-pt-br) (BR)
|
||||
- [Português](https://github.com/nunojesus/rust-book-pt-pt) (PT)
|
||||
- [Tiếng việt](https://github.com/hngnaig/rust-lang-book/tree/vi-VN)
|
||||
- [简体中文](http://www.broadview.com.cn/article/144), [alternate](https://github.com/KaiserY/trpl-zh-cn)
|
||||
- [Українська](https://github.com/pavloslav/rust-book-uk-ua)
|
||||
- [Español](https://github.com/thecodix/book)
|
||||
- [Italiano](https://github.com/CodelessFuture/trpl2-it)
|
||||
- [Русский](https://github.com/iDeBugger/rust-book-ru)
|
||||
- [한국어](https://github.com/rinthel/rust-lang-book-ko)
|
||||
- [日本語](https://github.com/hazama-yuinyan/book)
|
||||
- [Français](https://github.com/quadrifoglio/rust-book-fr)
|
||||
- [Polski](https://github.com/paytchoo/book-pl)
|
||||
- [עברית](https://github.com/idanmel/rust-book-heb)
|
||||
- [Cebuano](https://github.com/agentzero1/book)
|
||||
- [Tagalog](https://github.com/josephace135/book)
|
||||
128
2018-edition/src/appendix-06-newest-features.md
Normal file
128
2018-edition/src/appendix-06-newest-features.md
Normal file
@@ -0,0 +1,128 @@
|
||||
# Appendix F - Newest Features
|
||||
|
||||
This appendix documents features that have been added to stable Rust since the
|
||||
main part of the book was completed.
|
||||
|
||||
|
||||
## Field init shorthand
|
||||
|
||||
We can initialize a data structure (struct, enum, union) with named
|
||||
fields, by writing `fieldname` as a shorthand for `fieldname: fieldname`.
|
||||
This allows a compact syntax for initialization, with less duplication:
|
||||
|
||||
```rust
|
||||
#[derive(Debug)]
|
||||
struct Person {
|
||||
name: String,
|
||||
age: u8,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let name = String::from("Peter");
|
||||
let age = 27;
|
||||
|
||||
// Using full syntax:
|
||||
let peter = Person { name: name, age: age };
|
||||
|
||||
let name = String::from("Portia");
|
||||
let age = 27;
|
||||
|
||||
// Using field init shorthand:
|
||||
let portia = Person { name, age };
|
||||
|
||||
println!("{:?}", portia);
|
||||
}
|
||||
```
|
||||
|
||||
|
||||
## Returning from loops
|
||||
|
||||
One of the uses of a `loop` is to retry an operation you know can fail, such as
|
||||
checking if a thread completed its job. However, you might need to pass the
|
||||
result of that operation to the rest of your code. If you add it to the `break`
|
||||
expression you use to stop the loop, it will be returned by the broken loop:
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let mut counter = 0;
|
||||
|
||||
let result = loop {
|
||||
counter += 1;
|
||||
|
||||
if counter == 10 {
|
||||
break counter * 2;
|
||||
}
|
||||
};
|
||||
|
||||
assert_eq!(result, 20);
|
||||
}
|
||||
```
|
||||
|
||||
## Nested groups in `use` declarations
|
||||
|
||||
If you have a complex module tree with many different submodules and you need
|
||||
to import a few items from each one, it might be useful to group all the
|
||||
imports in the same declaration to keep your code clean and avoid repeating the
|
||||
base modules’ name.
|
||||
|
||||
The `use` declaration supports nesting to help you in those cases, both with
|
||||
simple imports and glob ones. For example this snippets imports `bar`, `Foo`,
|
||||
all the items in `baz` and `Bar`:
|
||||
|
||||
```rust
|
||||
# #![allow(unused_imports, dead_code)]
|
||||
#
|
||||
# mod foo {
|
||||
# pub mod bar {
|
||||
# pub type Foo = ();
|
||||
# }
|
||||
# pub mod baz {
|
||||
# pub mod quux {
|
||||
# pub type Bar = ();
|
||||
# }
|
||||
# }
|
||||
# }
|
||||
#
|
||||
use foo::{
|
||||
bar::{self, Foo},
|
||||
baz::{*, quux::Bar},
|
||||
};
|
||||
#
|
||||
# fn main() {}
|
||||
```
|
||||
|
||||
## Inclusive ranges
|
||||
|
||||
Previously, when a range (`..` or `...`) was used as an expression, it had to be
|
||||
`..`, which is exclusive of the upper bound, while patterns had to use `...`,
|
||||
which is inclusive of the upper bound. Now, `..=` is accepted as syntax for
|
||||
inclusive ranges in both expression and range context:
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
for i in 0 ..= 10 {
|
||||
match i {
|
||||
0 ..= 5 => println!("{}: low", i),
|
||||
6 ..= 10 => println!("{}: high", i),
|
||||
_ => println!("{}: out of range", i),
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
The `...` syntax is still accepted in matches, but it is not accepted in
|
||||
expressions. `..=` should be preferred.
|
||||
|
||||
## 128-bit integers
|
||||
|
||||
Rust 1.26.0 added 128-bit integer primitives:
|
||||
|
||||
- `u128`: A 128-bit unsigned integer with range [0, 2^128 - 1]
|
||||
- `i128`: A 128-bit signed integer with range [-(2^127), 2^127 - 1]
|
||||
|
||||
These primitives are implemented efficiently via LLVM support. They are
|
||||
available even on platforms that don’t natively support 128-bit integers and
|
||||
can be used like the other integer types.
|
||||
|
||||
These primitives can be very useful for algorithms that need to use very large
|
||||
integers efficiently, such as certain cryptographic algorithms.
|
||||
204
2018-edition/src/appendix-07-nightly-rust.md
Normal file
204
2018-edition/src/appendix-07-nightly-rust.md
Normal file
@@ -0,0 +1,204 @@
|
||||
# Appendix G - How Rust is Made and “Nightly Rust”
|
||||
|
||||
This appendix is about how Rust is made and how that affects you as a Rust
|
||||
developer. We mentioned that the output in this book was generated by stable
|
||||
Rust 1.21.0, but any examples that compile should continue to compile in any
|
||||
stable version of Rust greater than that. This section is to explain how we
|
||||
ensure this is true!
|
||||
|
||||
### Stability Without Stagnation
|
||||
|
||||
As a language, Rust cares a *lot* about the stability of your code. We want
|
||||
Rust to be a rock-solid foundation you can build on, and if things were
|
||||
constantly changing, that would be impossible. At the same time, if we can’t
|
||||
experiment with new features, we may not find out important flaws until after
|
||||
their release, when we can no longer change things.
|
||||
|
||||
Our solution to this problem is what we call “stability without stagnation”,
|
||||
and our guiding principle is this: you should never have to fear upgrading to a
|
||||
new version of stable Rust. Each upgrade should be painless, but should also
|
||||
bring you new features, fewer bugs, and faster compile times.
|
||||
|
||||
### Choo, Choo! Release Channels and Riding the Trains
|
||||
|
||||
Rust development operates on a *train schedule*. That is, all development is
|
||||
done on the `master` branch of the Rust repository. Releases follow a software
|
||||
release train model, which has been used by Cisco IOS and other software
|
||||
projects. There are three *release channels* for Rust:
|
||||
|
||||
* Nightly
|
||||
* Beta
|
||||
* Stable
|
||||
|
||||
Most Rust developers primarily use the stable channel, but those who want to
|
||||
try out experimental new features may use nightly or beta.
|
||||
|
||||
Here’s an example of how the development and release process works: let’s
|
||||
assume that the Rust team is working on the release of Rust 1.5. That release
|
||||
happened in December of 2015, but it will provide us with realistic version
|
||||
numbers. A new feature is added to Rust: a new commit lands on the `master`
|
||||
branch. Each night, a new nightly version of Rust is produced. Every day is a
|
||||
release day, and these releases are created by our release infrastructure
|
||||
automatically. So as time passes, our releases look like this, once a night:
|
||||
|
||||
```text
|
||||
nightly: * - - * - - *
|
||||
```
|
||||
|
||||
Every six weeks, it’s time to prepare a new release! The `beta` branch of the
|
||||
Rust repository branches off from the `master` branch used by nightly. Now,
|
||||
there are two releases:
|
||||
|
||||
```text
|
||||
nightly: * - - * - - *
|
||||
|
|
||||
beta: *
|
||||
```
|
||||
|
||||
Most Rust users do not use beta releases actively, but test against beta in
|
||||
their CI system to help Rust discover possible regressions. In the meantime,
|
||||
there’s still a nightly release every night:
|
||||
|
||||
```text
|
||||
nightly: * - - * - - * - - * - - *
|
||||
|
|
||||
beta: *
|
||||
```
|
||||
|
||||
Let’s say a regression is found. Good thing we had some time to test the beta
|
||||
release before the regression snuck into a stable release! The fix is applied
|
||||
to `master`, so that nightly is fixed, and then the fix is backported to the
|
||||
`beta` branch, and a new release of beta is produced:
|
||||
|
||||
```text
|
||||
nightly: * - - * - - * - - * - - * - - *
|
||||
|
|
||||
beta: * - - - - - - - - *
|
||||
```
|
||||
|
||||
Six weeks after the first beta was created, it’s time for a stable release! The
|
||||
`stable` branch is produced from the `beta` branch:
|
||||
|
||||
```text
|
||||
nightly: * - - * - - * - - * - - * - - * - * - *
|
||||
|
|
||||
beta: * - - - - - - - - *
|
||||
|
|
||||
stable: *
|
||||
```
|
||||
|
||||
Hooray! Rust 1.5 is done! However, we’ve forgotten one thing: because the six
|
||||
weeks have gone by, we also need a new beta of the *next* version of Rust, 1.6.
|
||||
So after `stable` branches off of `beta`, the next version of `beta` branches
|
||||
off of `nightly` again:
|
||||
|
||||
```text
|
||||
nightly: * - - * - - * - - * - - * - - * - * - *
|
||||
| |
|
||||
beta: * - - - - - - - - * *
|
||||
|
|
||||
stable: *
|
||||
```
|
||||
|
||||
This is called the “train model” because every six weeks, a release “leaves the
|
||||
station”, but still has to take a journey through the beta channel before it
|
||||
arrives as a stable release.
|
||||
|
||||
Rust releases every six weeks, like clockwork. If you know the date of one Rust
|
||||
release, you can know the date of the next one: it’s six weeks later. A nice
|
||||
aspect of having releases scheduled every six weeks is that the next train is
|
||||
coming soon. If a feature happens to miss a particular release, there’s no need
|
||||
to worry: another one is happening in a short time! This helps reduce pressure
|
||||
to sneak possibly unpolished features in close to the release deadline.
|
||||
|
||||
Thanks to this process, you can always check out the next build of Rust and
|
||||
verify for yourself that it’s easy to upgrade to: if a beta release doesn’t
|
||||
work as expected, you can report it to the team and get it fixed before the
|
||||
next stable release happens! Breakage in a beta release is relatively rare, but
|
||||
`rustc` is still a piece of software, and bugs do exist.
|
||||
|
||||
### Unstable Features
|
||||
|
||||
There’s one more catch with this release model: unstable features. Rust uses a
|
||||
technique called “feature flags” to determine what features are enabled in a
|
||||
given release. If a new feature is under active development, it lands on
|
||||
`master`, and therefore, in nightly, but behind a *feature flag*. If you, as a
|
||||
user, wish to try out the work-in-progress feature, you can, but you must be
|
||||
using a nightly release of Rust and annotate your source code with the
|
||||
appropriate flag to opt in.
|
||||
|
||||
If you’re using a beta or stable release of Rust, you can’t use any feature
|
||||
flags. This is the key that allows us to get practical use with new features
|
||||
before we declare them stable forever. Those who wish to opt into the bleeding
|
||||
edge can do so, and those who want a rock-solid experience can stick with
|
||||
stable and know that their code won’t break. Stability without stagnation.
|
||||
|
||||
This book only contains information about stable features, as in-progress
|
||||
features are still changing, and surely they’ll be different between when this
|
||||
book was written and when they get enabled in stable builds. You can find
|
||||
documentation for nightly-only features online.
|
||||
|
||||
### Rustup and the Role of Rust Nightly
|
||||
|
||||
Rustup makes it easy to change between different release channels of Rust, on a
|
||||
global or per-project basis. By default, you’ll have stable Rust installed. To
|
||||
install nightly, for example:
|
||||
|
||||
```text
|
||||
$ rustup install nightly
|
||||
```
|
||||
|
||||
You can see all of the *toolchains* (releases of Rust and associated
|
||||
components) you have installed with `rustup` as well. Here’s an example on one
|
||||
of your authors’ computers:
|
||||
|
||||
```powershell
|
||||
> rustup toolchain list
|
||||
stable-x86_64-pc-windows-msvc (default)
|
||||
beta-x86_64-pc-windows-msvc
|
||||
nightly-x86_64-pc-windows-msvc
|
||||
```
|
||||
|
||||
As you can see, the stable toolchain is the default. Most Rust users use stable
|
||||
most of the time. You might want to use stable most of the time, but use
|
||||
nightly on a specific project, because you care about a cutting-edge feature.
|
||||
To do so, you can use `rustup override` in that project’s directory to set the
|
||||
nightly toolchain as the one `rustup` should use when you’re in that directory:
|
||||
|
||||
```text
|
||||
$ cd ~/projects/needs-nightly
|
||||
$ rustup override add nightly
|
||||
```
|
||||
|
||||
Now, every time you call `rustc` or `cargo` inside of
|
||||
*~/projects/needs-nightly*, `rustup` will make sure that you are using nightly
|
||||
Rust, rather than your default of stable Rust. This comes in handy when you
|
||||
have a lot of Rust projects!
|
||||
|
||||
### The RFC Process and Teams
|
||||
|
||||
So how do you learn about these new features? Rust’s development model follows
|
||||
a *Request For Comments (RFC) process*. If you’d like an improvement in Rust,
|
||||
you can write up a proposal, called an RFC.
|
||||
|
||||
Anyone can write RFCs to improve Rust, and the proposals are reviewed and
|
||||
discussed by the Rust team, which is comprised of many topic subteams. There’s
|
||||
a full list of the teams [on Rust’s
|
||||
website](https://www.rust-lang.org/en-US/team.html), which includes teams for
|
||||
each area of the project: language design, compiler implementation,
|
||||
infrastructure, documentation, and more. The appropriate team reads the
|
||||
proposal and the comments, writes some comments of their own, and eventually,
|
||||
there’s consensus to accept or reject the feature.
|
||||
|
||||
If the feature is accepted, an issue is opened on the Rust repository, and
|
||||
someone can implement it. The person who implements it very well may not be the
|
||||
person who proposed the feature in the first place! When the implementation is
|
||||
ready, it lands on the `master` branch behind a feature gate, as we discussed
|
||||
in the “Unstable Features” section.
|
||||
|
||||
After some time, once Rust developers who use nightly releases have been able
|
||||
to try out the new feature, team members will discuss the feature, how it’s
|
||||
worked out on nightly, and decide if it should make it into stable Rust or not.
|
||||
If the decision is to move forward, the feature gate is removed, and the
|
||||
feature is now considered stable! It rides the trains into a new stable release
|
||||
of Rust.
|
||||
173
2018-edition/src/ch00-00-introduction.md
Normal file
173
2018-edition/src/ch00-00-introduction.md
Normal file
@@ -0,0 +1,173 @@
|
||||
# Introduction
|
||||
|
||||
Welcome to *The Rust Programming Language*, an introductory book about Rust.
|
||||
|
||||
The Rust programming language helps you write faster, more reliable software.
|
||||
High-level ergonomics and low-level control are often at odds in programming
|
||||
language design; Rust challenges that conflict. Through balancing powerful
|
||||
technical capacity and a great developer experience, Rust gives you the option
|
||||
to control low-level details (such as memory usage) without all the hassle
|
||||
traditionally associated with such control.
|
||||
|
||||
## Who Rust Is For
|
||||
|
||||
Rust is ideal for many people for a variety of reasons. Let’s look at a few of
|
||||
the most important groups.
|
||||
|
||||
### Teams of Developers
|
||||
|
||||
Rust is proving to be a productive tool for collaborating among large teams of
|
||||
developers with varying levels of systems programming knowledge. Low-level code
|
||||
is prone to a variety of subtle bugs, which in most other languages can only be
|
||||
caught through extensive testing and careful code review by experienced
|
||||
developers. In Rust, the compiler plays a gatekeeper role by refusing to
|
||||
compile code with these elusive bugs, including concurrency bugs. By working
|
||||
alongside the compiler, the team can spend more time focusing on the program’s
|
||||
logic rather than chasing down bugs.
|
||||
|
||||
Rust also brings contemporary developer tools to the systems programming world:
|
||||
|
||||
* Cargo, the included dependency manager and build tool, makes adding,
|
||||
compiling, and managing dependencies painless and consistent across the Rust
|
||||
ecosystem.
|
||||
* Rustfmt ensures a consistent coding style across developers.
|
||||
* The Rust Language Server powers Integrated Development Environment (IDE)
|
||||
integration for code completion and inline error messages.
|
||||
|
||||
By using these and other tools in the Rust ecosystem, developers can be
|
||||
productive while writing systems-level code.
|
||||
|
||||
### Students
|
||||
|
||||
Rust is for students and those who are interested in learning about systems
|
||||
concepts. Using Rust, many people have learned about topics like operating
|
||||
systems development. The community is very welcoming and happy to answer
|
||||
student questions. Through efforts such as this book, the Rust teams want to
|
||||
make systems concepts more accessible to more people, especially those new to
|
||||
programming.
|
||||
|
||||
### Companies
|
||||
|
||||
Hundreds of companies, large and small, use Rust in production for a variety of
|
||||
tasks. Those tasks include command line tools, web services, DevOps tooling,
|
||||
embedded devices, audio and video analysis and transcoding, cryptocurrencies,
|
||||
bioinformatics, search engines, internet of things applications, machine
|
||||
learning, and even major parts of the Firefox web browser.
|
||||
|
||||
### Open Source Developers
|
||||
|
||||
Rust is for people who want to build the Rust programming language, community,
|
||||
developer tools, and libraries. We’d love to have you contribute to the Rust
|
||||
language.
|
||||
|
||||
### People Who Value Speed and Stability
|
||||
|
||||
Rust is for people who crave speed and stability in a language. By speed, we
|
||||
mean the speed of the programs that you can create with Rust and the speed at
|
||||
which Rust lets you write them. The Rust compiler’s checks ensure stability
|
||||
through feature additions and refactoring as opposed to brittle legacy code in
|
||||
languages without these checks that developers are afraid to modify. By
|
||||
striving for zero-cost abstractions, higher-level features that compile to
|
||||
lower-level code as fast as code written manually, Rust endeavors to make safe
|
||||
code be fast code as well.
|
||||
|
||||
Although we’ve not provided a complete list of everyone the Rust language hopes
|
||||
to support, those we have mentioned are some of the biggest stakeholders.
|
||||
Overall, Rust’s greatest ambition is to eliminate the dichotomy of the
|
||||
trade-offs that programmers have accepted for decades: safety *and*
|
||||
productivity, speed *and* ergonomics. Give Rust a try, and see if its choices
|
||||
work for you.
|
||||
|
||||
## Who This Book Is For
|
||||
|
||||
This book assumes that you’ve written code in another programming language but
|
||||
doesn’t make any assumptions about which one. We’ve tried to make the material
|
||||
broadly accessible to those from a wide variety of programming backgrounds. We
|
||||
don’t spend a lot of time talking about what programming *is* or how to think
|
||||
about it. If you’re entirely new to programming, you would be better served by
|
||||
reading a book that specifically provides an introduction to programming.
|
||||
|
||||
## How to Use This Book
|
||||
|
||||
In general, this book assumes that you’re reading it in sequence from front to
|
||||
back. Later chapters build on concepts in earlier chapters, and earlier
|
||||
chapters might not delve into details on a topic; we typically revisit the
|
||||
topic in a later chapter.
|
||||
|
||||
You’ll find two kinds of chapters in this book: concept chapters and project
|
||||
chapters. In concept chapters, you’ll learn about an aspect of Rust. In project
|
||||
chapters, we’ll build small programs together, applying what you’ve learned so
|
||||
far. Chapters 2, 12, and 20 are project chapters; the rest are concept chapters.
|
||||
|
||||
Additionally, Chapter 2 is a hands-on introduction to the Rust language. We’ll
|
||||
cover concepts at a high level, and later chapters will provide additional
|
||||
detail. If you want to get your hands dirty right away, Chapter 2 is the one
|
||||
for that. At first, you might even want to skip Chapter 3, which covers Rust
|
||||
features similar to other programming language features, and head straight to
|
||||
Chapter 4 to learn about Rust’s ownership system. However, if you’re a
|
||||
particularly meticulous learner who prefers to learn every detail before moving
|
||||
onto the next, you might want to skip Chapter 2 and go straight to Chapter 3,
|
||||
returning to Chapter 2 when you’d like to work on a project applying those
|
||||
details.
|
||||
|
||||
Chapter 5 discusses structs and methods, and Chapter 6 covers enums, `match`
|
||||
expressions, and the `if let` control flow construct. You’ll use structs and
|
||||
enums to make custom types in Rust.
|
||||
|
||||
In Chapter 7, you’ll learn about Rust’s module system and about privacy rules
|
||||
for organizing your code and its public Application Programming Interface
|
||||
(API). Chapter 8 discusses some common collection data structures that the
|
||||
standard library provides, such as vectors, strings, and hash maps. Chapter 9
|
||||
explores Rust’s error handling philosophy and techniques.
|
||||
|
||||
Chapter 10 digs into generics, traits, and lifetimes, which give you the power
|
||||
to define code that applies to multiple types. Chapter 11 is all about testing,
|
||||
which is still necessary even with Rust’s safety guarantees to ensure your
|
||||
program’s logic is correct. In Chapter 12, we’ll build our own implementation
|
||||
of a subset of functionality from the `grep` command line tool that searches
|
||||
for text within files. For this, we’ll use many of the concepts we discussed in
|
||||
the previous chapters.
|
||||
|
||||
Chapter 13 explores closures and iterators: features of Rust that come from
|
||||
functional programming languages. In Chapter 14, we’ll examine Cargo in more
|
||||
depth and talk about best practices for sharing your libraries with others.
|
||||
Chapter 15 discusses smart pointers that the standard library provides and the
|
||||
traits that enable their functionality.
|
||||
|
||||
In Chapter 16, we’ll walk through different models of concurrent programming
|
||||
and talk about how Rust helps you to program in multiple threads fearlessly.
|
||||
Chapter 17 looks at how Rust idioms compare to object oriented programming
|
||||
principles you might be familiar with.
|
||||
|
||||
Chapter 18 is a reference on patterns and pattern matching, which are powerful
|
||||
ways of expressing ideas throughout Rust programs. Chapter 19 contains a
|
||||
smorgasbord of advanced topics of interest, including unsafe Rust and more
|
||||
about lifetimes, traits, types, functions, and closures.
|
||||
|
||||
In Chapter 20, we’ll complete a project in which we’ll implement a low-level
|
||||
multithreaded web server!
|
||||
|
||||
Finally, some appendixes contain useful information about the language in a
|
||||
more reference-like format. Appendix A covers Rust’s keywords. Appendix B
|
||||
covers Rust’s operators and symbols. Appendix C covers derivable traits
|
||||
provided by the standard library. Appendix D covers macros.
|
||||
|
||||
There is no wrong way to read this book: if you want to skip ahead, go for it!
|
||||
You might have to jump back to earlier chapters if you experience any
|
||||
confusion. But do whatever works for you.
|
||||
|
||||
An important part of the process of learning Rust is learning how to read the
|
||||
error messages the compiler displays: these will guide you toward working code.
|
||||
As such, we’ll provide many examples of code that don’t compile along with the
|
||||
error message the compiler will show you in each situation. Know that if you
|
||||
enter and run a random example, it may not compile! Make sure you read the
|
||||
surrounding text to see whether the example you’re trying to run is meant to
|
||||
error. In most situations, we’ll lead you to the correct version of any code
|
||||
that doesn’t compile.
|
||||
|
||||
## Source Code
|
||||
|
||||
The source files from which this book is generated can be found on
|
||||
[GitHub][book].
|
||||
|
||||
[book]: https://github.com/rust-lang/book/tree/master/2018-edition/src
|
||||
12
2018-edition/src/ch01-00-getting-started.md
Normal file
12
2018-edition/src/ch01-00-getting-started.md
Normal file
@@ -0,0 +1,12 @@
|
||||
# Getting Started
|
||||
|
||||
<!-- If you want to use this paragraph in the Introduction, can you replace it
|
||||
with some other introductory text for the chapter here? Maybe just lay out
|
||||
what's in this chapter so they know it's important not to skip it. -->
|
||||
<!-- Yep, done! /Carol -->
|
||||
|
||||
Let’s get your Rust journey started! In this chapter, we’ll discuss:
|
||||
|
||||
- Installing Rust on Linux, Mac, or Windows
|
||||
- Writing a program that prints “Hello, world!”
|
||||
- Using `cargo`, Rust’s package manager and build system
|
||||
154
2018-edition/src/ch01-01-installation.md
Normal file
154
2018-edition/src/ch01-01-installation.md
Normal file
@@ -0,0 +1,154 @@
|
||||
## Installation
|
||||
|
||||
The first step to using Rust is to install it. We’ll download Rust through
|
||||
`rustup`, a command-line tool for managing Rust versions and associated tools.
|
||||
For this you’ll need an internet connection.
|
||||
|
||||
The following steps will install the latest stable version of the Rust
|
||||
compiler. The examples and output shown in this book all use stable Rust
|
||||
1.21.0. Rust’s stability guarantees ensure that all of the examples in the book
|
||||
that compile will continue to compile with newer versions of Rust. The output
|
||||
may differ slightly between versions, as error messages and warnings are often
|
||||
improved. In other words, any newer, stable version of Rust you will install
|
||||
with these steps should work as expected with the content of this book.
|
||||
|
||||
<!-- PROD: Start Box -->
|
||||
|
||||
> #### Command Line Notation
|
||||
>
|
||||
> In this chapter and throughout the book we’ll be showing some commands used
|
||||
> in the terminal. Lines that should be entered in a terminal all start with
|
||||
> `$`. You don’t need to type in the `$` character, it is simply there to
|
||||
> indicate the start of each command. Many tutorials use this convention: `$`
|
||||
> for commands run as a regular user, and `#` for commands you should be
|
||||
> running as an administrator. Lines that don’t start with `$` are typically
|
||||
> showing the output of the previous command. Additionally, PowerShell specific
|
||||
> examples will use `>` rather than `$`.
|
||||
|
||||
<!-- PROD: End box -->
|
||||
|
||||
### Installing Rustup on Linux or Mac
|
||||
|
||||
If you’re on Linux or a Mac, open a terminal and enter the following command:
|
||||
|
||||
```text
|
||||
$ curl https://sh.rustup.rs -sSf | sh
|
||||
```
|
||||
|
||||
This will download a script and start the installation of the `rustup` tool,
|
||||
which installs the latest stable version of Rust. You may be prompted for your
|
||||
password. If it all goes well, you’ll see this appear:
|
||||
|
||||
```text
|
||||
Rust is installed now. Great!
|
||||
```
|
||||
|
||||
Of course, if you distrust using `curl URL | sh` to install software, you can
|
||||
download, inspect, and run the script however you like.
|
||||
|
||||
The installation script automatically adds Rust to your system PATH after your
|
||||
next login. If you want to start using Rust right away instead of restarting
|
||||
your terminal, run the following command in your shell to add Rust to your
|
||||
system PATH manually:
|
||||
|
||||
<!-- what does this command do? Do you mean instead of logging out and logging
|
||||
in, enter the following? -->
|
||||
<!-- It runs a script that adds Rust to your system PATH manually. I've
|
||||
clarified that yes, this is instead of logging out and back in to your
|
||||
terminal. /Carol -->
|
||||
|
||||
```text
|
||||
$ source $HOME/.cargo/env
|
||||
```
|
||||
|
||||
Alternatively, you can add the following line to your `~/.bash_profile`:
|
||||
|
||||
```text
|
||||
$ export PATH="$HOME/.cargo/bin:$PATH"
|
||||
```
|
||||
|
||||
Finally, you’ll need a linker of some kind. It’s likely you already have one
|
||||
installed, but if you try to compile a Rust program and get errors telling you
|
||||
that a linker could not be executed, you’ll need to install one. You can
|
||||
install a C compiler, as that will usually come with the correct linker. Check
|
||||
your platform’s documentation for how to install a C compiler. Some common Rust
|
||||
packages depend on C code and will need a C compiler too, so it may be worth
|
||||
installing one now regardless.
|
||||
|
||||
### Installing Rustup on Windows
|
||||
|
||||
On Windows, go to [https://www.rust-lang.org/en-US/install.html][install] and
|
||||
follow the instructions for installing Rust. At some point in the installation
|
||||
you’ll receive a message telling you you’ll also need the C++ build tools for
|
||||
Visual Studio 2013 or later. The easiest way to acquire the build tools is to
|
||||
install [Build Tools for Visual Studio 2017][visualstudio], found in the Other
|
||||
Tools and Frameworks section.
|
||||
|
||||
[install]: https://www.rust-lang.org/en-US/install.html
|
||||
[visualstudio]: https://www.visualstudio.com/downloads/
|
||||
|
||||
The rest of this book will use commands that work in both `cmd.exe` and
|
||||
PowerShell. If there are specific differences, we’ll explain which to use.
|
||||
|
||||
### Custom Installations Without Rustup
|
||||
|
||||
If you have reasons for preferring not to use `rustup`, please see [the Rust
|
||||
installation page](https://www.rust-lang.org/install.html) for other options.
|
||||
|
||||
### Updating and Uninstalling
|
||||
|
||||
Once you have Rust installed via `rustup`, updating to the latest version is
|
||||
easy. From your shell, run the update script:
|
||||
|
||||
```text
|
||||
$ rustup update
|
||||
```
|
||||
|
||||
To uninstall Rust and `rustup`, from your shell, run the uninstall script:
|
||||
|
||||
```text
|
||||
$ rustup self uninstall
|
||||
```
|
||||
|
||||
### Troubleshooting
|
||||
|
||||
To check whether you have Rust installed correctly, open up a shell and enter:
|
||||
|
||||
```text
|
||||
$ rustc --version
|
||||
```
|
||||
|
||||
You should see the version number, commit hash, and commit date for the latest
|
||||
stable version at the time you install in the following format:
|
||||
|
||||
```text
|
||||
rustc x.y.z (abcabcabc yyyy-mm-dd)
|
||||
```
|
||||
|
||||
If you see this, Rust has been installed successfully! Congrats!
|
||||
|
||||
If you don’t and you’re on Windows, check that Rust is in your `%PATH%` system
|
||||
variable.
|
||||
|
||||
If that’s all correct and Rust still isn’t working, there are a number of
|
||||
places you can get help. The easiest is [the #rust IRC channel on
|
||||
irc.mozilla.org][irc]<!-- ignore -->, which you can access through
|
||||
[Mibbit][mibbit]. Go to that address, and you’ll be chatting with other
|
||||
Rustaceans (a silly nickname we call ourselves) who can help you out. Other
|
||||
great resources include [the Users forum][users] and [Stack
|
||||
Overflow][stackoverflow].
|
||||
|
||||
[irc]: irc://irc.mozilla.org/#rust
|
||||
[mibbit]: http://chat.mibbit.com/?server=irc.mozilla.org&channel=%23rust
|
||||
[users]: https://users.rust-lang.org/
|
||||
[stackoverflow]: http://stackoverflow.com/questions/tagged/rust
|
||||
|
||||
### Local Documentation
|
||||
|
||||
The installer also includes a copy of the documentation locally, so you can
|
||||
read it offline. Run `rustup doc` to open the local documentation in your
|
||||
browser.
|
||||
|
||||
Any time there’s a type or function provided by the standard library and you’re
|
||||
not sure what it does or how to use it, use the API (Application Programming
|
||||
Interface) documentation to find out!
|
||||
218
2018-edition/src/ch01-02-hello-world.md
Normal file
218
2018-edition/src/ch01-02-hello-world.md
Normal file
@@ -0,0 +1,218 @@
|
||||
## Hello, World!
|
||||
|
||||
Now that you have Rust installed, let’s write your first Rust program. It’s
|
||||
traditional when learning a new language to write a little program to print the
|
||||
text “Hello, world!” to the screen, so we’ll do the same here!
|
||||
|
||||
> Note: This book assumes basic familiarity with the command line. Rust itself
|
||||
> makes no specific demands about your editing, tooling, or where your code
|
||||
> lives, so if you prefer an IDE (Integrated Development Environment) to the
|
||||
> command line, feel free to use your favorite IDE. Many IDEs now have some
|
||||
> degree of Rust support; check the IDE’s documentation for details. Enabling
|
||||
> great IDE support has been a recent focus of the Rust team, and progress
|
||||
> has been made rapidly on that front!
|
||||
|
||||
### Creating a Project Directory
|
||||
|
||||
First, make a directory to put your Rust code in. Rust doesn’t care where your
|
||||
code lives, but for the exercises and projects in this book, we’d suggest
|
||||
making a *projects* directory in your home directory and keeping all your
|
||||
projects there.
|
||||
|
||||
Open a terminal and enter the following commands to make a *projects* directory
|
||||
and, inside that, a directory for this “Hello, world!” project:
|
||||
|
||||
Linux and Mac:
|
||||
|
||||
```text
|
||||
$ mkdir ~/projects
|
||||
$ cd ~/projects
|
||||
$ mkdir hello_world
|
||||
$ cd hello_world
|
||||
```
|
||||
|
||||
Windows CMD:
|
||||
|
||||
```cmd
|
||||
> mkdir "%USERPROFILE%\projects"
|
||||
> cd /d "%USERPROFILE%\projects"
|
||||
> mkdir hello_world
|
||||
> cd hello_world
|
||||
```
|
||||
|
||||
Windows PowerShell:
|
||||
|
||||
```powershell
|
||||
> mkdir $env:USERPROFILE\projects
|
||||
> cd $env:USERPROFILE\projects
|
||||
> mkdir hello_world
|
||||
> cd hello_world
|
||||
```
|
||||
|
||||
### Writing and Running a Rust Program
|
||||
|
||||
Next, make a new source file and call it *main.rs*---Rust files always end with
|
||||
the *.rs* extension. If you’re using more than one word in your filename, use
|
||||
an underscore to separate them. For example, you’d use *hello_world.rs* rather
|
||||
than *helloworld.rs*.
|
||||
|
||||
Now open the *main.rs* file you just created, and enter the code shown in
|
||||
Listing 1-1:
|
||||
|
||||
<span class="filename">Filename: main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
println!("Hello, world!");
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 1-1: A program that prints “Hello, world!”</span>
|
||||
|
||||
Save the file, and go back to your terminal window. On Linux or macOS, enter
|
||||
the following commands to compile and run the file:
|
||||
|
||||
```text
|
||||
$ rustc main.rs
|
||||
$ ./main
|
||||
Hello, world!
|
||||
```
|
||||
|
||||
On Windows, use `.\main.exe` instead of `./main`.
|
||||
|
||||
```powershell
|
||||
> rustc main.rs
|
||||
> .\main.exe
|
||||
Hello, world!
|
||||
```
|
||||
|
||||
Regardless of your operating system, you should see the string `Hello, world!`
|
||||
print to the terminal. If you don’t see this output, see the “Troubleshooting”
|
||||
section earlier for ways to get help.
|
||||
|
||||
If you did see `Hello, world!` printed, then congratulations! You’ve officially
|
||||
written a Rust program. That makes you a Rust programmer! Welcome!
|
||||
|
||||
<!-- Any quick words of advice for if they didn't? (Disclosure: I tried
|
||||
following this using Bash on windows and couldn't get it working) -->
|
||||
<!-- Added a pointer to the previous troubleshooting section which also applies
|
||||
here /Carol -->
|
||||
|
||||
### Anatomy of a Rust Program
|
||||
|
||||
Now, let’s go over what just happened in your “Hello, world!” program in
|
||||
detail. Here’s the first piece of the puzzle:
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
|
||||
}
|
||||
```
|
||||
|
||||
These lines define a *function* in Rust. The `main` function is special: it is
|
||||
always the first code that is run for every executable Rust program. The first
|
||||
line declares a function named `main` that has no parameters and returns
|
||||
nothing. If there were parameters, their names would go inside the parentheses,
|
||||
`(` and `)`.
|
||||
|
||||
Also note that the function body is wrapped in curly brackets, `{` and `}`.
|
||||
Rust requires these around all function bodies. It’s considered good style to
|
||||
place the opening curly bracket on the same line as the function declaration,
|
||||
with one space in between.
|
||||
|
||||
> At the time of writing, an automatic formatter, `rustfmt`, is under
|
||||
> development. If you’d like to stick to a standard style across Rust projects,
|
||||
> `rustfmt` is a tool that will format your code in a particular style. The
|
||||
> plan is to eventually include it with the standard Rust distribution, like
|
||||
> `rustc`, so depending on when you read this book, you may have it already
|
||||
> installed! Check the online documentation for more details.
|
||||
|
||||
Inside the `main` function, we have this code:
|
||||
|
||||
```rust
|
||||
println!("Hello, world!");
|
||||
```
|
||||
|
||||
This line does all of the work in this little program: it prints text to the
|
||||
screen. There are a number of details to notice here. The first is that Rust
|
||||
style is to indent with four spaces, not a tab.
|
||||
|
||||
The second important detail is the `println!` call. This code is calling a Rust
|
||||
*macro*. If it were calling a function instead, it would be entered as
|
||||
`println` (without the `!`). We’ll discuss Rust macros in more detail in
|
||||
Appendix D, but for now you just need to know that when you see a `!` that
|
||||
means that you’re calling a macro instead of a normal function.
|
||||
|
||||
<!-- I might suggest just cutting this next macro section -- for the sake of
|
||||
the intro, we don't really need this info, and I feel like this first exercise
|
||||
should be short and sweet and simple -->
|
||||
<!-- I'm ok with cutting this; it's a fairly common question that some folks
|
||||
have at this point, but I'm ok with those people having to do some research
|
||||
online if they're curious /Carol -->
|
||||
|
||||
Next comes`"Hello, world!"` which is a *string*. We pass this string as an
|
||||
argument to `println!` and the total effect is that the string is printed to
|
||||
the screen. Easy enough!
|
||||
|
||||
We end the line with a semicolon `;`, which indicates that this expression is
|
||||
over, and the next one is ready to begin. Most lines of Rust code end with a
|
||||
`;`.
|
||||
|
||||
### Compiling and Running Are Separate Steps
|
||||
|
||||
You’ve just seen how to run a newly created program, so now let’s break that
|
||||
process down and examine each step.
|
||||
|
||||
Before running a Rust program, you have to compile it using the Rust compiler
|
||||
by entering the `rustc` command and passing it the name of your source file,
|
||||
like this:
|
||||
|
||||
```text
|
||||
$ rustc main.rs
|
||||
```
|
||||
|
||||
If you come from a C or C++ background, you’ll notice that this is similar to
|
||||
`gcc` or `clang`. After compiling successfully, Rust outputs a binary
|
||||
executable.
|
||||
|
||||
On Linux, Mac, and PowerShell on Windows, you can see the executable by
|
||||
entering the `ls` command in your shell as follows:
|
||||
|
||||
```text
|
||||
$ ls
|
||||
main main.rs
|
||||
```
|
||||
|
||||
With CMD on Windows, you’d enter:
|
||||
|
||||
```cmd
|
||||
> dir /B %= the /B option says to only show the file names =%
|
||||
main.exe
|
||||
main.pdb
|
||||
main.rs
|
||||
```
|
||||
|
||||
This shows we have two files: the source code, with the *.rs* extension, and
|
||||
the executable (*main.exe* on Windows, *main* everywhere else). All that’s left
|
||||
to do from here is run the *main* or *main.exe* file, like this:
|
||||
|
||||
```text
|
||||
$ ./main # or .\main.exe on Windows
|
||||
```
|
||||
|
||||
If *main.rs* were your “Hello, world!” program, this would print `Hello,
|
||||
world!` to your terminal.
|
||||
|
||||
If you come from a dynamic language like Ruby, Python, or JavaScript, you may
|
||||
not be used to compiling and running a program being separate steps. Rust is an
|
||||
*ahead-of-time compiled* language, which means that you can compile a program,
|
||||
give the executable to someone else, and they can run it even without having
|
||||
Rust installed. If you give someone a `.rb`, `.py`, or `.js` file, on the other
|
||||
hand, they need to have a Ruby, Python, or JavaScript implementation installed
|
||||
(respectively), but you only need one command to both compile and run your
|
||||
program. Everything is a tradeoff in language design.
|
||||
|
||||
Just compiling with `rustc` is fine for simple programs, but as your project
|
||||
grows, you’ll want to be able to manage all of the options and make it easy to
|
||||
share your code. Next, we’ll introduce you to a tool called Cargo, which will
|
||||
help you write real-world Rust programs.
|
||||
266
2018-edition/src/ch01-03-hello-cargo.md
Normal file
266
2018-edition/src/ch01-03-hello-cargo.md
Normal file
@@ -0,0 +1,266 @@
|
||||
## Hello, Cargo!
|
||||
|
||||
Cargo is Rust’s build system and package manager. Most Rustaceans will use this
|
||||
tool to manage their Rust projects because Cargo takes care of a lot of tasks
|
||||
for you, such as building your code, downloading the libraries your code
|
||||
depends on, and building those libraries. (We call libraries your code needs
|
||||
*dependencies*.)
|
||||
|
||||
The simplest Rust programs, like the one we’ve written so far, don’t have any
|
||||
dependencies, so if we had built the Hello World project with Cargo, it would
|
||||
only be using the part of Cargo that takes care of building your code. As you
|
||||
write more complex Rust programs, you’ll want to add dependencies, and if you
|
||||
start the project off using Cargo, that will be a lot easier to do.
|
||||
|
||||
As the vast majority of Rust projects use Cargo, the rest of this book will
|
||||
assume that you’re using Cargo too. Cargo comes installed with Rust itself, if
|
||||
you used the official installers as covered in the “Installation” section. If
|
||||
you installed Rust through some other means, you can check if you have Cargo
|
||||
installed by entering the following into your terminal:
|
||||
|
||||
```text
|
||||
$ cargo --version
|
||||
```
|
||||
|
||||
If you see a version number, great! If you see an error like `command not
|
||||
found`, then you should look at the documentation for your method of
|
||||
installation to determine how to install Cargo separately.
|
||||
|
||||
### Creating a Project with Cargo
|
||||
|
||||
Let’s create a new project using Cargo and look at how it differs from our
|
||||
original Hello World project. Navigate back to your *projects* directory (or
|
||||
whichever location you decided to place your code) and then on any operating
|
||||
system run:
|
||||
|
||||
```text
|
||||
$ cargo new hello_cargo --bin
|
||||
$ cd hello_cargo
|
||||
```
|
||||
|
||||
<!-- Below -- so we always have to start a cargo project with the --bin option
|
||||
if we want it to be something we can execute and not just a library, is that
|
||||
right? It might be worth laying that out -->
|
||||
<!-- As of Rust 1.21.0 (the version we're using for the book), yes, you must
|
||||
always specify `--bin`. In a version of Rust in the near future (1.25 or 1.26),
|
||||
binary crates will become the default kind of crate that `cargo new` makes, so
|
||||
you won't have to specify `--bin` (but you can if you want and the behavior
|
||||
will be the same). We'd rather not go into any more detail than we have here
|
||||
because of this change; I think "The `--bin` argument to passed to `cargo new`
|
||||
makes an executable application (often just called a *binary*), as opposed to a
|
||||
library." lays this out enough. /Carol -->
|
||||
|
||||
This creates a new binary executable called `hello_cargo`. The `--bin` argument
|
||||
to passed to `cargo new` makes an executable application (often just called a
|
||||
*binary*), as opposed to a library. We’ve given `hello_cargo` as the name for
|
||||
our project, and Cargo creates its files in a directory of the same name.
|
||||
|
||||
Go into the *hello_cargo* directory and list the files, and you should see that
|
||||
Cargo has generated two files and one directory for us: a *Cargo.toml* and a
|
||||
*src* directory with a *main.rs* file inside. It has also initialized a new git
|
||||
repository, along with a *.gitignore* file.
|
||||
|
||||
> Note: Git is a common version control system. You can change `cargo new` to
|
||||
> use a different version control system, or no version control system, by
|
||||
> using the `--vcs` flag. Run `cargo new --help` to see the available options.
|
||||
|
||||
Open up *Cargo.toml* in your text editor of choice. It should look similar to
|
||||
the code in Listing 1-2:
|
||||
|
||||
<span class="filename">Filename: Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[package]
|
||||
name = "hello_cargo"
|
||||
version = "0.1.0"
|
||||
authors = ["Your Name <you@example.com>"]
|
||||
|
||||
[dependencies]
|
||||
```
|
||||
|
||||
<span class="caption">Listing 1-2: Contents of *Cargo.toml* generated by `cargo
|
||||
new`</span>
|
||||
|
||||
This file is in the [*TOML*][toml]<!-- ignore --> (Tom’s Obvious, Minimal
|
||||
Language) format, which is what Cargo uses as its configuration format.
|
||||
|
||||
[toml]: https://github.com/toml-lang/toml
|
||||
|
||||
The first line, `[package]`, is a section heading that indicates that the
|
||||
following statements are configuring a package. As we add more information to
|
||||
this file, we’ll add other sections.
|
||||
|
||||
The next three lines set the configuration information Cargo needs in order to
|
||||
know that it should compile your program: the name, the version, and who wrote
|
||||
it. Cargo gets your name and email information from your environment, so if
|
||||
that’s not correct, go ahead and fix that and save the file.
|
||||
|
||||
The last line, `[dependencies]`, is the start of a section for you to list any
|
||||
of your project’s dependencies. In Rust, packages of code are referred to as
|
||||
*crates*. We won’t need any other crates for this project, but we will in the
|
||||
first project in Chapter 2, so we’ll use this dependencies section then.
|
||||
|
||||
Now open up *src/main.rs* and take a look:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
println!("Hello, world!");
|
||||
}
|
||||
```
|
||||
|
||||
Cargo has generated a “Hello World!” for you, just like the one we wrote in
|
||||
Listing 1-1! So far, the differences between our previous project and the
|
||||
project generated by Cargo are that with Cargo our code goes in the *src*
|
||||
directory, and we have a *Cargo.toml* configuration file in the top directory.
|
||||
|
||||
Cargo expects your source files to live inside the *src* directory; the
|
||||
top-level project directory is just for READMEs, license information,
|
||||
configuration files, and anything else not related to your code. In this way,
|
||||
using Cargo helps you keep your projects nice and tidy. There’s a place for
|
||||
everything, and everything is in its place.
|
||||
|
||||
If you started a project that doesn’t use Cargo, as we did with our project in
|
||||
the *hello_world* directory, you can convert it to a project that does use
|
||||
Cargo by moving the project code into the *src* directory and creating an
|
||||
appropriate *Cargo.toml*.
|
||||
|
||||
### Building and Running a Cargo Project
|
||||
|
||||
Now let’s look at what’s different about building and running your Hello World
|
||||
program through Cargo! From your project directory, build your project by
|
||||
entering the following commands:
|
||||
|
||||
```text
|
||||
$ cargo build
|
||||
Compiling hello_cargo v0.1.0 (file:///projects/hello_cargo)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 2.85 secs
|
||||
```
|
||||
|
||||
This creates an executable file in *target/debug/hello_cargo* (or
|
||||
*target\\debug\\hello_cargo.exe* on Windows), which you can run with this
|
||||
command:
|
||||
|
||||
```text
|
||||
$ ./target/debug/hello_cargo # or .\target\debug\hello_cargo.exe on Windows
|
||||
Hello, world!
|
||||
```
|
||||
|
||||
Bam! If all goes well, `Hello, world!` should print to the terminal once more.
|
||||
Running `cargo build` for the first time also causes Cargo to create a new file
|
||||
at the top level called *Cargo.lock*, which is used to keep track of the exact
|
||||
versions of dependencies in your project. This project doesn’t have
|
||||
dependencies, so the file is a bit sparse. You won’t ever need to touch this
|
||||
file yourself; Cargo will manage its contents for you.
|
||||
|
||||
We just built a project with `cargo build` and ran it with
|
||||
`./target/debug/hello_cargo`, but we can also use `cargo run` to compile and
|
||||
then run all in one go:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/hello_cargo`
|
||||
Hello, world!
|
||||
```
|
||||
|
||||
Notice that this time, we didn’t see the output telling us that Cargo was
|
||||
compiling `hello_cargo`. Cargo figured out that the files haven’t changed, so
|
||||
it just ran the binary. If you had modified your source code, Cargo would have
|
||||
rebuilt the project before running it, and you would have seen output like this:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling hello_cargo v0.1.0 (file:///projects/hello_cargo)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.33 secs
|
||||
Running `target/debug/hello_cargo`
|
||||
Hello, world!
|
||||
```
|
||||
|
||||
Finally, there’s `cargo check`. This command will quickly check your code to
|
||||
make sure that it compiles, but not bother producing an executable:
|
||||
|
||||
```text
|
||||
$ cargo check
|
||||
Compiling hello_cargo v0.1.0 (file:///projects/hello_cargo)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.32 secs
|
||||
```
|
||||
|
||||
Why would you not want an executable? `cargo check` is often much faster than
|
||||
`cargo build`, because it skips the entire step of producing the executable. If
|
||||
you’re checking your work throughout the process of writing the code, using
|
||||
`cargo check` will speed things up! As such, many Rustaceans run `cargo check`
|
||||
periodically as they write their program to make sure that it compiles, and
|
||||
then run `cargo build` once they’re ready to give it a spin themselves.
|
||||
|
||||
So to recap, using Cargo:
|
||||
|
||||
- We can build a project using `cargo build` or `cargo check`
|
||||
- We can build and run the project in one step with `cargo run`
|
||||
- Instead of the result of the build being put in the same directory as our
|
||||
code, Cargo will put it in the *target/debug* directory.
|
||||
|
||||
A final advantage of using Cargo is that the commands are the same no matter
|
||||
what operating system you’re on, so at this point we will no longer be
|
||||
providing specific instructions for Linux and Mac versus Windows.
|
||||
|
||||
### Building for Release
|
||||
|
||||
When your project is finally ready for release, you can use `cargo build
|
||||
--release` to compile your project with optimizations. This will create an
|
||||
executable in *target/release* instead of *target/debug*. These optimizations
|
||||
make your Rust code run faster, but turning them on increases the compilation
|
||||
time of your program. This is why there are two different profiles: one for
|
||||
development when you want to be able to rebuild quickly and often, and one for
|
||||
building the final program you’ll give to a user that won’t be rebuilt
|
||||
repeatedly and that will run as fast as possible. If you’re benchmarking the
|
||||
running time of your code, be sure to run `cargo build --release` and benchmark
|
||||
with the executable in *target/release*.
|
||||
|
||||
### Cargo as Convention
|
||||
|
||||
With simple projects, Cargo doesn’t provide a whole lot of value over just
|
||||
using `rustc`, but it will prove its worth as you continue. With complex
|
||||
projects composed of multiple crates, it’s much easier to let Cargo coordinate
|
||||
the build.
|
||||
|
||||
Even though the `hello_cargo` project is simple, it now uses much of the real
|
||||
tooling you’ll use for the rest of your Rust career. In fact, to work on any
|
||||
existing projects you can use the following commands to check out the code
|
||||
using Git, change into the project directory, and build:
|
||||
|
||||
```text
|
||||
$ git clone someurl.com/someproject
|
||||
$ cd someproject
|
||||
$ cargo build
|
||||
```
|
||||
|
||||
If you want to look at Cargo in more detail, check out [its documentation].
|
||||
|
||||
[its documentation]: https://doc.rust-lang.org/cargo/
|
||||
|
||||
<!--Below -- I`m not sure this is the place for this conversation, it seems too
|
||||
deep into the weeds for the "getting started" chapter. I know we discussed
|
||||
Nightly Rust as an appendix previously, but honestly I think this is more
|
||||
suited somewhere online, perhaps in the extended docs. I like the idea of
|
||||
finishing the chapter here, on this practical note, and I think at this point
|
||||
readers will want to get stuck in anyway and may skip this and never come back
|
||||
because it's buried at the end of a chapter that's not really related to it. If
|
||||
it's online somewhere separate they can come to it when they're ready. What do
|
||||
you think?-->
|
||||
<!-- Ok, I can see that. /Carol -->
|
||||
|
||||
## Summary
|
||||
|
||||
You’re already off to a great start on your Rust journey! In this chapter,
|
||||
you’ve:
|
||||
|
||||
* Installed the latest stable version of Rust
|
||||
* Written a “Hello, world!” program using both `rustc` directly and using
|
||||
the conventions of `cargo`
|
||||
|
||||
This is a great time to build a more substantial program, to get used to
|
||||
reading and writing Rust code. In the next chapter, we’ll build a guessing game
|
||||
program. If you’d rather start by learning about how common programming
|
||||
concepts work in Rust, see Chapter 3.
|
||||
1011
2018-edition/src/ch02-00-guessing-game-tutorial.md
Normal file
1011
2018-edition/src/ch02-00-guessing-game-tutorial.md
Normal file
File diff suppressed because it is too large
Load Diff
21
2018-edition/src/ch03-00-common-programming-concepts.md
Normal file
21
2018-edition/src/ch03-00-common-programming-concepts.md
Normal file
@@ -0,0 +1,21 @@
|
||||
# Common Programming Concepts
|
||||
|
||||
This chapter covers concepts that appear in almost every programming language
|
||||
and how they work in Rust. Many programming languages have much in common at
|
||||
their core. None of the concepts presented in this chapter are unique to Rust,
|
||||
but we’ll discuss them in the context of Rust and explain the conventions
|
||||
around using these concepts.
|
||||
|
||||
Specifically, you’ll learn about variables, basic types, functions, comments,
|
||||
and control flow. These foundations will be in every Rust program, and learning
|
||||
them early will give you a strong core to start from.
|
||||
|
||||
> ### Keywords
|
||||
>
|
||||
> The Rust language has a set of *keywords* that are reserved for use by
|
||||
> the language only, much as in other languages. Keep in mind that you cannot
|
||||
> use these words as names of variables or functions. Most of the keywords have
|
||||
> special meanings, and you’ll be using them to do various tasks in your Rust
|
||||
> programs; a few have no current functionality associated with them but have
|
||||
> been reserved for functionality that might be added to Rust in the future. You
|
||||
> can find a list of the keywords in Appendix A.
|
||||
228
2018-edition/src/ch03-01-variables-and-mutability.md
Normal file
228
2018-edition/src/ch03-01-variables-and-mutability.md
Normal file
@@ -0,0 +1,228 @@
|
||||
## Variables and Mutability
|
||||
|
||||
As mentioned in Chapter 2, by default variables are immutable. This is one of
|
||||
many nudges Rust gives you to write your code in a way that takes advantage of
|
||||
the safety and easy concurrency that Rust offers. However, you still have the
|
||||
option to make your variables mutable. Let’s explore how and why Rust
|
||||
encourages you to favor immutability and why sometimes you might want to opt
|
||||
out.
|
||||
|
||||
When a variable is immutable, once a value is bound to a name, you can’t change
|
||||
that value. To illustrate this, let’s generate a new project called *variables*
|
||||
in your *projects* directory by using `cargo new --bin variables`.
|
||||
|
||||
Then, in your new *variables* directory, open *src/main.rs* and replace its
|
||||
code with the following code that won’t compile just yet:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let x = 5;
|
||||
println!("The value of x is: {}", x);
|
||||
x = 6;
|
||||
println!("The value of x is: {}", x);
|
||||
}
|
||||
```
|
||||
|
||||
Save and run the program using `cargo run`. You should receive an error
|
||||
message, as shown in this output:
|
||||
|
||||
```text
|
||||
error[E0384]: cannot assign twice to immutable variable `x`
|
||||
--> src/main.rs:4:5
|
||||
|
|
||||
2 | let x = 5;
|
||||
| - first assignment to `x`
|
||||
3 | println!("The value of x is: {}", x);
|
||||
4 | x = 6;
|
||||
| ^^^^^ cannot assign twice to immutable variable
|
||||
```
|
||||
|
||||
This example shows how the compiler helps you find errors in your programs.
|
||||
Even though compiler errors can be frustrating, they only mean your program
|
||||
isn’t safely doing what you want it to do yet; they do *not* mean that you’re
|
||||
not a good programmer! Experienced Rustaceans still get compiler errors.
|
||||
|
||||
The error indicates that the cause of the error is that you `cannot assign twice
|
||||
to immutable variable x`, because you tried to assign a second value to the
|
||||
immutable `x` variable.
|
||||
|
||||
It’s important that we get compile-time errors when we attempt to change a
|
||||
value that we previously designated as immutable because this very situation
|
||||
can lead to bugs. If one part of our code operates on the assumption that a
|
||||
value will never change and another part of our code changes that value, it’s
|
||||
possible that the first part of the code won’t do what it was designed to do.
|
||||
The cause of this kind of bug can be difficult to track down after the fact,
|
||||
especially when the second piece of code changes the value only *sometimes*.
|
||||
|
||||
In Rust, the compiler guarantees that when you state that a value won’t change,
|
||||
it really won’t change. That means that when you’re reading and writing code,
|
||||
you don’t have to keep track of how and where a value might change. Your code
|
||||
is thus easier to reason through.
|
||||
|
||||
But mutability can be very useful. Variables are immutable only by default; as
|
||||
you did in Chapter 2, you can make them mutable by adding `mut` in front of the
|
||||
variable name. In addition to allowing this value to change, `mut` conveys
|
||||
intent to future readers of the code by indicating that other parts of the code
|
||||
will be changing this variable value.
|
||||
|
||||
For example, let’s change *src/main.rs* to the following:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let mut x = 5;
|
||||
println!("The value of x is: {}", x);
|
||||
x = 6;
|
||||
println!("The value of x is: {}", x);
|
||||
}
|
||||
```
|
||||
|
||||
When we run the program now, we get this:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling variables v0.1.0 (file:///projects/variables)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.30 secs
|
||||
Running `target/debug/variables`
|
||||
The value of x is: 5
|
||||
The value of x is: 6
|
||||
```
|
||||
|
||||
We’re allowed to change the value that `x` binds to from `5` to `6` when `mut`
|
||||
is used. In some cases, you’ll want to make a variable mutable because it makes
|
||||
the code more convenient to write than if it had only immutable variables.
|
||||
|
||||
There are multiple trade-offs to consider in addition to the prevention of
|
||||
bugs. For example, in cases where you’re using large data structures, mutating
|
||||
an instance in place may be faster than copying and returning newly allocated
|
||||
instances. With smaller data structures, creating new instances and writing in
|
||||
a more functional programming style may be easier to think through, so lower
|
||||
performance might be a worthwhile penalty for gaining that clarity.
|
||||
|
||||
### Differences Between Variables and Constants
|
||||
|
||||
Being unable to change the value of a variable might have reminded you of
|
||||
another programming concept that most other languages have: *constants*. Like
|
||||
immutable variables, constants are values that are bound to a name and are not
|
||||
allowed to change, but there are a few differences between constants and
|
||||
variables.
|
||||
|
||||
First, you aren’t allowed to use `mut` with constants. Constants aren’t just
|
||||
immutable by default—they’re always immutable.
|
||||
|
||||
You declare constants using the `const` keyword instead of the `let` keyword,
|
||||
and the type of the value *must* be annotated. We’re about to cover types and
|
||||
type annotations in the next section, “Data Types,” so don’t worry about the
|
||||
details right now. Just know that you must always annotate the type.
|
||||
|
||||
Constants can be declared in any scope, including the global scope, which makes
|
||||
them useful for values that many parts of code need to know about.
|
||||
|
||||
The last difference is that constants may be set only to a constant expression,
|
||||
not the result of a function call or any other value that could only be
|
||||
computed at runtime.
|
||||
|
||||
Here’s an example of a constant declaration where the constant’s name is
|
||||
`MAX_POINTS` and its value is set to 100,000. (Rust’s constant naming
|
||||
convention is to use all uppercase with underscores between words):
|
||||
|
||||
```rust
|
||||
const MAX_POINTS: u32 = 100_000;
|
||||
```
|
||||
|
||||
Constants are valid for the entire time a program runs, within the scope they
|
||||
were declared in, making them a useful choice for values in your application
|
||||
domain that multiple parts of the program might need to know about, such as the
|
||||
maximum number of points any player of a game is allowed to earn or the speed
|
||||
of light.
|
||||
|
||||
Naming hardcoded values used throughout your program as constants is useful in
|
||||
conveying the meaning of that value to future maintainers of the code. It also
|
||||
helps to have only one place in your code you would need to change if the
|
||||
hardcoded value needed to be updated in the future.
|
||||
|
||||
### Shadowing
|
||||
|
||||
As you saw in the “Comparing the Guess to the Secret Number” section in Chapter
|
||||
2, you can declare a new variable with the same name as a previous variable,
|
||||
and the new variable shadows the previous variable. Rustaceans say that the
|
||||
first variable is *shadowed* by the second, which means that the second
|
||||
variable’s value is what appears when the variable is used. We can shadow a
|
||||
variable by using the same variable’s name and repeating the use of the `let`
|
||||
keyword as follows:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let x = 5;
|
||||
|
||||
let x = x + 1;
|
||||
|
||||
let x = x * 2;
|
||||
|
||||
println!("The value of x is: {}", x);
|
||||
}
|
||||
```
|
||||
|
||||
This program first binds `x` to a value of `5`. Then it shadows `x` by
|
||||
repeating `let x =`, taking the original value and adding `1` so the value of
|
||||
`x` is then `6`. The third `let` statement also shadows `x`, multiplying the
|
||||
previous value by `2` to give `x` a final value of `12`. When we run this
|
||||
program, it will output the following:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling variables v0.1.0 (file:///projects/variables)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.31 secs
|
||||
Running `target/debug/variables`
|
||||
The value of x is: 12
|
||||
```
|
||||
|
||||
Shadowing is different than marking a variable as `mut`, because we’ll get a
|
||||
compile-time error if we accidentally try to reassign to this variable without
|
||||
using the `let` keyword. By using `let`, we can perform a few transformations
|
||||
on a value but have the variable be immutable after those transformations have
|
||||
been completed.
|
||||
|
||||
The other difference between `mut` and shadowing is that because we’re
|
||||
effectively creating a new variable when we use the `let` keyword again, we can
|
||||
change the type of the value but reuse the same name. For example, say our
|
||||
program asks a user to show how many spaces they want between some text by
|
||||
inputting space characters, but we really want to store that input as a number:
|
||||
|
||||
```rust
|
||||
let spaces = " ";
|
||||
let spaces = spaces.len();
|
||||
```
|
||||
|
||||
This construct is allowed because the first `spaces` variable is a string type
|
||||
and the second `spaces` variable, which is a brand-new variable that happens to
|
||||
have the same name as the first one, is a number type. Shadowing thus spares us
|
||||
from having to come up with different names, such as `spaces_str` and
|
||||
`spaces_num`; instead, we can reuse the simpler `spaces` name. However, if we
|
||||
try to use `mut` for this, as shown here, we’ll get a compile-time error:
|
||||
|
||||
```rust,ignore
|
||||
let mut spaces = " ";
|
||||
spaces = spaces.len();
|
||||
```
|
||||
|
||||
The error says we’re not allowed to mutate a variable’s type:
|
||||
|
||||
```text
|
||||
error[E0308]: mismatched types
|
||||
--> src/main.rs:3:14
|
||||
|
|
||||
3 | spaces = spaces.len();
|
||||
| ^^^^^^^^^^^^ expected &str, found usize
|
||||
|
|
||||
= note: expected type `&str`
|
||||
found type `usize`
|
||||
```
|
||||
|
||||
Now that we’ve explored how variables work, let’s look at more data types they
|
||||
can have.
|
||||
364
2018-edition/src/ch03-02-data-types.md
Normal file
364
2018-edition/src/ch03-02-data-types.md
Normal file
@@ -0,0 +1,364 @@
|
||||
## Data Types
|
||||
|
||||
Every value in Rust is of a certain *data type*, which tells Rust what kind of
|
||||
data is being specified so it knows how to work with that data. We’ll look at
|
||||
two data type subsets: scalar and compound.
|
||||
|
||||
Keep in mind that Rust is a *statically typed* language, which means that it
|
||||
must know the types of all variables at compile time. The compiler can usually
|
||||
infer what type we want to use based on the value and how we use it. In cases
|
||||
when many types are possible, such as when we converted a `String` to a numeric
|
||||
type using `parse` in the “Comparing the Guess to the Secret Number” section in
|
||||
Chapter 2, we must add a type annotation, like this:
|
||||
|
||||
```rust
|
||||
let guess: u32 = "42".parse().expect("Not a number!");
|
||||
```
|
||||
|
||||
If we don’t add the type annotation here, Rust will display the following
|
||||
error, which means the compiler needs more information from us to know which
|
||||
type we want to use:
|
||||
|
||||
```text
|
||||
error[E0282]: type annotations needed
|
||||
--> src/main.rs:2:9
|
||||
|
|
||||
2 | let guess = "42".parse().expect("Not a number!");
|
||||
| ^^^^^
|
||||
| |
|
||||
| cannot infer type for `_`
|
||||
| consider giving `guess` a type
|
||||
```
|
||||
|
||||
You’ll see different type annotations for other data types.
|
||||
|
||||
### Scalar Types
|
||||
|
||||
A *scalar* type represents a single value. Rust has four primary scalar types:
|
||||
integers, floating-point numbers, Booleans, and characters. You may recognize
|
||||
these from other programming languages. Let’s jump into how they work in Rust.
|
||||
|
||||
#### Integer Types
|
||||
|
||||
An *integer* is a number without a fractional component. We used one integer
|
||||
type in Chapter 2, the `u32` type. This type declaration indicates that the
|
||||
value it’s associated with should be an unsigned integer (signed integer types
|
||||
start with `i`, instead of `u`) that takes up 32 bits of space. Table 3-1 shows
|
||||
the built-in integer types in Rust. Each variant in the Signed and Unsigned
|
||||
columns (for example, `i16`) can be used to declare the type of an integer
|
||||
value.
|
||||
|
||||
<span class="caption">Table 3-1: Integer Types in Rust</span>
|
||||
|
||||
| Length | Signed | Unsigned |
|
||||
|--------|---------|----------|
|
||||
| 8-bit | `i8` | `u8` |
|
||||
| 16-bit | `i16` | `u16` |
|
||||
| 32-bit | `i32` | `u32` |
|
||||
| 64-bit | `i64` | `u64` |
|
||||
| arch | `isize` | `usize` |
|
||||
|
||||
Each variant can be either signed or unsigned and has an explicit size.
|
||||
*Signed* and *unsigned* refer to whether it’s possible for the number to be
|
||||
negative or positive—in other words, whether the number needs to have a sign
|
||||
with it (signed) or whether it will only ever be positive and can therefore be
|
||||
represented without a sign (unsigned). It’s like writing numbers on paper: when
|
||||
the sign matters, a number is shown with a plus sign or a minus sign; however,
|
||||
when it’s safe to assume the number is positive, it’s shown with no sign.
|
||||
Signed numbers are stored using two’s complement representation (if you’re
|
||||
unsure what this is, you can search for it online; an explanation is outside
|
||||
the scope of this book).
|
||||
|
||||
Each signed variant can store numbers from -(2<sup>n - 1</sup>) to 2<sup>n -
|
||||
1</sup> - 1 inclusive, where *n* is the number of bits that variant uses. So an
|
||||
`i8` can store numbers from -(2<sup>7</sup>) to 2<sup>7</sup> - 1, which equals
|
||||
-128 to 127. Unsigned variants can store numbers from 0 to 2<sup>n</sup> - 1,
|
||||
so a `u8` can store numbers from 0 to 2<sup>8</sup> - 1, which equals 0 to 255.
|
||||
|
||||
Additionally, the `isize` and `usize` types depend on the kind of computer your
|
||||
program is running on: 64 bits if you’re on a 64-bit architecture and 32 bits
|
||||
if you’re on a 32-bit architecture.
|
||||
|
||||
You can write integer literals in any of the forms shown in Table 3-2. Note
|
||||
that all number literals except the byte literal allow a type suffix, such as
|
||||
`57u8`, and `_` as a visual separator, such as `1_000`.
|
||||
|
||||
<span class="caption">Table 3-2: Integer Literals in Rust</span>
|
||||
|
||||
| Number literals | Example |
|
||||
|------------------|---------------|
|
||||
| Decimal | `98_222` |
|
||||
| Hex | `0xff` |
|
||||
| Octal | `0o77` |
|
||||
| Binary | `0b1111_0000` |
|
||||
| Byte (`u8` only) | `b'A'` |
|
||||
|
||||
So how do you know which type of integer to use? If you’re unsure, Rust’s
|
||||
defaults are generally good choices, and integer types default to `i32`: this
|
||||
type is generally the fastest, even on 64-bit systems. The primary situation in
|
||||
which you’d use `isize` or `usize` is when indexing some sort of collection.
|
||||
|
||||
#### Floating-Point Types
|
||||
|
||||
Rust also has two primitive types for *floating-point numbers*, which are
|
||||
numbers with decimal points. Rust’s floating-point types are `f32` and `f64`,
|
||||
which are 32 bits and 64 bits in size, respectively. The default type is `f64`
|
||||
because on modern CPUs it’s roughly the same speed as `f32` but is capable of
|
||||
more precision.
|
||||
|
||||
Here’s an example that shows floating-point numbers in action:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let x = 2.0; // f64
|
||||
|
||||
let y: f32 = 3.0; // f32
|
||||
}
|
||||
```
|
||||
|
||||
Floating-point numbers are represented according to the IEEE-754 standard. The
|
||||
`f32` type is a single-precision float, and `f64` has double precision.
|
||||
|
||||
#### Numeric Operations
|
||||
|
||||
Rust supports the basic mathematical operations you’d expect for all of the
|
||||
number types: addition, subtraction, multiplication, division, and remainder.
|
||||
The following code shows how you’d use each one in a `let` statement:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
// addition
|
||||
let sum = 5 + 10;
|
||||
|
||||
// subtraction
|
||||
let difference = 95.5 - 4.3;
|
||||
|
||||
// multiplication
|
||||
let product = 4 * 30;
|
||||
|
||||
// division
|
||||
let quotient = 56.7 / 32.2;
|
||||
|
||||
// remainder
|
||||
let remainder = 43 % 5;
|
||||
}
|
||||
```
|
||||
|
||||
Each expression in these statements uses a mathematical operator and evaluates
|
||||
to a single value, which is then bound to a variable. Appendix B contains a
|
||||
list of all operators that Rust provides.
|
||||
|
||||
#### The Boolean Type
|
||||
|
||||
As in most other programming languages, a Boolean type in Rust has two possible
|
||||
values: `true` and `false`. The Boolean type in Rust is specified using `bool`.
|
||||
For example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let t = true;
|
||||
|
||||
let f: bool = false; // with explicit type annotation
|
||||
}
|
||||
```
|
||||
|
||||
The main way to consume Boolean values is through conditionals, such as an `if`
|
||||
expression. We’ll cover how `if` expressions work in Rust in the “Control Flow”
|
||||
section.
|
||||
|
||||
#### The Character Type
|
||||
|
||||
So far we’ve worked only with numbers, but Rust supports letters too. Rust’s
|
||||
`char` type is the language’s most primitive alphabetic type, and the following
|
||||
code shows one way to use it. (Note that the `char` type is specified with
|
||||
single quotes, as opposed to strings, which use double quotes.)
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let c = 'z';
|
||||
let z = 'ℤ';
|
||||
let heart_eyed_cat = '😻';
|
||||
}
|
||||
```
|
||||
|
||||
Rust’s `char` type represents a Unicode Scalar Value, which means it can
|
||||
represent a lot more than just ASCII. Accented letters; Chinese, Japanese, and
|
||||
Korean ideographs; emoji; and zero-width spaces are all valid `char` values in
|
||||
Rust. Unicode Scalar Values range from `U+0000` to `U+D7FF` and `U+E000` to
|
||||
`U+10FFFF` inclusive. However, a “character” isn’t really a concept in Unicode,
|
||||
so your human intuition for what a “character” is may not match up with what a
|
||||
`char` is in Rust. We’ll discuss this topic in detail in “Strings” in Chapter 8.
|
||||
|
||||
### Compound Types
|
||||
|
||||
*Compound types* can group multiple values into one type. Rust has two
|
||||
primitive compound types: tuples and arrays.
|
||||
|
||||
#### The Tuple Type
|
||||
|
||||
A tuple is a general way of grouping together some number of other values with
|
||||
a variety of types into one compound type.
|
||||
|
||||
We create a tuple by writing a comma-separated list of values inside
|
||||
parentheses. Each position in the tuple has a type, and the types of the
|
||||
different values in the tuple don’t have to be the same. We’ve added optional
|
||||
type annotations in this example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let tup: (i32, f64, u8) = (500, 6.4, 1);
|
||||
}
|
||||
```
|
||||
|
||||
The variable `tup` binds to the entire tuple, because a tuple is considered a
|
||||
single compound element. To get the individual values out of a tuple, we can
|
||||
use pattern matching to destructure a tuple value, like this:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let tup = (500, 6.4, 1);
|
||||
|
||||
let (x, y, z) = tup;
|
||||
|
||||
println!("The value of y is: {}", y);
|
||||
}
|
||||
```
|
||||
|
||||
This program first creates a tuple and binds it to the variable `tup`. It then
|
||||
uses a pattern with `let` to take `tup` and turn it into three separate
|
||||
variables, `x`, `y`, and `z`. This is called *destructuring*, because it breaks
|
||||
the single tuple into three parts. Finally, the program prints the value of
|
||||
`y`, which is `6.4`.
|
||||
|
||||
In addition to destructuring through pattern matching, we can access a tuple
|
||||
element directly by using a period (`.`) followed by the index of the value we
|
||||
want to access. For example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let x: (i32, f64, u8) = (500, 6.4, 1);
|
||||
|
||||
let five_hundred = x.0;
|
||||
|
||||
let six_point_four = x.1;
|
||||
|
||||
let one = x.2;
|
||||
}
|
||||
```
|
||||
|
||||
This program creates a tuple, `x`, and then makes new variables for each
|
||||
element by using their index. As with most programming languages, the first
|
||||
index in a tuple is 0.
|
||||
|
||||
#### The Array Type
|
||||
|
||||
Another way to have a collection of multiple values is with an *array*. Unlike
|
||||
a tuple, every element of an array must have the same type. Arrays in Rust are
|
||||
different from arrays in some other languages because arrays in Rust have a
|
||||
fixed length: once declared, they cannot grow or shrink in size.
|
||||
|
||||
In Rust, the values going into an array are written as a comma-separated list
|
||||
inside square brackets:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let a = [1, 2, 3, 4, 5];
|
||||
}
|
||||
```
|
||||
|
||||
Arrays are useful when you want your data allocated on the stack rather than
|
||||
the heap (we will discuss the stack and the heap more in Chapter 4), or when
|
||||
you want to ensure you always have a fixed number of elements. An array isn’t
|
||||
as flexible as the vector type, though. A vector is a similar collection type
|
||||
provided by the standard library that *is* allowed to grow or shrink in size.
|
||||
If you’re unsure whether to use an array or a vector, you should probably use a
|
||||
vector. Chapter 8 discusses vectors in more detail.
|
||||
|
||||
An example of when you might want to use an array rather than a vector is in a
|
||||
program that needs to know the names of the months of the year. It’s very
|
||||
unlikely that such a program will need to add or remove months, so you can use
|
||||
an array because you know it will always contain 12 items:
|
||||
|
||||
```rust
|
||||
let months = ["January", "February", "March", "April", "May", "June", "July",
|
||||
"August", "September", "October", "November", "December"];
|
||||
```
|
||||
|
||||
##### Accessing Array Elements
|
||||
|
||||
An array is a single chunk of memory allocated on the stack. You can access
|
||||
elements of an array using indexing, like this:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let a = [1, 2, 3, 4, 5];
|
||||
|
||||
let first = a[0];
|
||||
let second = a[1];
|
||||
}
|
||||
```
|
||||
|
||||
In this example, the variable named `first` will get the value `1`, because
|
||||
that is the value at index `[0]` in the array. The variable named `second` will
|
||||
get the value `2` from index `[1]` in the array.
|
||||
|
||||
##### Invalid Array Element Access
|
||||
|
||||
What happens if you try to access an element of an array that is past the end
|
||||
of the array? Say you change the example to the following code, which will
|
||||
compile but exit with an error when it runs:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let a = [1, 2, 3, 4, 5];
|
||||
let index = 10;
|
||||
|
||||
let element = a[index];
|
||||
|
||||
println!("The value of element is: {}", element);
|
||||
}
|
||||
```
|
||||
|
||||
Running this code using `cargo run` produces the following result:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling arrays v0.1.0 (file:///projects/arrays)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.31 secs
|
||||
Running `target/debug/arrays`
|
||||
thread '<main>' panicked at 'index out of bounds: the len is 5 but the index is
|
||||
10', src/main.rs:6
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
```
|
||||
|
||||
The compilation didn’t produce any errors, but the program resulted in a
|
||||
*runtime* error and didn’t exit successfully. When you attempt to access an
|
||||
element using indexing, Rust will check that the index you’ve specified is less
|
||||
than the array length. If the index is greater than the length, Rust will
|
||||
*panic*, which is the term Rust uses when a program exits with an error.
|
||||
|
||||
This is the first example of Rust’s safety principles in action. In many
|
||||
low-level languages, this kind of check is not done, and when you provide an
|
||||
incorrect index, invalid memory can be accessed. Rust protects you against this
|
||||
kind of error by immediately exiting instead of allowing the memory access and
|
||||
continuing. Chapter 9 discusses more of Rust’s error handling.
|
||||
346
2018-edition/src/ch03-03-how-functions-work.md
Normal file
346
2018-edition/src/ch03-03-how-functions-work.md
Normal file
@@ -0,0 +1,346 @@
|
||||
## Functions
|
||||
|
||||
Functions are pervasive in Rust code. You’ve already seen one of the most
|
||||
important functions in the language: the `main` function, which is the entry
|
||||
point of many programs. You’ve also seen the `fn` keyword, which allows you to
|
||||
declare new functions.
|
||||
|
||||
Rust code uses *snake case* as the conventional style for function and variable
|
||||
names. In snake case, all letters are lowercase and underscores separate words.
|
||||
Here’s a program that contains an example function definition:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
println!("Hello, world!");
|
||||
|
||||
another_function();
|
||||
}
|
||||
|
||||
fn another_function() {
|
||||
println!("Another function.");
|
||||
}
|
||||
```
|
||||
|
||||
Function definitions in Rust start with `fn` and have a set of parentheses
|
||||
after the function name. The curly brackets tell the compiler where the
|
||||
function body begins and ends.
|
||||
|
||||
We can call any function we’ve defined by entering its name followed by a set
|
||||
of parentheses. Because `another_function` is defined in the program, it can be
|
||||
called from inside the `main` function. Note that we defined `another_function`
|
||||
*after* the `main` function in the source code; we could have defined it before
|
||||
as well. Rust doesn’t care where you define your functions, only that they’re
|
||||
defined somewhere.
|
||||
|
||||
Let’s start a new binary project named *functions* to explore functions
|
||||
further. Place the `another_function` example in *src/main.rs* and run it. You
|
||||
should see the following output:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling functions v0.1.0 (file:///projects/functions)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.28 secs
|
||||
Running `target/debug/functions`
|
||||
Hello, world!
|
||||
Another function.
|
||||
```
|
||||
|
||||
The lines execute in the order in which they appear in the `main` function.
|
||||
First, the “Hello, world!” message prints, and then `another_function` is
|
||||
called and its message is printed.
|
||||
|
||||
### Function Parameters
|
||||
|
||||
Functions can also be defined to have *parameters*, which are special variables
|
||||
that are part of a function’s signature. When a function has parameters, you
|
||||
can provide it with concrete values for those parameters. Technically, the
|
||||
concrete values are called *arguments*, but in casual conversation, people tend
|
||||
to use the words *parameter* and *argument* interchangeably for either the
|
||||
variables in a function’s definition or the concrete values passed in when you
|
||||
call a function.
|
||||
|
||||
The following rewritten version of `another_function` shows what parameters
|
||||
look like in Rust:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
another_function(5);
|
||||
}
|
||||
|
||||
fn another_function(x: i32) {
|
||||
println!("The value of x is: {}", x);
|
||||
}
|
||||
```
|
||||
|
||||
Try running this program; you should get the following output:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling functions v0.1.0 (file:///projects/functions)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 1.21 secs
|
||||
Running `target/debug/functions`
|
||||
The value of x is: 5
|
||||
```
|
||||
|
||||
The declaration of `another_function` has one parameter named `x`. The type of
|
||||
`x` is specified as `i32`. When `5` is passed to `another_function`, the
|
||||
`println!` macro puts `5` where the pair of curly brackets were in the format
|
||||
string.
|
||||
|
||||
In function signatures, you *must* declare the type of each parameter. This is
|
||||
a deliberate decision in Rust’s design: requiring type annotations in function
|
||||
definitions means the compiler almost never needs you to use them elsewhere in
|
||||
the code to figure out what you mean.
|
||||
|
||||
When you want a function to have multiple parameters, separate the parameter
|
||||
declarations with commas, like this:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
another_function(5, 6);
|
||||
}
|
||||
|
||||
fn another_function(x: i32, y: i32) {
|
||||
println!("The value of x is: {}", x);
|
||||
println!("The value of y is: {}", y);
|
||||
}
|
||||
```
|
||||
|
||||
This example creates a function with two parameters, both of which are `i32`
|
||||
types. The function then prints the values in both of its parameters. Note that
|
||||
function parameters don’t all need to be the same type, they just happen to be
|
||||
in this example.
|
||||
|
||||
Let’s try running this code. Replace the program currently in your *functions*
|
||||
project’s *src/main.rs* file with the preceding example and run it using `cargo
|
||||
run`:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling functions v0.1.0 (file:///projects/functions)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.31 secs
|
||||
Running `target/debug/functions`
|
||||
The value of x is: 5
|
||||
The value of y is: 6
|
||||
```
|
||||
|
||||
Because we called the function with `5` as the value for `x` and `6` is passed
|
||||
as the value for `y`, the two strings are printed with these values.
|
||||
|
||||
### Function Bodies
|
||||
|
||||
Function bodies are made up of a series of statements optionally ending in an
|
||||
expression. So far, we’ve only covered functions without an ending expression,
|
||||
but you have seen an expression as part of statements. Because Rust is an
|
||||
expression-based language, this is an important distinction to understand.
|
||||
Other languages don’t have the same distinctions, so let’s look at what
|
||||
statements and expressions are and how their differences affect the bodies of
|
||||
functions.
|
||||
|
||||
### Statements and Expressions
|
||||
|
||||
We’ve actually already used statements and expressions. *Statements* are
|
||||
instructions that perform some action and do not return a value. *Expressions*
|
||||
evaluate to a resulting value. Let’s look at some examples.
|
||||
|
||||
Creating a variable and assigning a value to it with the `let` keyword is a
|
||||
statement. In Listing 3-1, `let y = 6;` is a statement:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let y = 6;
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 3-1: A `main` function declaration containing one statement</span>
|
||||
|
||||
Function definitions are also statements; the entire preceding example is a
|
||||
statement in itself.
|
||||
|
||||
Statements do not return values. Therefore, you can’t assign a `let` statement
|
||||
to another variable, as the following code tries to do; you’ll get an error:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let x = (let y = 6);
|
||||
}
|
||||
```
|
||||
|
||||
When you run this program, the error you’ll get looks like this:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling functions v0.1.0 (file:///projects/functions)
|
||||
error: expected expression, found statement (`let`)
|
||||
--> src/main.rs:2:14
|
||||
|
|
||||
2 | let x = (let y = 6);
|
||||
| ^^^
|
||||
|
|
||||
= note: variable declaration using `let` is a statement
|
||||
```
|
||||
|
||||
The `let y = 6` statement does not return a value, so there isn’t anything for
|
||||
`x` to bind to. This is different from what happens in other languages, such as
|
||||
C and Ruby, where the assignment returns the value of the assignment. In those
|
||||
languages, you can write `x = y = 6` and have both `x` and `y` have the value
|
||||
`6`; that is not the case in Rust.
|
||||
|
||||
Expressions evaluate to something and make up most of the rest of the code that
|
||||
you’ll write in Rust. Consider a simple math operation, such as `5 + 6`, which
|
||||
is an expression that evaluates to the value `11`. Expressions can be part of
|
||||
statements: in Listing 3-1, the `6` in the statement `let y = 6;` is an
|
||||
expression that evaluates to the value `6`. Calling a function is an
|
||||
expression. Calling a macro is an expression. The block that we use to create
|
||||
new scopes, `{}`, is an expression, for example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let x = 5;
|
||||
|
||||
let y = {
|
||||
let x = 3;
|
||||
x + 1
|
||||
};
|
||||
|
||||
println!("The value of y is: {}", y);
|
||||
}
|
||||
```
|
||||
|
||||
This expression:
|
||||
|
||||
```rust,ignore
|
||||
{
|
||||
let x = 3;
|
||||
x + 1
|
||||
}
|
||||
```
|
||||
|
||||
is a block that, in this case, evaluates to `4`. That value gets bound to `y`
|
||||
as part of the `let` statement. Note the `x + 1` line without a semicolon at
|
||||
the end, which is unlike most of the lines you’ve seen so far. Expressions do
|
||||
not include ending semicolons. If you add a semicolon to the end of an
|
||||
expression, you turn it into a statement, which will then not return a value.
|
||||
Keep this in mind as you explore function return values and expressions next.
|
||||
|
||||
### Functions with Return Values
|
||||
|
||||
Functions can return values to the code that calls them. We don’t name return
|
||||
values, but we do declare their type after an arrow (`->`). In Rust, the return
|
||||
value of the function is synonymous with the value of the final expression in
|
||||
the block of the body of a function. You can return early from a function by
|
||||
using the `return` keyword and specifying a value, but most functions return
|
||||
the last expression implicitly. Here’s an example of a function that returns a
|
||||
value:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn five() -> i32 {
|
||||
5
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let x = five();
|
||||
|
||||
println!("The value of x is: {}", x);
|
||||
}
|
||||
```
|
||||
|
||||
There are no function calls, macros, or even `let` statements in the `five`
|
||||
function—just the number `5` by itself. That’s a perfectly valid function in
|
||||
Rust. Note that the function’s return type is specified, too, as `-> i32`. Try
|
||||
running this code; the output should look like this:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling functions v0.1.0 (file:///projects/functions)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.30 secs
|
||||
Running `target/debug/functions`
|
||||
The value of x is: 5
|
||||
```
|
||||
|
||||
The `5` in `five` is the function’s return value, which is why the return type
|
||||
is `i32`. Let’s examine this in more detail. There are two important bits:
|
||||
first, the line `let x = five();` shows that we’re using the return value of a
|
||||
function to initialize a variable. Because the function `five` returns a `5`,
|
||||
that line is the same as the following:
|
||||
|
||||
```rust
|
||||
let x = 5;
|
||||
```
|
||||
|
||||
Second, the `five` function has no parameters and defines the type of the
|
||||
return value, but the body of the function is a lonely `5` with no semicolon
|
||||
because it’s an expression whose value we want to return.
|
||||
|
||||
Let’s look at another example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let x = plus_one(5);
|
||||
|
||||
println!("The value of x is: {}", x);
|
||||
}
|
||||
|
||||
fn plus_one(x: i32) -> i32 {
|
||||
x + 1
|
||||
}
|
||||
```
|
||||
|
||||
Running this code will print `The value of x is: 6`. But if we place a
|
||||
semicolon at the end of the line containing `x + 1`, changing it from an
|
||||
expression to a statement, we’ll get an error.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let x = plus_one(5);
|
||||
|
||||
println!("The value of x is: {}", x);
|
||||
}
|
||||
|
||||
fn plus_one(x: i32) -> i32 {
|
||||
x + 1;
|
||||
}
|
||||
```
|
||||
|
||||
Running this code produces an error, as follows:
|
||||
|
||||
```text
|
||||
error[E0308]: mismatched types
|
||||
--> src/main.rs:7:28
|
||||
|
|
||||
7 | fn plus_one(x: i32) -> i32 {
|
||||
| ____________________________^
|
||||
8 | | x + 1;
|
||||
| | - help: consider removing this semicolon
|
||||
9 | | }
|
||||
| |_^ expected i32, found ()
|
||||
|
|
||||
= note: expected type `i32`
|
||||
found type `()`
|
||||
```
|
||||
|
||||
The main error message, “mismatched types,” reveals the core issue with this
|
||||
code. The definition of the function `plus_one` says that it will return an
|
||||
`i32`, but statements don’t evaluate to a value, which is expressed by `()`,
|
||||
the empty tuple. Therefore, nothing is returned, which contradicts the function
|
||||
definition and results in an error. In this output, Rust provides a message to
|
||||
possibly help rectify this issue: it suggests removing the semicolon, which
|
||||
would fix the error.
|
||||
47
2018-edition/src/ch03-04-comments.md
Normal file
47
2018-edition/src/ch03-04-comments.md
Normal file
@@ -0,0 +1,47 @@
|
||||
## Comments
|
||||
|
||||
All programmers strive to make their code easy to understand, but sometimes
|
||||
extra explanation is warranted. In these cases, programmers leave notes, or
|
||||
*comments*, in their source code that the compiler will ignore but people
|
||||
reading the source code may find useful.
|
||||
|
||||
Here’s a simple comment:
|
||||
|
||||
```rust
|
||||
// Hello, world.
|
||||
```
|
||||
|
||||
In Rust, comments must start with two slashes and continue until the end of the
|
||||
line. For comments that extend beyond a single line, you’ll need to include
|
||||
`//` on each line, like this:
|
||||
|
||||
```rust
|
||||
// So we’re doing something complicated here, long enough that we need
|
||||
// multiple lines of comments to do it! Whew! Hopefully, this comment will
|
||||
// explain what’s going on.
|
||||
```
|
||||
|
||||
Comments can also be placed at the end of lines containing code:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let lucky_number = 7; // I’m feeling lucky today.
|
||||
}
|
||||
```
|
||||
|
||||
But you’ll more often see them used in this format, with the comment on a
|
||||
separate line above the code it’s annotating:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
// I’m feeling lucky today.
|
||||
let lucky_number = 7;
|
||||
}
|
||||
```
|
||||
|
||||
Rust also has another kind of comment, documentation comments, which we’ll
|
||||
discuss in Chapter 14.
|
||||
462
2018-edition/src/ch03-05-control-flow.md
Normal file
462
2018-edition/src/ch03-05-control-flow.md
Normal file
@@ -0,0 +1,462 @@
|
||||
## Control Flow
|
||||
|
||||
Deciding whether or not to run some code depending on if a condition is true
|
||||
and deciding to run some code repeatedly while a condition is true are basic
|
||||
building blocks in most programming languages. The most common constructs that
|
||||
let you control the flow of execution of Rust code are `if` expressions and
|
||||
loops.
|
||||
|
||||
### `if` Expressions
|
||||
|
||||
An `if` expression allows you to branch your code depending on conditions. You
|
||||
provide a condition and then state, “If this condition is met, run this block
|
||||
of code. If the condition is not met, do not run this block of code.”
|
||||
|
||||
Create a new project called *branches* in your *projects* directory to explore
|
||||
the `if` expression. In the *src/main.rs* file, input the following:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let number = 3;
|
||||
|
||||
if number < 5 {
|
||||
println!("condition was true");
|
||||
} else {
|
||||
println!("condition was false");
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<!-- NEXT PARAGRAPH WRAPPED WEIRD INTENTIONALLY SEE #199 -->
|
||||
|
||||
All `if` expressions start with the keyword `if`, which is followed by a
|
||||
condition. In this case, the condition checks whether or not the variable
|
||||
`number` has a value less than 5. The block of code we want to execute if the
|
||||
condition is true is placed immediately after the condition inside curly
|
||||
brackets. Blocks of code associated with the conditions in `if` expressions are
|
||||
sometimes called *arms*, just like the arms in `match` expressions that we
|
||||
discussed in the “Comparing the Guess to the Secret Number” section of
|
||||
Chapter 2.
|
||||
|
||||
Optionally, we can also include an `else` expression, which we chose
|
||||
to do here, to give the program an alternative block of code to execute should
|
||||
the condition evaluate to false. If you don’t provide an `else` expression and
|
||||
the condition is false, the program will just skip the `if` block and move on
|
||||
to the next bit of code.
|
||||
|
||||
Try running this code; you should see the following output:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling branches v0.1.0 (file:///projects/branches)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.31 secs
|
||||
Running `target/debug/branches`
|
||||
condition was true
|
||||
```
|
||||
|
||||
Let’s try changing the value of `number` to a value that makes the condition
|
||||
`false` to see what happens:
|
||||
|
||||
```rust,ignore
|
||||
let number = 7;
|
||||
```
|
||||
|
||||
Run the program again, and look at the output:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling branches v0.1.0 (file:///projects/branches)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.31 secs
|
||||
Running `target/debug/branches`
|
||||
condition was false
|
||||
```
|
||||
|
||||
It’s also worth noting that the condition in this code *must* be a `bool`. If
|
||||
the condition isn’t a `bool`, we’ll get an error. For example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let number = 3;
|
||||
|
||||
if number {
|
||||
println!("number was three");
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
The `if` condition evaluates to a value of `3` this time, and Rust throws an
|
||||
error:
|
||||
|
||||
```text
|
||||
error[E0308]: mismatched types
|
||||
--> src/main.rs:4:8
|
||||
|
|
||||
4 | if number {
|
||||
| ^^^^^^ expected bool, found integral variable
|
||||
|
|
||||
= note: expected type `bool`
|
||||
found type `{integer}`
|
||||
```
|
||||
|
||||
The error indicates that Rust expected a `bool` but got an integer. Unlike
|
||||
languages such as Ruby and JavaScript, Rust will not automatically try to
|
||||
convert non-Boolean types to a Boolean. You must be explicit and always provide
|
||||
`if` with a Boolean as its condition. If we want the `if` code block to run
|
||||
only when a number is not equal to `0`, for example, we can change the `if`
|
||||
expression to the following:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let number = 3;
|
||||
|
||||
if number != 0 {
|
||||
println!("number was something other than zero");
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Running this code will print `number was something other than zero`.
|
||||
|
||||
#### Handling Multiple Conditions with `else if`
|
||||
|
||||
You can have multiple conditions by combining `if` and `else` in an `else if`
|
||||
expression. For example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let number = 6;
|
||||
|
||||
if number % 4 == 0 {
|
||||
println!("number is divisible by 4");
|
||||
} else if number % 3 == 0 {
|
||||
println!("number is divisible by 3");
|
||||
} else if number % 2 == 0 {
|
||||
println!("number is divisible by 2");
|
||||
} else {
|
||||
println!("number is not divisible by 4, 3, or 2");
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
This program has four possible paths it can take. After running it, you should
|
||||
see the following output:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling branches v0.1.0 (file:///projects/branches)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.31 secs
|
||||
Running `target/debug/branches`
|
||||
number is divisible by 3
|
||||
```
|
||||
|
||||
When this program executes, it checks each `if` expression in turn and executes
|
||||
the first body for which the condition holds true. Note that even though 6 is
|
||||
divisible by 2, we don’t see the output `number is divisible by 2`, nor do we
|
||||
see the `number is not divisible by 4, 3, or 2` text from the `else` block.
|
||||
That’s because Rust only executes the block for the first true condition, and
|
||||
once it finds one, it doesn’t even check the rest.
|
||||
|
||||
Using too many `else if` expressions can clutter your code, so if you have more
|
||||
than one, you might want to refactor your code. Chapter 6 describes a powerful
|
||||
Rust branching construct called `match` for these cases.
|
||||
|
||||
#### Using `if` in a `let` Statement
|
||||
|
||||
Because `if` is an expression, we can use it on the right side of a `let`
|
||||
statement, as in Listing 3-2:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let condition = true;
|
||||
let number = if condition {
|
||||
5
|
||||
} else {
|
||||
6
|
||||
};
|
||||
|
||||
println!("The value of number is: {}", number);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 3-2: Assigning the result of an `if` expression
|
||||
to a variable</span>
|
||||
|
||||
The `number` variable will be bound to a value based on the outcome of the `if`
|
||||
expression. Run this code to see what happens:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling branches v0.1.0 (file:///projects/branches)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.30 secs
|
||||
Running `target/debug/branches`
|
||||
The value of number is: 5
|
||||
```
|
||||
|
||||
Remember that blocks of code evaluate to the last expression in them, and
|
||||
numbers by themselves are also expressions. In this case, the value of the
|
||||
whole `if` expression depends on which block of code executes. This means the
|
||||
values that have the potential to be results from each arm of the `if` must be
|
||||
the same type; in Listing 3-2, the results of both the `if` arm and the `else`
|
||||
arm were `i32` integers. If the types are mismatched, as in the following
|
||||
example, we’ll get an error:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let condition = true;
|
||||
|
||||
let number = if condition {
|
||||
5
|
||||
} else {
|
||||
"six"
|
||||
};
|
||||
|
||||
println!("The value of number is: {}", number);
|
||||
}
|
||||
```
|
||||
|
||||
When we try to run this code, we’ll get an error. The `if` and `else` arms have
|
||||
value types that are incompatible, and Rust indicates exactly where to find the
|
||||
problem in the program:
|
||||
|
||||
```text
|
||||
error[E0308]: if and else have incompatible types
|
||||
--> src/main.rs:4:18
|
||||
|
|
||||
4 | let number = if condition {
|
||||
| __________________^
|
||||
5 | | 5
|
||||
6 | | } else {
|
||||
7 | | "six"
|
||||
8 | | };
|
||||
| |_____^ expected integral variable, found &str
|
||||
|
|
||||
= note: expected type `{integer}`
|
||||
found type `&str`
|
||||
```
|
||||
|
||||
The expression in the `if` block evaluates to an integer, and the expression in
|
||||
the `else` block evaluates to a string. This won’t work because variables must
|
||||
have a single type. Rust needs to know at compile time what type the `number`
|
||||
variable is, definitively, so it can verify at compile time that its type is
|
||||
valid everywhere we use `number`. Rust wouldn’t be able to do that if the type
|
||||
of `number` was only determined at runtime; the compiler would be more complex
|
||||
and would make fewer guarantees about the code if it had to keep track of
|
||||
multiple hypothetical types for any variable.
|
||||
|
||||
### Repetition with Loops
|
||||
|
||||
It’s often useful to execute a block of code more than once. For this task,
|
||||
Rust provides several *loops*. A loop runs through the code inside the loop
|
||||
body to the end and then starts immediately back at the beginning. To
|
||||
experiment with loops, let’s make a new project called *loops*.
|
||||
|
||||
Rust has three kinds of loops: `loop`, `while`, and `for`. Let’s try each one.
|
||||
|
||||
#### Repeating Code with `loop`
|
||||
|
||||
The `loop` keyword tells Rust to execute a block of code over and over again
|
||||
forever or until you explicitly tell it to stop.
|
||||
|
||||
As an example, change the *src/main.rs* file in your *loops* directory to look
|
||||
like this:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
loop {
|
||||
println!("again!");
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
When we run this program, we’ll see `again!` printed over and over continuously
|
||||
until we stop the program manually. Most terminals support a keyboard shortcut,
|
||||
<span class="keystroke">ctrl-c</span>, to halt a program that is stuck in a
|
||||
continual loop. Give it a try:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling loops v0.1.0 (file:///projects/loops)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.29 secs
|
||||
Running `target/debug/loops`
|
||||
again!
|
||||
again!
|
||||
again!
|
||||
again!
|
||||
^Cagain!
|
||||
```
|
||||
|
||||
The symbol `^C` represents where you pressed <span class="keystroke">ctrl-c
|
||||
</span>. You may or may not see the word `again!` printed after the `^C`,
|
||||
depending on where the code was in the loop when it received the halt signal.
|
||||
|
||||
Fortunately, Rust provides another, more reliable way to break out of a loop.
|
||||
You can place the `break` keyword within the loop to tell the program when to
|
||||
stop executing the loop. Recall that we did this in the guessing game in the
|
||||
“Quitting After a Correct Guess” section of Chapter 2 to exit the
|
||||
program when the user won the game by guessing the correct number.
|
||||
|
||||
#### Conditional Loops with `while`
|
||||
|
||||
It’s often useful for a program to evaluate a condition within a loop. While
|
||||
the condition is true, the loop runs. When the condition ceases to be true, the
|
||||
program calls `break`, stopping the loop. This loop type could be implemented
|
||||
using a combination of `loop`, `if`, `else`, and `break`; you could try that
|
||||
now in a program, if you’d like.
|
||||
|
||||
However, this pattern is so common that Rust has a built-in language construct
|
||||
for it, called a `while` loop. Listing 3-3 uses `while`: the program loops
|
||||
three times, counting down each time, and then, after the loop, it prints
|
||||
another message and exits.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let mut number = 3;
|
||||
|
||||
while number != 0 {
|
||||
println!("{}!", number);
|
||||
|
||||
number = number - 1;
|
||||
}
|
||||
|
||||
println!("LIFTOFF!!!");
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 3-3: Using a `while` loop to run code while a
|
||||
condition holds true</span>
|
||||
|
||||
This construct eliminates a lot of nesting that would be necessary if you used
|
||||
`loop`, `if`, `else`, and `break`, and it’s clearer. While a condition holds
|
||||
true, the code runs; otherwise, it exits the loop.
|
||||
|
||||
#### Looping Through a Collection with `for`
|
||||
|
||||
You could use the `while` construct to loop over the elements of a collection,
|
||||
such as an array. For example, let’s look at Listing 3-4:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let a = [10, 20, 30, 40, 50];
|
||||
let mut index = 0;
|
||||
|
||||
while index < 5 {
|
||||
println!("the value is: {}", a[index]);
|
||||
|
||||
index = index + 1;
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 3-4: Looping through each element of a collection
|
||||
using a `while` loop</span>
|
||||
|
||||
Here, the code counts up through the elements in the array. It starts at index
|
||||
`0`, and then loops until it reaches the final index in the array (that is,
|
||||
when `index < 5` is no longer true). Running this code will print every element
|
||||
in the array:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling loops v0.1.0 (file:///projects/loops)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.32 secs
|
||||
Running `target/debug/loops`
|
||||
the value is: 10
|
||||
the value is: 20
|
||||
the value is: 30
|
||||
the value is: 40
|
||||
the value is: 50
|
||||
```
|
||||
|
||||
All five array values appear in the terminal, as expected. Even though `index`
|
||||
will reach a value of `5` at some point, the loop stops executing before trying
|
||||
to fetch a sixth value from the array.
|
||||
|
||||
But this approach is error prone; we could cause the program to panic if the
|
||||
index length is incorrect. It’s also slow, because the compiler adds runtime
|
||||
code to perform the conditional check on every element on every iteration
|
||||
through the loop.
|
||||
|
||||
As a more concise alternative, you can use a `for` loop and execute some code
|
||||
for each item in a collection. A `for` loop looks like this code in Listing 3-5:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let a = [10, 20, 30, 40, 50];
|
||||
|
||||
for element in a.iter() {
|
||||
println!("the value is: {}", element);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 3-5: Looping through each element of a collection
|
||||
using a `for` loop</span>
|
||||
|
||||
When we run this code, we’ll see the same output as in Listing 3-4. More
|
||||
importantly, we’ve now increased the safety of the code and eliminated the
|
||||
chance of bugs that might result from going beyond the end of the array or not
|
||||
going far enough and missing some items.
|
||||
|
||||
For example, in the code in Listing 3-4, if you removed an item from the `a`
|
||||
array but forgot to update the condition to `while index < 4`, the code would
|
||||
panic. Using the `for` loop, you wouldn’t need to remember to change any other
|
||||
code if you changed the number of values in the array.
|
||||
|
||||
The safety and conciseness of `for` loops make them the most commonly used loop
|
||||
construct in Rust. Even in situations in which you want to run some code a
|
||||
certain number of times, as in the countdown example that used a `while` loop
|
||||
in Listing 3-3, most Rustaceans would use a `for` loop. The way to do that
|
||||
would be to use a `Range`, which is a type provided by the standard library
|
||||
that generates all numbers in sequence starting from one number and ending
|
||||
before another number.
|
||||
|
||||
Here’s what the countdown would look like using a `for` loop and another method
|
||||
we’ve not yet talked about, `rev`, to reverse the range:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
for number in (1..4).rev() {
|
||||
println!("{}!", number);
|
||||
}
|
||||
println!("LIFTOFF!!!");
|
||||
}
|
||||
```
|
||||
|
||||
This code is a bit nicer, isn’t it?
|
||||
|
||||
## Summary
|
||||
|
||||
You made it! That was a sizable chapter: you learned about variables, scalar
|
||||
and compound data types, functions, comments, `if` expressions, and loops! If
|
||||
you want to practice with the concepts discussed in this chapter, try building
|
||||
programs to do the following:
|
||||
|
||||
* Convert temperatures between Fahrenheit and Celsius.
|
||||
* Generate the nth Fibonacci number.
|
||||
* Print the lyrics to the Christmas carol “The Twelve Days of Christmas,”
|
||||
taking advantage of the repetition in the song.
|
||||
|
||||
When you’re ready to move on, we’ll talk about a concept in Rust that *doesn’t*
|
||||
commonly exist in other programming languages: ownership.
|
||||
7
2018-edition/src/ch04-00-understanding-ownership.md
Normal file
7
2018-edition/src/ch04-00-understanding-ownership.md
Normal file
@@ -0,0 +1,7 @@
|
||||
# Understanding Ownership
|
||||
|
||||
Ownership is Rust’s most unique feature, and it enables Rust to make memory
|
||||
safety guarantees without needing a garbage collector. Therefore, it’s
|
||||
important to understand how ownership works in Rust. In this chapter, we’ll
|
||||
talk about ownership as well as several related features: borrowing, slices,
|
||||
and how Rust lays data out in memory.
|
||||
552
2018-edition/src/ch04-01-what-is-ownership.md
Normal file
552
2018-edition/src/ch04-01-what-is-ownership.md
Normal file
@@ -0,0 +1,552 @@
|
||||
## What Is Ownership?
|
||||
|
||||
Rust’s central feature is *ownership*. Although the feature is straightforward
|
||||
to explain, it has deep implications for the rest of the language.
|
||||
|
||||
All programs have to manage the way they use a computer’s memory while running.
|
||||
Some languages have garbage collection that constantly looks for no longer used
|
||||
memory as the program runs; in other languages, the programmer must explicitly
|
||||
allocate and free the memory. Rust uses a third approach: memory is managed
|
||||
through a system of ownership with a set of rules that the compiler checks at
|
||||
compile time. None of the ownership features slow down your program while it’s
|
||||
running.
|
||||
|
||||
Because ownership is a new concept for many programmers, it does take some time
|
||||
to get used to. The good news is that the more experienced you become with Rust
|
||||
and the rules of the ownership system, the more you’ll be able to naturally
|
||||
develop code that is safe and efficient. Keep at it!
|
||||
|
||||
When you understand ownership, you’ll have a solid foundation for understanding
|
||||
the features that make Rust unique. In this chapter, you’ll learn ownership by
|
||||
working through some examples that focus on a very common data structure:
|
||||
strings.
|
||||
|
||||
> ### The Stack and the Heap
|
||||
>
|
||||
> In many programming languages, you don’t have to think about the stack and
|
||||
> the heap very often. But in a systems programming language like Rust, whether
|
||||
> a value is on the stack or the heap has more of an effect on how the language
|
||||
> behaves and why you have to make certain decisions. Parts of ownership will
|
||||
> be described in relation to the stack and the heap later in this chapter, so
|
||||
> here is a brief explanation in preparation.
|
||||
>
|
||||
> Both the stack and the heap are parts of memory that is available to your code
|
||||
> to use at runtime, but they are structured in different ways. The stack stores
|
||||
> values in the order it gets them and removes the values in the opposite order.
|
||||
> This is referred to as *last in, first out*. Think of a stack of plates: when
|
||||
> you add more plates, you put them on top of the pile, and when you need a
|
||||
> plate, you take one off the top. Adding or removing plates from the middle or
|
||||
> bottom wouldn’t work as well! Adding data is called *pushing onto the stack*,
|
||||
> and removing data is called *popping off the stack*.
|
||||
>
|
||||
> The stack is fast because of the way it accesses the data: it never has to
|
||||
> search for a place to put new data or a place to get data from because that
|
||||
> place is always the top. Another property that makes the stack fast is that
|
||||
> all data on the stack must take up a known, fixed size.
|
||||
>
|
||||
> Data with a size unknown at compile time or a size that might change can be
|
||||
> stored on the heap instead. The heap is less organized: when you put data on
|
||||
> the heap, you ask for some amount of space. The operating system finds an
|
||||
> empty spot somewhere in the heap that is big enough, marks it as being in
|
||||
> use, and returns a *pointer*, which is the address of that location. This
|
||||
> process is called *allocating on the heap*, sometimes abbreviated as just
|
||||
> “allocating.” Pushing values onto the stack is not considered allocating.
|
||||
> Because the pointer is a known, fixed size, you can store the pointer on the
|
||||
> stack, but when you want the actual data, you have to follow the pointer.
|
||||
>
|
||||
> Think of being seated at a restaurant. When you enter, you state the number of
|
||||
> people in your group, and the staff finds an empty table that fits everyone
|
||||
> and leads you there. If someone in your group comes late, they can ask where
|
||||
> you’ve been seated to find you.
|
||||
>
|
||||
> Accessing data in the heap is slower than accessing data on the stack because
|
||||
> you have to follow a pointer to get there. Contemporary processors are faster
|
||||
> if they jump around less in memory. Continuing the analogy, consider a server
|
||||
> at a restaurant taking orders from many tables. It’s most efficient to get
|
||||
> all the orders at one table before moving on to the next table. Taking an
|
||||
> order from table A, then an order from table B, then one from A again, and
|
||||
> then one from B again would be a much slower process. By the same token, a
|
||||
> processor can do its job better if it works on data that’s close to other
|
||||
> data (as it is on the stack) rather than farther away (as it can be on the
|
||||
> heap). Allocating a large amount of space on the heap can also take time.
|
||||
>
|
||||
> When your code calls a function, the values passed into the function
|
||||
> (including, potentially, pointers to data on the heap) and the function’s
|
||||
> local variables get pushed onto the stack. When the function is over, those
|
||||
> values get popped off the stack.
|
||||
>
|
||||
> Keeping track of what parts of code are using what data on the heap,
|
||||
> minimizing the amount of duplicate data on the heap, and cleaning up unused
|
||||
> data on the heap so you don’t run out of space are all problems that ownership
|
||||
> addresses. Once you understand ownership, you won’t need to think about the
|
||||
> stack and the heap very often, but knowing that managing heap data is why
|
||||
> ownership exists can help explain why it works the way it does.
|
||||
|
||||
### Ownership Rules
|
||||
|
||||
First, let’s take a look at the ownership rules. Keep these rules in mind as we
|
||||
work through the examples that illustrate them:
|
||||
|
||||
> 1. Each value in Rust has a variable that’s called its *owner*.
|
||||
> 2. There can only be one owner at a time.
|
||||
> 3. When the owner goes out of scope, the value will be dropped.
|
||||
|
||||
### Variable Scope
|
||||
|
||||
We’ve walked through an example of a Rust program already in Chapter 2. Now
|
||||
that we’re past basic syntax, we won’t include all the `fn main() {` code in
|
||||
examples, so if you’re following along, you’ll have to put the following
|
||||
examples inside a `main` function manually. As a result, our examples will be a
|
||||
bit more concise, letting us focus on the actual details rather than
|
||||
boilerplate code.
|
||||
|
||||
As a first example of ownership, we’ll look at the *scope* of some variables. A
|
||||
scope is the range within a program for which an item is valid. Let’s say we
|
||||
have a variable that looks like this:
|
||||
|
||||
```rust
|
||||
let s = "hello";
|
||||
```
|
||||
|
||||
The variable `s` refers to a string literal, where the value of the string is
|
||||
hardcoded into the text of our program. The variable is valid from the point at
|
||||
which it’s declared until the end of the current *scope*. Listing 4-1 has
|
||||
comments annotating where the variable `s` is valid:
|
||||
|
||||
```rust
|
||||
{ // s is not valid here, it’s not yet declared
|
||||
let s = "hello"; // s is valid from this point forward
|
||||
|
||||
// do stuff with s
|
||||
} // this scope is now over, and s is no longer valid
|
||||
```
|
||||
|
||||
<span class="caption">Listing 4-1: A variable and the scope in which it is
|
||||
valid</span>
|
||||
|
||||
In other words, there are two important points in time here:
|
||||
|
||||
* When `s` comes *into scope*, it is valid.
|
||||
* It remains valid until it goes *out of scope*.
|
||||
|
||||
At this point, the relationship between scopes and when variables are valid is
|
||||
similar to that in other programming languages. Now we’ll build on top of this
|
||||
understanding by introducing the `String` type.
|
||||
|
||||
### The `String` Type
|
||||
|
||||
To illustrate the rules of ownership, we need a data type that is more complex
|
||||
than the ones we covered in the “Data Types” section of Chapter 3. The types
|
||||
covered previously are all stored on the stack and popped off the stack when
|
||||
their scope is over, but we want to look at data that is stored on the heap and
|
||||
explore how Rust knows when to clean up that data.
|
||||
|
||||
We’ll use `String` as the example here and concentrate on the parts of `String`
|
||||
that relate to ownership. These aspects also apply to other complex data types
|
||||
provided by the standard library and that you create. We’ll discuss `String` in
|
||||
more depth in Chapter 8.
|
||||
|
||||
We’ve already seen string literals, where a string value is hardcoded into our
|
||||
program. String literals are convenient, but they aren’t suitable for every
|
||||
situation in which we may want to use text. One reason is that they’re
|
||||
immutable. Another is that not every string value can be known when we write
|
||||
our code: for example, what if we want to take user input and store it? For
|
||||
these situations, Rust has a second string type, `String`. This type is
|
||||
allocated on the heap and as such is able to store an amount of text that is
|
||||
unknown to us at compile time. You can create a `String` from a string literal
|
||||
using the `from` function, like so:
|
||||
|
||||
```rust
|
||||
let s = String::from("hello");
|
||||
```
|
||||
|
||||
The double colon (`::`) is an operator that allows us to namespace this
|
||||
particular `from` function under the `String` type rather than using some sort
|
||||
of name like `string_from`. We’ll discuss this syntax more in the “Method
|
||||
Syntax” section of Chapter 5 and when we talk about namespacing with modules in
|
||||
“Module Definitions” in Chapter 7.
|
||||
|
||||
This kind of string *can* be mutated:
|
||||
|
||||
```rust
|
||||
let mut s = String::from("hello");
|
||||
|
||||
s.push_str(", world!"); // push_str() appends a literal to a String
|
||||
|
||||
println!("{}", s); // This will print `hello, world!`
|
||||
```
|
||||
|
||||
So, what’s the difference here? Why can `String` be mutated but literals
|
||||
cannot? The difference is how these two types deal with memory.
|
||||
|
||||
### Memory and Allocation
|
||||
|
||||
In the case of a string literal, we know the contents at compile time, so the
|
||||
text is hardcoded directly into the final executable. This is why string
|
||||
literals are fast and efficient. But these properties only come from the string
|
||||
literal’s immutability. Unfortunately, we can’t put a blob of memory into the
|
||||
binary for each piece of text whose size is unknown at compile time and whose
|
||||
size might change while running the program.
|
||||
|
||||
With the `String` type, in order to support a mutable, growable piece of text,
|
||||
we need to allocate an amount of memory on the heap, unknown at compile time,
|
||||
to hold the contents. This means:
|
||||
|
||||
* The memory must be requested from the operating system at runtime.
|
||||
* We need a way of returning this memory to the operating system when we’re
|
||||
done with our `String`.
|
||||
|
||||
That first part is done by us: when we call `String::from`, its implementation
|
||||
requests the memory it needs. This is pretty much universal in programming
|
||||
languages.
|
||||
|
||||
However, the second part is different. In languages with a *garbage collector
|
||||
(GC)*, the GC keeps track and cleans up memory that isn’t being used anymore,
|
||||
and we don’t need to think about it. Without a GC, it’s our responsibility to
|
||||
identify when memory is no longer being used and call code to explicitly return
|
||||
it, just as we did to request it. Doing this correctly has historically been a
|
||||
difficult programming problem. If we forget, we’ll waste memory. If we do it
|
||||
too early, we’ll have an invalid variable. If we do it twice, that’s a bug too.
|
||||
We need to pair exactly one `allocate` with exactly one `free`.
|
||||
|
||||
Rust takes a different path: the memory is automatically returned once the
|
||||
variable that owns it goes out of scope. Here’s a version of our scope example
|
||||
from Listing 4-1 using a `String` instead of a string literal:
|
||||
|
||||
```rust
|
||||
{
|
||||
let s = String::from("hello"); // s is valid from this point forward
|
||||
|
||||
// do stuff with s
|
||||
} // this scope is now over, and s is no
|
||||
// longer valid
|
||||
```
|
||||
|
||||
There is a natural point at which we can return the memory our `String` needs
|
||||
to the operating system: when `s` goes out of scope. When a variable goes out
|
||||
of scope, Rust calls a special function for us. This function is called `drop`,
|
||||
and it’s where the author of `String` can put the code to return the memory.
|
||||
Rust calls `drop` automatically at the closing `}`.
|
||||
|
||||
> Note: In C++, this pattern of deallocating resources at the end of an item’s
|
||||
> lifetime is sometimes called *Resource Acquisition Is Initialization (RAII)*.
|
||||
> The `drop` function in Rust will be familiar to you if you’ve used RAII
|
||||
> patterns.
|
||||
|
||||
This pattern has a profound impact on the way Rust code is written. It may seem
|
||||
simple right now, but the behavior of code can be unexpected in more
|
||||
complicated situations when we want to have multiple variables use the data
|
||||
we’ve allocated on the heap. Let’s explore some of those situations now.
|
||||
|
||||
#### Ways Variables and Data Interact: Move
|
||||
|
||||
Multiple variables can interact with the same data in different ways in Rust.
|
||||
Let’s look at an example using an integer in Listing 4-2:
|
||||
|
||||
```rust
|
||||
let x = 5;
|
||||
let y = x;
|
||||
```
|
||||
|
||||
<span class="caption">Listing 4-2: Assigning the integer value of variable `x`
|
||||
to `y`</span>
|
||||
|
||||
We can probably guess what this is doing: “bind the value `5` to `x`; then make
|
||||
a copy of the value in `x` and bind it to `y`.” We now have two variables, `x`
|
||||
and `y`, and both equal `5`. This is indeed what is happening, because integers
|
||||
are simple values with a known, fixed size, and these two `5` values are pushed
|
||||
onto the stack.
|
||||
|
||||
Now let’s look at the `String` version:
|
||||
|
||||
```rust
|
||||
let s1 = String::from("hello");
|
||||
let s2 = s1;
|
||||
```
|
||||
|
||||
This looks very similar to the previous code, so we might assume that the way
|
||||
it works would be the same: that is, the second line would make a copy of the
|
||||
value in `s1` and bind it to `s2`. But this isn’t quite what happens.
|
||||
|
||||
Take a look at Figure 4-1 to see what is happening to `String` under the
|
||||
covers. A `String` is made up of three parts, shown on the left: a pointer to
|
||||
the memory that holds the contents of the string, a length, and a capacity.
|
||||
This group of data is stored on the stack. On the right is the memory on the
|
||||
heap that holds the contents.
|
||||
|
||||
<img alt="String in memory" src="img/trpl04-01.svg" class="center" style="width: 50%;" />
|
||||
|
||||
<span class="caption">Figure 4-1: Representation in memory of a `String`
|
||||
holding the value `"hello"` bound to `s1`</span>
|
||||
|
||||
The length is how much memory, in bytes, the contents of the `String` is
|
||||
currently using. The capacity is the total amount of memory, in bytes, that the
|
||||
`String` has received from the operating system. The difference between length
|
||||
and capacity matters, but not in this context, so for now, it’s fine to ignore
|
||||
the capacity.
|
||||
|
||||
When we assign `s1` to `s2`, the `String` data is copied, meaning we copy the
|
||||
pointer, the length, and the capacity that are on the stack. We do not copy the
|
||||
data on the heap that the pointer refers to. In other words, the data
|
||||
representation in memory looks like Figure 4-2.
|
||||
|
||||
<img alt="s1 and s2 pointing to the same value" src="img/trpl04-02.svg" class="center" style="width: 50%;" />
|
||||
|
||||
<span class="caption">Figure 4-2: Representation in memory of the variable `s2`
|
||||
that has a copy of the pointer, length, and capacity of `s1`</span>
|
||||
|
||||
The representation does *not* look like Figure 4-3, which is what memory would
|
||||
look like if Rust instead copied the heap data as well. If Rust did this, the
|
||||
operation `s2 = s1` could be very expensive in terms of runtime performance if
|
||||
the data on the heap were large.
|
||||
|
||||
<img alt="s1 and s2 to two places" src="img/trpl04-03.svg" class="center" style="width: 50%;" />
|
||||
|
||||
<span class="caption">Figure 4-3: Another possibility for what `s2 = s1` might
|
||||
do if Rust copied the heap data as well</span>
|
||||
|
||||
Earlier, we said that when a variable goes out of scope, Rust automatically
|
||||
calls the `drop` function and cleans up the heap memory for that variable. But
|
||||
Figure 4-2 shows both data pointers pointing to the same location. This is a
|
||||
problem: when `s2` and `s1` go out of scope, they will both try to free the
|
||||
same memory. This is known as a *double free* error and is one of the memory
|
||||
safety bugs we mentioned previously. Freeing memory twice can lead to memory
|
||||
corruption, which can potentially lead to security vulnerabilities.
|
||||
|
||||
To ensure memory safety, there’s one more detail to what happens in this
|
||||
situation in Rust. Instead of trying to copy the allocated memory, Rust
|
||||
considers `s1` to no longer be valid and, therefore, Rust doesn’t need to free
|
||||
anything when `s1` goes out of scope. Check out what happens when you try to
|
||||
use `s1` after `s2` is created; it won’t work:
|
||||
|
||||
```rust,ignore
|
||||
let s1 = String::from("hello");
|
||||
let s2 = s1;
|
||||
|
||||
println!("{}, world!", s1);
|
||||
```
|
||||
|
||||
You’ll get an error like this because Rust prevents you from using the
|
||||
invalidated reference:
|
||||
|
||||
```text
|
||||
error[E0382]: use of moved value: `s1`
|
||||
--> src/main.rs:5:28
|
||||
|
|
||||
3 | let s2 = s1;
|
||||
| -- value moved here
|
||||
4 |
|
||||
5 | println!("{}, world!", s1);
|
||||
| ^^ value used here after move
|
||||
|
|
||||
= note: move occurs because `s1` has type `std::string::String`, which does
|
||||
not implement the `Copy` trait
|
||||
```
|
||||
|
||||
If you’ve heard the terms *shallow copy* and *deep copy* while working with
|
||||
other languages, the concept of copying the pointer, length, and capacity
|
||||
without copying the data probably sounds like making a shallow copy. But
|
||||
because Rust also invalidates the first variable, instead of being called a
|
||||
shallow copy, it’s known as a *move*. Here we would read this by saying that
|
||||
`s1` was *moved* into `s2`. So what actually happens is shown in Figure 4-4.
|
||||
|
||||
<img alt="s1 moved to s2" src="img/trpl04-04.svg" class="center" style="width: 50%;" />
|
||||
|
||||
<span class="caption">Figure 4-4: Representation in memory after `s1` has been
|
||||
invalidated</span>
|
||||
|
||||
That solves our problem! With only `s2` valid, when it goes out of scope, it
|
||||
alone will free the memory, and we’re done.
|
||||
|
||||
In addition, there’s a design choice that’s implied by this: Rust will never
|
||||
automatically create “deep” copies of your data. Therefore, any *automatic*
|
||||
copying can be assumed to be inexpensive in terms of runtime performance.
|
||||
|
||||
#### Ways Variables and Data Interact: Clone
|
||||
|
||||
If we *do* want to deeply copy the heap data of the `String`, not just the
|
||||
stack data, we can use a common method called `clone`. We’ll discuss method
|
||||
syntax in Chapter 5, but because methods are a common feature in many
|
||||
programming languages, you’ve probably seen them before.
|
||||
|
||||
Here’s an example of the `clone` method in action:
|
||||
|
||||
```rust
|
||||
let s1 = String::from("hello");
|
||||
let s2 = s1.clone();
|
||||
|
||||
println!("s1 = {}, s2 = {}", s1, s2);
|
||||
```
|
||||
|
||||
This works just fine and explicitly produces the behavior shown in Figure 4-3,
|
||||
where the heap data *does* get copied.
|
||||
|
||||
When you see a call to `clone`, you know that some arbitrary code is being
|
||||
executed and that code may be expensive. It’s a visual indicator that something
|
||||
different is going on.
|
||||
|
||||
#### Stack-Only Data: Copy
|
||||
|
||||
There’s another wrinkle we haven’t talked about yet. This code using integers,
|
||||
part of which was shown earlier in Listing 4-2, works and is valid:
|
||||
|
||||
```rust
|
||||
let x = 5;
|
||||
let y = x;
|
||||
|
||||
println!("x = {}, y = {}", x, y);
|
||||
```
|
||||
|
||||
But this code seems to contradict what we just learned: we don’t have a call to
|
||||
`clone`, but `x` is still valid and wasn’t moved into `y`.
|
||||
|
||||
The reason is that types such as integers that have a known size at compile
|
||||
time are stored entirely on the stack, so copies of the actual values are quick
|
||||
to make. That means there’s no reason we would want to prevent `x` from being
|
||||
valid after we create the variable `y`. In other words, there’s no difference
|
||||
between deep and shallow copying here, so calling `clone` wouldn’t do anything
|
||||
different from the usual shallow copying and we can leave it out.
|
||||
|
||||
Rust has a special annotation called the `Copy` trait that we can place on
|
||||
types like integers that are stored on the stack (we’ll talk more about traits
|
||||
in Chapter 10). If a type has the `Copy` trait, an older variable is still
|
||||
usable after assignment. Rust won’t let us annotate a type with the `Copy`
|
||||
trait if the type, or any of its parts, has implemented the `Drop` trait. If
|
||||
the type needs something special to happen when the value goes out of scope and
|
||||
we add the `Copy` annotation to that type, we’ll get a compile time error. To
|
||||
learn about how to add the `Copy` annotation to your type, see “Derivable
|
||||
Traits” in Appendix C.
|
||||
|
||||
So what types are `Copy`? You can check the documentation for the given type to
|
||||
be sure, but as a general rule, any group of simple scalar values can be
|
||||
`Copy`, and nothing that requires allocation or is some form of resource is
|
||||
`Copy`. Here are some of the types that are `Copy`:
|
||||
|
||||
* All the integer types, such as `u32`.
|
||||
* The Boolean type, `bool`, with values `true` and `false`.
|
||||
* All the floating point types, such as `f64`.
|
||||
* The character type, `char`.
|
||||
* Tuples, but only if they contain types that are also `Copy`. For example,
|
||||
`(i32, i32)` is `Copy`, but `(i32, String)` is not.
|
||||
|
||||
### Ownership and Functions
|
||||
|
||||
The semantics for passing a value to a function are similar to those for
|
||||
assigning a value to a variable. Passing a variable to a function will move or
|
||||
copy, just as assignment does. Listing 4-3 has an example with some annotations
|
||||
showing where variables go into and out of scope:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let s = String::from("hello"); // s comes into scope
|
||||
|
||||
takes_ownership(s); // s's value moves into the function...
|
||||
// ... and so is no longer valid here
|
||||
|
||||
let x = 5; // x comes into scope
|
||||
|
||||
makes_copy(x); // x would move into the function,
|
||||
// but i32 is Copy, so it’s okay to still
|
||||
// use x afterward
|
||||
|
||||
} // Here, x goes out of scope, then s. But because s's value was moved, nothing
|
||||
// special happens.
|
||||
|
||||
fn takes_ownership(some_string: String) { // some_string comes into scope
|
||||
println!("{}", some_string);
|
||||
} // Here, some_string goes out of scope and `drop` is called. The backing
|
||||
// memory is freed.
|
||||
|
||||
fn makes_copy(some_integer: i32) { // some_integer comes into scope
|
||||
println!("{}", some_integer);
|
||||
} // Here, some_integer goes out of scope. Nothing special happens.
|
||||
```
|
||||
|
||||
<span class="caption">Listing 4-3: Functions with ownership and scope
|
||||
annotated</span>
|
||||
|
||||
If we tried to use `s` after the call to `takes_ownership`, Rust would throw a
|
||||
compile time error. These static checks protect us from mistakes. Try adding
|
||||
code to `main` that uses `s` and `x` to see where you can use them and where
|
||||
the ownership rules prevent you from doing so.
|
||||
|
||||
### Return Values and Scope
|
||||
|
||||
Returning values can also transfer ownership. Listing 4-4 is an example with
|
||||
similar annotations to those in Listing 4-3:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let s1 = gives_ownership(); // gives_ownership moves its return
|
||||
// value into s1
|
||||
|
||||
let s2 = String::from("hello"); // s2 comes into scope
|
||||
|
||||
let s3 = takes_and_gives_back(s2); // s2 is moved into
|
||||
// takes_and_gives_back, which also
|
||||
// moves its return value into s3
|
||||
} // Here, s3 goes out of scope and is dropped. s2 goes out of scope but was
|
||||
// moved, so nothing happens. s1 goes out of scope and is dropped.
|
||||
|
||||
fn gives_ownership() -> String { // gives_ownership will move its
|
||||
// return value into the function
|
||||
// that calls it
|
||||
|
||||
let some_string = String::from("hello"); // some_string comes into scope
|
||||
|
||||
some_string // some_string is returned and
|
||||
// moves out to the calling
|
||||
// function.
|
||||
}
|
||||
|
||||
// takes_and_gives_back will take a String and return one.
|
||||
fn takes_and_gives_back(a_string: String) -> String { // a_string comes into
|
||||
// scope
|
||||
|
||||
a_string // a_string is returned and moves out to the calling function
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 4-4: Transferring ownership of return
|
||||
values</span>
|
||||
|
||||
The ownership of a variable follows the same pattern every time: assigning a
|
||||
value to another variable moves it. When a variable that includes data on the
|
||||
heap goes out of scope, the value will be cleaned up by `drop` unless the data
|
||||
has been moved to be owned by another variable.
|
||||
|
||||
Taking ownership and then returning ownership with every function is a bit
|
||||
tedious. What if we want to let a function use a value but not take ownership?
|
||||
It’s quite annoying that anything we pass in also needs to be passed back if we
|
||||
want to use it again, in addition to any data resulting from the body of the
|
||||
function that we might want to return as well.
|
||||
|
||||
It’s possible to return multiple values using a tuple, as shown in Listing 4-5:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let s1 = String::from("hello");
|
||||
|
||||
let (s2, len) = calculate_length(s1);
|
||||
|
||||
println!("The length of '{}' is {}.", s2, len);
|
||||
}
|
||||
|
||||
fn calculate_length(s: String) -> (String, usize) {
|
||||
let length = s.len(); // len() returns the length of a String
|
||||
|
||||
(s, length)
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 4-5: Returning ownership of parameters</span>
|
||||
|
||||
But this is too much ceremony and a lot of work for a concept that should be
|
||||
common. Luckily for us, Rust has a feature for this concept, called
|
||||
*references*.
|
||||
322
2018-edition/src/ch04-02-references-and-borrowing.md
Normal file
322
2018-edition/src/ch04-02-references-and-borrowing.md
Normal file
@@ -0,0 +1,322 @@
|
||||
## References and Borrowing
|
||||
|
||||
The issue with the tuple code in Listing 4-5 is that we have to return the
|
||||
`String` to the calling function so we can still use the `String` after the
|
||||
call to `calculate_length`, because the `String` was moved into
|
||||
`calculate_length`.
|
||||
|
||||
Here is how you would define and use a `calculate_length` function that has a
|
||||
reference to an object as a parameter instead of taking ownership of the
|
||||
value:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let s1 = String::from("hello");
|
||||
|
||||
let len = calculate_length(&s1);
|
||||
|
||||
println!("The length of '{}' is {}.", s1, len);
|
||||
}
|
||||
|
||||
fn calculate_length(s: &String) -> usize {
|
||||
s.len()
|
||||
}
|
||||
```
|
||||
|
||||
First, notice that all the tuple code in the variable declaration and the
|
||||
function return value is gone. Second, note that we pass `&s1` into
|
||||
`calculate_length` and, in its definition, we take `&String` rather than
|
||||
`String`.
|
||||
|
||||
These ampersands are *references*, and they allow you to refer to some value
|
||||
without taking ownership of it. Figure 4-5 shows a diagram.
|
||||
|
||||
<img alt="&String s pointing at String s1" src="img/trpl04-05.svg" class="center" />
|
||||
|
||||
<span class="caption">Figure 4-5: A diagram of `&String s` pointing at `String
|
||||
s1`</span>
|
||||
|
||||
> Note: The opposite of referencing by using `&` is *dereferencing*, which is
|
||||
> accomplished with the dereference operator, `*`. We’ll see some uses of the
|
||||
> dereference operator in Chapter 8 and discuss details of dereferencing in
|
||||
> Chapter 15.
|
||||
|
||||
Let’s take a closer look at the function call here:
|
||||
|
||||
```rust
|
||||
# fn calculate_length(s: &String) -> usize {
|
||||
# s.len()
|
||||
# }
|
||||
let s1 = String::from("hello");
|
||||
|
||||
let len = calculate_length(&s1);
|
||||
```
|
||||
|
||||
The `&s1` syntax lets us create a reference that *refers* to the value of `s1`
|
||||
but does not own it. Because it does not own it, the value it points to will
|
||||
not be dropped when the reference goes out of scope.
|
||||
|
||||
Likewise, the signature of the function uses `&` to indicate that the type of
|
||||
the parameter `s` is a reference. Let’s add some explanatory annotations:
|
||||
|
||||
```rust
|
||||
fn calculate_length(s: &String) -> usize { // s is a reference to a String
|
||||
s.len()
|
||||
} // Here, s goes out of scope. But because it does not have ownership of what
|
||||
// it refers to, nothing happens.
|
||||
```
|
||||
|
||||
The scope in which the variable `s` is valid is the same as any function
|
||||
parameter’s scope, but we don’t drop what the reference points to when it goes
|
||||
out of scope because we don’t have ownership. When functions have references as
|
||||
parameters instead of the actual values, we won’t need to return the values in
|
||||
order to give back ownership, because we never had ownership.
|
||||
|
||||
We call having references as function parameters *borrowing*. As in real life,
|
||||
if a person owns something, you can borrow it from them. When you’re done, you
|
||||
have to give it back.
|
||||
|
||||
So what happens if we try to modify something we’re borrowing? Try the code in
|
||||
Listing 4-6. Spoiler alert: it doesn’t work!
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let s = String::from("hello");
|
||||
|
||||
change(&s);
|
||||
}
|
||||
|
||||
fn change(some_string: &String) {
|
||||
some_string.push_str(", world");
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 4-6: Attempting to modify a borrowed value</span>
|
||||
|
||||
Here’s the error:
|
||||
|
||||
```text
|
||||
error[E0596]: cannot borrow immutable borrowed content `*some_string` as mutable
|
||||
--> error.rs:8:5
|
||||
|
|
||||
7 | fn change(some_string: &String) {
|
||||
| ------- use `&mut String` here to make mutable
|
||||
8 | some_string.push_str(", world");
|
||||
| ^^^^^^^^^^^ cannot borrow as mutable
|
||||
```
|
||||
|
||||
Just as variables are immutable by default, so are references. We’re not
|
||||
allowed to modify something we have a reference to.
|
||||
|
||||
### Mutable References
|
||||
|
||||
We can fix the error in the code from Listing 4-6 with just a small tweak:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let mut s = String::from("hello");
|
||||
|
||||
change(&mut s);
|
||||
}
|
||||
|
||||
fn change(some_string: &mut String) {
|
||||
some_string.push_str(", world");
|
||||
}
|
||||
```
|
||||
|
||||
First, we had to change `s` to be `mut`. Then we had to create a mutable
|
||||
reference with `&mut s` and accept a mutable reference with `some_string: &mut
|
||||
String`.
|
||||
|
||||
But mutable references have one big restriction: you can only have one mutable
|
||||
reference to a particular piece of data in a particular scope. This code will
|
||||
fail:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
let mut s = String::from("hello");
|
||||
|
||||
let r1 = &mut s;
|
||||
let r2 = &mut s;
|
||||
```
|
||||
|
||||
Here’s the error:
|
||||
|
||||
```text
|
||||
error[E0499]: cannot borrow `s` as mutable more than once at a time
|
||||
--> borrow_twice.rs:5:19
|
||||
|
|
||||
4 | let r1 = &mut s;
|
||||
| - first mutable borrow occurs here
|
||||
5 | let r2 = &mut s;
|
||||
| ^ second mutable borrow occurs here
|
||||
6 | }
|
||||
| - first borrow ends here
|
||||
```
|
||||
|
||||
This restriction allows for mutation but in a very controlled fashion. It’s
|
||||
something that new Rustaceans struggle with, because most languages let you
|
||||
mutate whenever you’d like.
|
||||
|
||||
The benefit of having this restriction is that Rust can prevent data races at
|
||||
compile time. A *data race* is similar to a race condition and happens when
|
||||
these three behaviors occur:
|
||||
|
||||
* Two or more pointers access the same data at the same time.
|
||||
* At least one of the pointers is being used to write to the data.
|
||||
* There’s no mechanism being used to synchronize access to the data.
|
||||
|
||||
Data races cause undefined behavior and can be difficult to diagnose and fix
|
||||
when you’re trying to track them down at runtime; Rust prevents this problem
|
||||
from happening because it won’t even compile code with data races!
|
||||
|
||||
As always, we can use curly brackets to create a new scope, allowing for
|
||||
multiple mutable references, just not *simultaneous* ones:
|
||||
|
||||
```rust
|
||||
let mut s = String::from("hello");
|
||||
|
||||
{
|
||||
let r1 = &mut s;
|
||||
|
||||
} // r1 goes out of scope here, so we can make a new reference with no problems.
|
||||
|
||||
let r2 = &mut s;
|
||||
```
|
||||
|
||||
A similar rule exists for combining mutable and immutable references. This code
|
||||
results in an error:
|
||||
|
||||
```rust,ignore
|
||||
let mut s = String::from("hello");
|
||||
|
||||
let r1 = &s; // no problem
|
||||
let r2 = &s; // no problem
|
||||
let r3 = &mut s; // BIG PROBLEM
|
||||
```
|
||||
|
||||
Here’s the error:
|
||||
|
||||
```text
|
||||
error[E0502]: cannot borrow `s` as mutable because it is also borrowed as
|
||||
immutable
|
||||
--> borrow_thrice.rs:6:19
|
||||
|
|
||||
4 | let r1 = &s; // no problem
|
||||
| - immutable borrow occurs here
|
||||
5 | let r2 = &s; // no problem
|
||||
6 | let r3 = &mut s; // BIG PROBLEM
|
||||
| ^ mutable borrow occurs here
|
||||
7 | }
|
||||
| - immutable borrow ends here
|
||||
```
|
||||
|
||||
Whew! We *also* cannot have a mutable reference while we have an immutable one.
|
||||
Users of an immutable reference don’t expect the values to suddenly change out
|
||||
from under them! However, multiple immutable references are okay because no one
|
||||
who is just reading the data has the ability to affect anyone else’s reading of
|
||||
the data.
|
||||
|
||||
Even though these errors may be frustrating at times, remember that it’s the
|
||||
Rust compiler pointing out a potential bug early (at compile time rather than
|
||||
at runtime) and showing you exactly where the problem is. Then you don’t have
|
||||
to track down why your data isn’t what you thought it was.
|
||||
|
||||
### Dangling References
|
||||
|
||||
In languages with pointers, it’s easy to erroneously create a *dangling
|
||||
pointer*, a pointer that references a location in memory that may have been
|
||||
given to someone else, by freeing some memory while preserving a pointer to
|
||||
that memory. In Rust, by contrast, the compiler guarantees that references will
|
||||
never be dangling references: if you have a reference to some data, the
|
||||
compiler will ensure that the data will not go out of scope before the
|
||||
reference to the data does.
|
||||
|
||||
Let’s try to create a dangling reference, which Rust will prevent with a
|
||||
compile-time error:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let reference_to_nothing = dangle();
|
||||
}
|
||||
|
||||
fn dangle() -> &String {
|
||||
let s = String::from("hello");
|
||||
|
||||
&s
|
||||
}
|
||||
```
|
||||
|
||||
Here’s the error:
|
||||
|
||||
```text
|
||||
error[E0106]: missing lifetime specifier
|
||||
--> dangle.rs:5:16
|
||||
|
|
||||
5 | fn dangle() -> &String {
|
||||
| ^ expected lifetime parameter
|
||||
|
|
||||
= help: this function's return type contains a borrowed value, but there is
|
||||
no value for it to be borrowed from
|
||||
= help: consider giving it a 'static lifetime
|
||||
```
|
||||
|
||||
This error message refers to a feature we haven’t covered yet: *lifetimes*.
|
||||
We’ll discuss lifetimes in detail in Chapter 10. But, if you disregard the
|
||||
parts about lifetimes, the message does contain the key to why this code is a
|
||||
problem:
|
||||
|
||||
```text
|
||||
this function's return type contains a borrowed value, but there is no value
|
||||
for it to be borrowed from.
|
||||
```
|
||||
|
||||
Let’s take a closer look at exactly what’s happening at each stage of our
|
||||
`dangle` code:
|
||||
|
||||
```rust,ignore
|
||||
fn dangle() -> &String { // dangle returns a reference to a String
|
||||
|
||||
let s = String::from("hello"); // s is a new String
|
||||
|
||||
&s // we return a reference to the String, s
|
||||
} // Here, s goes out of scope, and is dropped. Its memory goes away.
|
||||
// Danger!
|
||||
```
|
||||
|
||||
Because `s` is created inside `dangle`, when the code of `dangle` is finished,
|
||||
`s` will be deallocated. But we tried to return a reference to it. That means
|
||||
this reference would be pointing to an invalid `String` That’s no good! Rust
|
||||
won’t let us do this.
|
||||
|
||||
The solution here is to return the `String` directly:
|
||||
|
||||
```rust
|
||||
fn no_dangle() -> String {
|
||||
let s = String::from("hello");
|
||||
|
||||
s
|
||||
}
|
||||
```
|
||||
|
||||
This works without any problems. Ownership is moved out, and nothing is
|
||||
deallocated.
|
||||
|
||||
### The Rules of References
|
||||
|
||||
Let’s recap what we’ve discussed about references:
|
||||
|
||||
* At any given time, you can have *either* (but not both of) one mutable
|
||||
reference or any number of immutable references.
|
||||
* References must always be valid.
|
||||
|
||||
Next, we’ll look at a different kind of reference: slices.
|
||||
386
2018-edition/src/ch04-03-slices.md
Normal file
386
2018-edition/src/ch04-03-slices.md
Normal file
@@ -0,0 +1,386 @@
|
||||
## The Slice Type
|
||||
|
||||
Another data type that does not have ownership is the *slice*. Slices let you
|
||||
reference a contiguous sequence of elements in a collection rather than the
|
||||
whole collection.
|
||||
|
||||
Here’s a small programming problem: write a function that takes a string and
|
||||
returns the first word it finds in that string. If the function doesn’t find a
|
||||
space in the string, the whole string must be one word, so the entire string
|
||||
should be returned.
|
||||
|
||||
Let’s think about the signature of this function:
|
||||
|
||||
```rust,ignore
|
||||
fn first_word(s: &String) -> ?
|
||||
```
|
||||
|
||||
This function, `first_word`, has a `&String` as a parameter. We don’t want
|
||||
ownership, so this is fine. But what should we return? We don’t really have a
|
||||
way to talk about *part* of a string. However, we could return the index of the
|
||||
end of the word. Let’s try that, as shown in Listing 4-7:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn first_word(s: &String) -> usize {
|
||||
let bytes = s.as_bytes();
|
||||
|
||||
for (i, &item) in bytes.iter().enumerate() {
|
||||
if item == b' ' {
|
||||
return i;
|
||||
}
|
||||
}
|
||||
|
||||
s.len()
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 4-7: The `first_word` function that returns a
|
||||
byte index value into the `String` parameter</span>
|
||||
|
||||
Because we need to go through the `String` element by element and check whether
|
||||
a value is a space, we’ll convert our `String` to an array of bytes using the
|
||||
`as_bytes` method:
|
||||
|
||||
```rust,ignore
|
||||
let bytes = s.as_bytes();
|
||||
```
|
||||
|
||||
Next, we create an iterator over the array of bytes using the `iter` method:
|
||||
|
||||
```rust,ignore
|
||||
for (i, &item) in bytes.iter().enumerate() {
|
||||
```
|
||||
|
||||
We’ll discuss iterators in more detail in Chapter 13. For now, know that `iter`
|
||||
is a method that returns each element in a collection and that `enumerate`
|
||||
wraps the result of `iter` and returns each element as part of a tuple instead.
|
||||
The first element of the tuple returned from `enumerate` is the index, and the
|
||||
second element is a reference to the element. This is a bit more convenient
|
||||
than calculating the index ourselves.
|
||||
|
||||
Because the `enumerate` method returns a tuple, we can use patterns to
|
||||
destructure that tuple, just like everywhere else in Rust. So in the `for`
|
||||
loop, we specify a pattern that has `i` for the index in the tuple and `&item`
|
||||
for the single byte in the tuple. Because we get a reference to the element
|
||||
from `.iter().enumerate()`, we use `&` in the pattern.
|
||||
|
||||
Inside the `for` loop, we search for the byte that represents the space by
|
||||
using the byte literal syntax. If we find a space, we return the position.
|
||||
Otherwise, we return the length of the string by using `s.len()`:
|
||||
|
||||
```rust,ignore
|
||||
if item == b' ' {
|
||||
return i;
|
||||
}
|
||||
}
|
||||
s.len()
|
||||
```
|
||||
|
||||
We now have a way to find out the index of the end of the first word in the
|
||||
string, but there’s a problem. We’re returning a `usize` on its own, but it’s
|
||||
only a meaningful number in the context of the `&String`. In other words,
|
||||
because it’s a separate value from the `String`, there’s no guarantee that it
|
||||
will still be valid in the future. Consider the program in Listing 4-8 that
|
||||
uses the `first_word` function from Listing 4-7:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# fn first_word(s: &String) -> usize {
|
||||
# let bytes = s.as_bytes();
|
||||
#
|
||||
# for (i, &item) in bytes.iter().enumerate() {
|
||||
# if item == b' ' {
|
||||
# return i;
|
||||
# }
|
||||
# }
|
||||
#
|
||||
# s.len()
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let mut s = String::from("hello world");
|
||||
|
||||
let word = first_word(&s); // word will get the value 5
|
||||
|
||||
s.clear(); // This empties the String, making it equal to ""
|
||||
|
||||
// word still has the value 5 here, but there's no more string that
|
||||
// we could meaningfully use the value 5 with. word is now totally invalid!
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 4-8: Storing the result from calling the
|
||||
`first_word` function and then changing the `String` contents</span>
|
||||
|
||||
This program compiles without any errors and would also do so if we used `word`
|
||||
after calling `s.clear()`. Because `word` isn’t connected to the state of `s`
|
||||
at all, `word` still contains the value `5`. We could use that value `5` with
|
||||
the variable `s` to try to extract the first word out, but this would be a bug
|
||||
because the contents of `s` have changed since we saved `5` in `word`.
|
||||
|
||||
Having to worry about the index in `word` getting out of sync with the data in
|
||||
`s` is tedious and error prone! Managing these indices is even more brittle if
|
||||
we write a `second_word` function. Its signature would have to look like this:
|
||||
|
||||
```rust,ignore
|
||||
fn second_word(s: &String) -> (usize, usize) {
|
||||
```
|
||||
|
||||
Now we’re tracking a starting *and* an ending index, and we have even more
|
||||
values that were calculated from data in a particular state but aren’t tied to
|
||||
that state at all. We now have three unrelated variables floating around that
|
||||
need to be kept in sync.
|
||||
|
||||
Luckily, Rust has a solution to this problem: string slices.
|
||||
|
||||
### String Slices
|
||||
|
||||
A *string slice* is a reference to part of a `String`, and it looks like this:
|
||||
|
||||
```rust
|
||||
let s = String::from("hello world");
|
||||
|
||||
let hello = &s[0..5];
|
||||
let world = &s[6..11];
|
||||
```
|
||||
|
||||
This is similar to taking a reference to the whole `String` but with the extra
|
||||
`[0..5]` bit. Rather than a reference to the entire `String`, it’s a reference
|
||||
to a portion of the `String`. The `start..end` syntax is a range that begins at
|
||||
`start` and continues up to, but not including, `end`.
|
||||
|
||||
We can create slices using a range within brackets by specifying
|
||||
`[starting_index..ending_index]`, where `starting_index` is the first position
|
||||
in the slice and `ending_index` is one more than the last position in the
|
||||
slice. Internally, the slice data structure stores the starting position and
|
||||
the length of the slice, which corresponds to `ending_index` minus
|
||||
`starting_index`. So in the case of `let world = &s[6..11];`, `world` would be
|
||||
a slice that contains a pointer to the 6th byte of `s` and a length value of 5.
|
||||
|
||||
Figure 4-6 shows this in a diagram.
|
||||
|
||||
<img alt="world containing a pointer to the 6th byte of String s and a length 5" src="img/trpl04-06.svg" class="center" style="width: 50%;" />
|
||||
|
||||
<span class="caption">Figure 4-6: String slice referring to part of a
|
||||
`String`</span>
|
||||
|
||||
With Rust’s `..` range syntax, if you want to start at the first index (zero),
|
||||
you can drop the value before the two periods. In other words, these are equal:
|
||||
|
||||
```rust
|
||||
let s = String::from("hello");
|
||||
|
||||
let slice = &s[0..2];
|
||||
let slice = &s[..2];
|
||||
```
|
||||
|
||||
By the same token, if your slice includes the last byte of the `String`, you
|
||||
can drop the trailing number. That means these are equal:
|
||||
|
||||
```rust
|
||||
let s = String::from("hello");
|
||||
|
||||
let len = s.len();
|
||||
|
||||
let slice = &s[3..len];
|
||||
let slice = &s[3..];
|
||||
```
|
||||
|
||||
You can also drop both values to take a slice of the entire string. So these
|
||||
are equal:
|
||||
|
||||
```rust
|
||||
let s = String::from("hello");
|
||||
|
||||
let len = s.len();
|
||||
|
||||
let slice = &s[0..len];
|
||||
let slice = &s[..];
|
||||
```
|
||||
|
||||
> Note: String slice range indices must occur at valid UTF-8 character
|
||||
> boundaries. If you attempt to create a string slice in the middle of a
|
||||
> multibyte character, your program will exit with an error. For the purposes
|
||||
> of introducing string slices, we are assuming ASCII only in this section; a
|
||||
> more thorough discussion of UTF-8 handling is in the “Strings” section of
|
||||
> Chapter 8.
|
||||
|
||||
With all this information in mind, let’s rewrite `first_word` to return a
|
||||
slice. The type that signifies “string slice” is written as `&str`:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn first_word(s: &String) -> &str {
|
||||
let bytes = s.as_bytes();
|
||||
|
||||
for (i, &item) in bytes.iter().enumerate() {
|
||||
if item == b' ' {
|
||||
return &s[0..i];
|
||||
}
|
||||
}
|
||||
|
||||
&s[..]
|
||||
}
|
||||
```
|
||||
|
||||
We get the index for the end of the word in the same way as we did in Listing
|
||||
4-7, by looking for the first occurrence of a space. When we find a space, we
|
||||
return a string slice using the start of the string and the index of the space
|
||||
as the starting and ending indices.
|
||||
|
||||
Now when we call `first_word`, we get back a single value that is tied to the
|
||||
underlying data. The value is made up of a reference to the starting point of
|
||||
the slice and the number of elements in the slice.
|
||||
|
||||
Returning a slice would also work for a `second_word` function:
|
||||
|
||||
```rust,ignore
|
||||
fn second_word(s: &String) -> &str {
|
||||
```
|
||||
|
||||
We now have a straightforward API that’s much harder to mess up, because the
|
||||
compiler will ensure the references into the `String` remain valid. Remember
|
||||
the bug in the program in Listing 4-8, when we got the index to the end of the
|
||||
first word but then cleared the string so our index was invalid? That code was
|
||||
logically incorrect but didn’t show any immediate errors. The problems would
|
||||
show up later if we kept trying to use the first word index with an emptied
|
||||
string. Slices make this bug impossible and let us know we have a problem with
|
||||
our code much sooner. Using the slice version of `first_word` will throw a
|
||||
compile time error:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let mut s = String::from("hello world");
|
||||
|
||||
let word = first_word(&s);
|
||||
|
||||
s.clear(); // Error!
|
||||
}
|
||||
```
|
||||
|
||||
Here’s the compiler error:
|
||||
|
||||
```text
|
||||
error[E0502]: cannot borrow `s` as mutable because it is also borrowed as immutable
|
||||
--> src/main.rs:6:5
|
||||
|
|
||||
4 | let word = first_word(&s);
|
||||
| - immutable borrow occurs here
|
||||
5 |
|
||||
6 | s.clear(); // Error!
|
||||
| ^ mutable borrow occurs here
|
||||
7 | }
|
||||
| - immutable borrow ends here
|
||||
```
|
||||
|
||||
Recall from the borrowing rules that if we have an immutable reference to
|
||||
something, we cannot also take a mutable reference. Because `clear` needs to
|
||||
truncate the `String`, it tries to take a mutable reference, which fails. Not
|
||||
only has Rust made our API easier to use, but it has also eliminated an entire
|
||||
class of errors at compile time!
|
||||
|
||||
#### String Literals Are Slices
|
||||
|
||||
Recall that we talked about string literals being stored inside the binary. Now
|
||||
that we know about slices, we can properly understand string literals:
|
||||
|
||||
```rust
|
||||
let s = "Hello, world!";
|
||||
```
|
||||
|
||||
The type of `s` here is `&str`: it’s a slice pointing to that specific point of
|
||||
the binary. This is also why string literals are immutable; `&str` is an
|
||||
immutable reference.
|
||||
|
||||
#### String Slices as Parameters
|
||||
|
||||
Knowing that you can take slices of literals and `String`s leads us to one more
|
||||
improvement on `first_word`, and that’s its signature:
|
||||
|
||||
```rust,ignore
|
||||
fn first_word(s: &String) -> &str {
|
||||
```
|
||||
|
||||
A more experienced Rustacean would write the following line instead because it
|
||||
allows us to use the same function on both `String`s and `&str`s:
|
||||
|
||||
```rust,ignore
|
||||
fn first_word(s: &str) -> &str {
|
||||
```
|
||||
|
||||
If we have a string slice, we can pass that directly. If we have a `String`, we
|
||||
can pass a slice of the entire `String`. Defining a function to take a string
|
||||
slice instead of a reference to a `String` makes our API more general and useful
|
||||
without losing any functionality:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# fn first_word(s: &str) -> &str {
|
||||
# let bytes = s.as_bytes();
|
||||
#
|
||||
# for (i, &item) in bytes.iter().enumerate() {
|
||||
# if item == b' ' {
|
||||
# return &s[0..i];
|
||||
# }
|
||||
# }
|
||||
#
|
||||
# &s[..]
|
||||
# }
|
||||
fn main() {
|
||||
let my_string = String::from("hello world");
|
||||
|
||||
// first_word works on slices of `String`s
|
||||
let word = first_word(&my_string[..]);
|
||||
|
||||
let my_string_literal = "hello world";
|
||||
|
||||
// first_word works on slices of string literals
|
||||
let word = first_word(&my_string_literal[..]);
|
||||
|
||||
// Because string literals *are* string slices already,
|
||||
// this works too, without the slice syntax!
|
||||
let word = first_word(my_string_literal);
|
||||
}
|
||||
```
|
||||
|
||||
### Other Slices
|
||||
|
||||
String slices, as you might imagine, are specific to strings. But there’s a
|
||||
more general slice type, too. Consider this array:
|
||||
|
||||
```rust
|
||||
let a = [1, 2, 3, 4, 5];
|
||||
```
|
||||
|
||||
Just as we might want to refer to a part of a string, we might want to refer
|
||||
to part of an array. We’d do so like this:
|
||||
|
||||
```rust
|
||||
let a = [1, 2, 3, 4, 5];
|
||||
|
||||
let slice = &a[1..3];
|
||||
```
|
||||
|
||||
This slice has the type `&[i32]`. It works the same way as string slices do, by
|
||||
storing a reference to the first element and a length. You’ll use this kind of
|
||||
slice for all sorts of other collections. We’ll discuss these collections in
|
||||
detail when we talk about vectors in Chapter 8.
|
||||
|
||||
## Summary
|
||||
|
||||
The concepts of ownership, borrowing, and slices ensure memory safety in Rust
|
||||
programs at compile time. The Rust language gives you control over your memory
|
||||
usage in the same way as other systems programming languages, but having the
|
||||
owner of data automatically clean up that data when the owner goes out of scope
|
||||
means you don’t have to write and debug extra code to get this control.
|
||||
|
||||
Ownership affects how lots of other parts of Rust work, so we’ll talk about
|
||||
these concepts further throughout the rest of the book. Let’s move on to
|
||||
Chapter 5 and look at grouping pieces of data together in a `struct`.
|
||||
11
2018-edition/src/ch05-00-structs.md
Normal file
11
2018-edition/src/ch05-00-structs.md
Normal file
@@ -0,0 +1,11 @@
|
||||
# Using Structs to Structure Related Data
|
||||
|
||||
A *struct*, or *structure*, is a custom data type that lets you name and
|
||||
package together multiple related values that make up a meaningful group. If
|
||||
you’re familiar with an object-oriented language, a *struct* is like an
|
||||
object’s data attributes. In this chapter, we’ll compare and contrast tuples
|
||||
with structs, demonstrate how to use structs, and discuss how to define methods
|
||||
and associated functions to specify behavior associated with a struct’s data.
|
||||
Structs and enums (discussed in Chapter 6) are the building blocks for creating
|
||||
new types in your program’s domain to take full advantage of Rust’s compile
|
||||
time type checking.
|
||||
310
2018-edition/src/ch05-01-defining-structs.md
Normal file
310
2018-edition/src/ch05-01-defining-structs.md
Normal file
@@ -0,0 +1,310 @@
|
||||
## Defining and Instantiating Structs
|
||||
|
||||
Structs are similar to tuples, which were discussed in Chapter 3. Like tuples,
|
||||
the pieces of a struct can be different types. Unlike with tuples, you’ll name
|
||||
each piece of data so it’s clear what the values mean. As a result of these
|
||||
names, structs are more flexible than tuples: you don’t have to rely on the
|
||||
order of the data to specify or access the values of an instance.
|
||||
|
||||
To define a struct, we enter the keyword `struct` and name the entire struct. A
|
||||
struct’s name should describe the significance of the pieces of data being
|
||||
grouped together. Then, inside curly brackets, we define the names and types of
|
||||
the pieces of data, which we call *fields*. For example, Listing 5-1 shows a
|
||||
struct that stores information about a user account:
|
||||
|
||||
```rust
|
||||
struct User {
|
||||
username: String,
|
||||
email: String,
|
||||
sign_in_count: u64,
|
||||
active: bool,
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-1: A `User` struct definition</span>
|
||||
|
||||
To use a struct after we’ve defined it, we create an *instance* of that struct
|
||||
by specifying concrete values for each of the fields. We create an instance by
|
||||
stating the name of the struct and then add curly brackets containing `key:
|
||||
value` pairs, where the keys are the names of the fields and the values are the
|
||||
data we want to store in those fields. We don’t have to specify the fields in
|
||||
the same order in which we declared them in the struct. In other words, the
|
||||
struct definition is like a general template for the type, and instances fill
|
||||
in that template with particular data to create values of the type. For
|
||||
example, we can declare a particular user as shown in Listing 5-2:
|
||||
|
||||
```rust
|
||||
# struct User {
|
||||
# username: String,
|
||||
# email: String,
|
||||
# sign_in_count: u64,
|
||||
# active: bool,
|
||||
# }
|
||||
#
|
||||
let user1 = User {
|
||||
email: String::from("someone@example.com"),
|
||||
username: String::from("someusername123"),
|
||||
active: true,
|
||||
sign_in_count: 1,
|
||||
};
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-2: Creating an instance of the `User`
|
||||
struct</span>
|
||||
|
||||
To get a specific value from a struct, we can use dot notation. If we wanted
|
||||
just this user’s email address, we could use `user1.email` wherever we wanted
|
||||
to use this value. If the instance is mutable, we can change a value by using
|
||||
the dot notation and assigning into a particular field. Listing 5-3 shows how
|
||||
to change the value in the `email` field of a mutable `User` instance:
|
||||
|
||||
```rust
|
||||
# struct User {
|
||||
# username: String,
|
||||
# email: String,
|
||||
# sign_in_count: u64,
|
||||
# active: bool,
|
||||
# }
|
||||
#
|
||||
let mut user1 = User {
|
||||
email: String::from("someone@example.com"),
|
||||
username: String::from("someusername123"),
|
||||
active: true,
|
||||
sign_in_count: 1,
|
||||
};
|
||||
|
||||
user1.email = String::from("anotheremail@example.com");
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-3: Changing the value in the `email` field of a
|
||||
`User` instance</span>
|
||||
|
||||
Note that the entire instance must be mutable; Rust doesn’t allow us to mark
|
||||
only certain fields as mutable.
|
||||
|
||||
As with any expression, we can construct a new instance of the struct as the
|
||||
last expression in the function body to implicitly return that new instance.
|
||||
Listing 5-4 shows a `build_user` function that returns a `User` instance with
|
||||
the given email and username. The `active` field gets the value of `true`, and
|
||||
the `sign_in_count` gets a value of `1`.
|
||||
|
||||
```rust
|
||||
# struct User {
|
||||
# username: String,
|
||||
# email: String,
|
||||
# sign_in_count: u64,
|
||||
# active: bool,
|
||||
# }
|
||||
#
|
||||
fn build_user(email: String, username: String) -> User {
|
||||
User {
|
||||
email: email,
|
||||
username: username,
|
||||
active: true,
|
||||
sign_in_count: 1,
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-4: A `build_user` function that takes an email
|
||||
and username and returns a `User` instance</span>
|
||||
|
||||
It makes sense to name the function parameters with the same name as the struct
|
||||
fields, but having to repeat the `email` and `username` field names and
|
||||
variables is a bit tedious. If the struct had more fields, repeating each name
|
||||
would get even more annoying. Luckily, there’s a convenient shorthand!
|
||||
|
||||
### Using the Field Init Shorthand when Variables and Fields Have the Same Name
|
||||
|
||||
Because the parameter names and the struct field names are exactly the same in
|
||||
Listing 5-4, we can use the *field init shorthand* syntax to rewrite
|
||||
`build_user` so that it behaves exactly the same but doesn’t have the
|
||||
repetition of `email` and `username` as shown in Listing 5-5.
|
||||
|
||||
```rust
|
||||
# struct User {
|
||||
# username: String,
|
||||
# email: String,
|
||||
# sign_in_count: u64,
|
||||
# active: bool,
|
||||
# }
|
||||
#
|
||||
fn build_user(email: String, username: String) -> User {
|
||||
User {
|
||||
email,
|
||||
username,
|
||||
active: true,
|
||||
sign_in_count: 1,
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-5: A `build_user` function that uses field init
|
||||
shorthand because the `email` and `username` parameters have the same name as
|
||||
struct fields</span>
|
||||
|
||||
Here, we’re creating a new instance of the `User` struct, which has a field
|
||||
named `email`. We want to set the `email` field’s value to the value in the
|
||||
`email` parameter of the `build_user` function. Because the `email` field and
|
||||
the `email` parameter have the same name, we only need to write `email` rather
|
||||
than `email: email`.
|
||||
|
||||
### Creating Instances From Other Instances With Struct Update Syntax
|
||||
|
||||
It’s often useful to create a new instance of a struct that uses most of an old
|
||||
instance’s values but changes some. You’ll do this using *struct update syntax*.
|
||||
|
||||
First, Listing 5-6 shows how we create a new `User` instance in `user2` without
|
||||
the update syntax. We set new values for `email` and `username` but otherwise
|
||||
use the same values from `user1` that we created in Listing 5-2:
|
||||
|
||||
```rust
|
||||
# struct User {
|
||||
# username: String,
|
||||
# email: String,
|
||||
# sign_in_count: u64,
|
||||
# active: bool,
|
||||
# }
|
||||
#
|
||||
# let user1 = User {
|
||||
# email: String::from("someone@example.com"),
|
||||
# username: String::from("someusername123"),
|
||||
# active: true,
|
||||
# sign_in_count: 1,
|
||||
# };
|
||||
#
|
||||
let user2 = User {
|
||||
email: String::from("another@example.com"),
|
||||
username: String::from("anotherusername567"),
|
||||
active: user1.active,
|
||||
sign_in_count: user1.sign_in_count,
|
||||
};
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-6: Creating a new `User` instance using some of
|
||||
the values from `user1`</span>
|
||||
|
||||
Using struct update syntax, we can achieve the same effect with less code, as
|
||||
shown in Listing 5-7. The syntax `..` specifies that the remaining fields not
|
||||
explicitly set should have the same value as the fields in the given instance.
|
||||
|
||||
```rust
|
||||
# struct User {
|
||||
# username: String,
|
||||
# email: String,
|
||||
# sign_in_count: u64,
|
||||
# active: bool,
|
||||
# }
|
||||
#
|
||||
# let user1 = User {
|
||||
# email: String::from("someone@example.com"),
|
||||
# username: String::from("someusername123"),
|
||||
# active: true,
|
||||
# sign_in_count: 1,
|
||||
# };
|
||||
#
|
||||
let user2 = User {
|
||||
email: String::from("another@example.com"),
|
||||
username: String::from("anotherusername567"),
|
||||
..user1
|
||||
};
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-7: Using struct update syntax to set new
|
||||
`email` and `username` values for a `User` instance but use the rest of the
|
||||
values from the fields of the instance in the `user1` variable</span>
|
||||
|
||||
The code in Listing 5-7 also creates an instance in `user2` that has a
|
||||
different value for `email` and `username` but has the same values for the
|
||||
`active` and `sign_in_count` fields from `user1`.
|
||||
|
||||
### Tuple Structs without Named Fields to Create Different Types
|
||||
|
||||
You can also define structs that look similar to tuples, called *tuple
|
||||
structs*. Tuple structs have the added meaning the struct name provides but
|
||||
don’t have names associated with their fields; rather, they just have the types
|
||||
of the fields. Tuple structs are useful when you want to give the whole tuple a
|
||||
name and make the tuple be a different type than other tuples, and naming each
|
||||
field as in a regular struct would be verbose or redundant.
|
||||
|
||||
To define a tuple struct start with the `struct` keyword and the struct name
|
||||
followed by the types in the tuple. For example, here are definitions and
|
||||
usages of two tuple structs named `Color` and `Point`:
|
||||
|
||||
```rust
|
||||
struct Color(i32, i32, i32);
|
||||
struct Point(i32, i32, i32);
|
||||
|
||||
let black = Color(0, 0, 0);
|
||||
let origin = Point(0, 0, 0);
|
||||
```
|
||||
|
||||
Note that the `black` and `origin` values are different types, because they’re
|
||||
instances of different tuple structs. Each struct you define is its own type,
|
||||
even though the fields within the struct have the same types. For example, a
|
||||
function that takes a parameter of type `Color` cannot take a `Point` as an
|
||||
argument, even though both types are made up of three `i32` values. Otherwise,
|
||||
tuple struct instances behave like tuples: you can destructure them into their
|
||||
individual pieces, you can use a `.` followed by the index to access an
|
||||
individual value, and so on.
|
||||
|
||||
### Unit-Like Structs Without Any Fields
|
||||
|
||||
You can also define structs that don’t have any fields! These are called
|
||||
*unit-like structs* because they behave similarly to `()`, the unit type.
|
||||
Unit-like structs can be useful in situations in which you need to implement a
|
||||
trait on some type but don’t have any data that you want to store in the type
|
||||
itself. We’ll discuss traits in Chapter 10.
|
||||
|
||||
> ### Ownership of Struct Data
|
||||
>
|
||||
> In the `User` struct definition in Listing 5-1, we used the owned `String`
|
||||
> type rather than the `&str` string slice type. This is a deliberate choice
|
||||
> because we want instances of this struct to own all of its data and for that
|
||||
> data to be valid for as long as the entire struct is valid.
|
||||
>
|
||||
> It’s possible for structs to store references to data owned by something else,
|
||||
> but to do so requires the use of *lifetimes*, a Rust feature that we’ll
|
||||
> discuss in Chapter 10. Lifetimes ensure that the data referenced by a struct
|
||||
> is valid for as long as the struct is. Let’s say you try to store a reference
|
||||
> in a struct without specifying lifetimes, like this, which won’t work:
|
||||
>
|
||||
> <span class="filename">Filename: src/main.rs</span>
|
||||
>
|
||||
> ```rust,ignore
|
||||
> struct User {
|
||||
> username: &str,
|
||||
> email: &str,
|
||||
> sign_in_count: u64,
|
||||
> active: bool,
|
||||
> }
|
||||
>
|
||||
> fn main() {
|
||||
> let user1 = User {
|
||||
> email: "someone@example.com",
|
||||
> username: "someusername123",
|
||||
> active: true,
|
||||
> sign_in_count: 1,
|
||||
> };
|
||||
> }
|
||||
> ```
|
||||
>
|
||||
> The compiler will complain that it needs lifetime specifiers:
|
||||
>
|
||||
> ```text
|
||||
> error[E0106]: missing lifetime specifier
|
||||
> -->
|
||||
> |
|
||||
> 2 | username: &str,
|
||||
> | ^ expected lifetime parameter
|
||||
>
|
||||
> error[E0106]: missing lifetime specifier
|
||||
> -->
|
||||
> |
|
||||
> 3 | email: &str,
|
||||
> | ^ expected lifetime parameter
|
||||
> ```
|
||||
>
|
||||
> In Chapter 10, we’ll discuss how to fix these errors so you can store
|
||||
> references in structs, but for now, we’ll fix errors like these using owned
|
||||
> types like `String` instead of references like `&str`.
|
||||
264
2018-edition/src/ch05-02-example-structs.md
Normal file
264
2018-edition/src/ch05-02-example-structs.md
Normal file
@@ -0,0 +1,264 @@
|
||||
## An Example Program Using Structs
|
||||
|
||||
To understand when we might want to use structs, let’s write a program that
|
||||
calculates the area of a rectangle. We’ll start with single variables, and then
|
||||
refactor the program until we’re using structs instead.
|
||||
|
||||
Let’s make a new binary project with Cargo called *rectangles* that will take
|
||||
the width and height of a rectangle specified in pixels and calculate the area
|
||||
of the rectangle. Listing 5-8 shows a short program with one way of doing
|
||||
exactly that in our project’s *src/main.rs*:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let width1 = 30;
|
||||
let height1 = 50;
|
||||
|
||||
println!(
|
||||
"The area of the rectangle is {} square pixels.",
|
||||
area(width1, height1)
|
||||
);
|
||||
}
|
||||
|
||||
fn area(width: u32, height: u32) -> u32 {
|
||||
width * height
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-8: Calculating the area of a rectangle
|
||||
specified by separate width and height variables</span>
|
||||
|
||||
Now, run this program using `cargo run`:
|
||||
|
||||
```text
|
||||
The area of the rectangle is 1500 square pixels.
|
||||
```
|
||||
|
||||
Even though Listing 5-8 works and figures out the area of the rectangle by
|
||||
calling the `area` function with each dimension, we can do better. The width
|
||||
and the height are related to each other because together they describe one
|
||||
rectangle.
|
||||
|
||||
The issue with this code is evident in the signature of `area`:
|
||||
|
||||
```rust,ignore
|
||||
fn area(width: u32, height: u32) -> u32 {
|
||||
```
|
||||
|
||||
The `area` function is supposed to calculate the area of one rectangle, but the
|
||||
function we wrote has two parameters. The parameters are related, but that’s
|
||||
not expressed anywhere in our program. It would be more readable and more
|
||||
manageable to group width and height together. We’ve already discussed one way
|
||||
we might do that in “The Tuple Type” section of Chapter 3: by using tuples.
|
||||
|
||||
### Refactoring with Tuples
|
||||
|
||||
Listing 5-9 shows another version of our program that uses tuples:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let rect1 = (30, 50);
|
||||
|
||||
println!(
|
||||
"The area of the rectangle is {} square pixels.",
|
||||
area(rect1)
|
||||
);
|
||||
}
|
||||
|
||||
fn area(dimensions: (u32, u32)) -> u32 {
|
||||
dimensions.0 * dimensions.1
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-9: Specifying the width and height of the
|
||||
rectangle with a tuple</span>
|
||||
|
||||
In one way, this program is better. Tuples let us add a bit of structure, and
|
||||
we’re now passing just one argument. But in another way, this version is less
|
||||
clear: tuples don’t name their elements, so our calculation has become more
|
||||
confusing because we have to index into the parts of the tuple.
|
||||
|
||||
It doesn’t matter if we mix up width and height for the area calculation, but
|
||||
if we want to draw the rectangle on the screen, it would matter! We would have
|
||||
to keep in mind that `width` is the tuple index `0` and `height` is the tuple
|
||||
index `1`. If someone else worked on this code, they would have to figure this
|
||||
out and keep it in mind as well. It would be easy to forget or mix up these
|
||||
values and cause errors, because we haven’t conveyed the meaning of our data in
|
||||
our code.
|
||||
|
||||
### Refactoring with Structs: Adding More Meaning
|
||||
|
||||
We use structs to add meaning by labeling the data. We can transform the tuple
|
||||
we’re using into a data type with a name for the whole as well as names for the
|
||||
parts, as shown in Listing 5-10:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct Rectangle {
|
||||
width: u32,
|
||||
height: u32,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let rect1 = Rectangle { width: 30, height: 50 };
|
||||
|
||||
println!(
|
||||
"The area of the rectangle is {} square pixels.",
|
||||
area(&rect1)
|
||||
);
|
||||
}
|
||||
|
||||
fn area(rectangle: &Rectangle) -> u32 {
|
||||
rectangle.width * rectangle.height
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-10: Defining a `Rectangle` struct</span>
|
||||
|
||||
Here we’ve defined a struct and named it `Rectangle`. Inside the curly
|
||||
brackets, we defined the fields as `width` and `height`, both of which have
|
||||
type `u32`. Then in `main`, we created a particular instance of `Rectangle`
|
||||
that has a width of 30 and a height of 50.
|
||||
|
||||
Our `area` function is now defined with one parameter, which we’ve named
|
||||
`rectangle`, whose type is an immutable borrow of a struct `Rectangle`
|
||||
instance. As mentioned in Chapter 4, we want to borrow the struct rather than
|
||||
take ownership of it. This way, `main` retains its ownership and can continue
|
||||
using `rect1`, which is the reason we use the `&` in the function signature and
|
||||
where we call the function.
|
||||
|
||||
The `area` function accesses the `width` and `height` fields of the `Rectangle`
|
||||
instance. Our function signature for `area` now says exactly what we mean:
|
||||
calculate the area of `Rectangle`, using its `width` and `height` fields. This
|
||||
conveys that the width and height are related to each other, and it gives
|
||||
descriptive names to the values rather than using the tuple index values of `0`
|
||||
and `1`. This is a win for clarity.
|
||||
|
||||
### Adding Useful Functionality with Derived Traits
|
||||
|
||||
It’d be nice to be able to print an instance of `Rectangle` while we’re
|
||||
debugging our program and see the values for all its fields. Listing 5-11 tries
|
||||
using the `println!` macro as we have used in previous chapters. This won’t
|
||||
work, however:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
struct Rectangle {
|
||||
width: u32,
|
||||
height: u32,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let rect1 = Rectangle { width: 30, height: 50 };
|
||||
|
||||
println!("rect1 is {}", rect1);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-11: Attempting to print a `Rectangle`
|
||||
instance</span>
|
||||
|
||||
When we run this code, we get an error with this core message:
|
||||
|
||||
```text
|
||||
error[E0277]: the trait bound `Rectangle: std::fmt::Display` is not satisfied
|
||||
```
|
||||
|
||||
The `println!` macro can do many kinds of formatting, and by default, curly
|
||||
brackets tell `println!` to use formatting known as `Display`: output intended
|
||||
for direct end user consumption. The primitive types we’ve seen so far
|
||||
implement `Display` by default, because there’s only one way you’d want to show
|
||||
a `1` or any other primitive type to a user. But with structs, the way
|
||||
`println!` should format the output is less clear because there are more
|
||||
display possibilities: Do you want commas or not? Do you want to print the
|
||||
curly brackets? Should all the fields be shown? Due to this ambiguity, Rust
|
||||
doesn’t try to guess what we want, and structs don’t have a provided
|
||||
implementation of `Display`.
|
||||
|
||||
If we continue reading the errors, we’ll find this helpful note:
|
||||
|
||||
```text
|
||||
`Rectangle` cannot be formatted with the default formatter; try using
|
||||
`:?` instead if you are using a format string
|
||||
```
|
||||
|
||||
Let’s try it! The `println!` macro call will now look like `println!("rect1 is
|
||||
{:?}", rect1);`. Putting the specifier `:?` inside the curly brackets tells
|
||||
`println!` we want to use an output format called `Debug`. `Debug` is a trait
|
||||
that enables us to print our struct in a way that is useful for developers so
|
||||
we can see its value while we’re debugging our code.
|
||||
|
||||
Run the code with this change. Drat! We still get an error:
|
||||
|
||||
```text
|
||||
error[E0277]: the trait bound `Rectangle: std::fmt::Debug` is not satisfied
|
||||
```
|
||||
|
||||
But again, the compiler gives us a helpful note:
|
||||
|
||||
```text
|
||||
`Rectangle` cannot be formatted using `:?`; if it is defined in your
|
||||
crate, add `#[derive(Debug)]` or manually implement it
|
||||
```
|
||||
|
||||
Rust *does* include functionality to print out debugging information, but we
|
||||
have to explicitly opt in to make that functionality available for our struct.
|
||||
To do that, we add the annotation `#[derive(Debug)]` just before the struct
|
||||
definition, as shown in Listing 5-12:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
#[derive(Debug)]
|
||||
struct Rectangle {
|
||||
width: u32,
|
||||
height: u32,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let rect1 = Rectangle { width: 30, height: 50 };
|
||||
|
||||
println!("rect1 is {:?}", rect1);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-12: Adding the annotation to derive the `Debug`
|
||||
trait and printing the `Rectangle` instance using debug formatting</span>
|
||||
|
||||
Now when we run the program, we won’t get any errors, and we’ll see the
|
||||
following output:
|
||||
|
||||
```text
|
||||
rect1 is Rectangle { width: 30, height: 50 }
|
||||
```
|
||||
|
||||
Nice! It’s not the prettiest output, but it shows the values of all the fields
|
||||
for this instance, which would definitely help during debugging. When we have
|
||||
larger structs, it’s useful to have output that’s a bit easier to read; in
|
||||
those cases, we can use `{:#?}` instead of `{:?}` in the `println!` string.
|
||||
When we use the `{:#?}` style in the example, the output will look like this:
|
||||
|
||||
```text
|
||||
rect1 is Rectangle {
|
||||
width: 30,
|
||||
height: 50
|
||||
}
|
||||
```
|
||||
|
||||
Rust has provided a number of traits for us to use with the `derive` annotation
|
||||
that can add useful behavior to our custom types. Those traits and their
|
||||
behaviors are listed in Appendix C, “Derivable Traits.” We’ll cover how to
|
||||
implement these traits with custom behavior as well as how to create your own
|
||||
traits in Chapter 10.
|
||||
|
||||
Our `area` function is very specific: it only computes the area of rectangles.
|
||||
It would be helpful to tie this behavior more closely to our `Rectangle`
|
||||
struct, because it won’t work with any other type. Let’s look at how we can
|
||||
continue to refactor this code by turning the `area` function into an `area`
|
||||
*method* defined on our `Rectangle` type.
|
||||
276
2018-edition/src/ch05-03-method-syntax.md
Normal file
276
2018-edition/src/ch05-03-method-syntax.md
Normal file
@@ -0,0 +1,276 @@
|
||||
## Method Syntax
|
||||
|
||||
*Methods* are similar to functions: they’re declared with the `fn` keyword and
|
||||
their name, they can have parameters and a return value, and they contain some
|
||||
code that is run when they’re called from somewhere else. However, methods are
|
||||
different from functions in that they’re defined within the context of a struct
|
||||
(or an enum or a trait object, which we cover in Chapters 6 and 17,
|
||||
respectively), and their first parameter is always `self`, which represents the
|
||||
instance of the struct the method is being called on.
|
||||
|
||||
### Defining Methods
|
||||
|
||||
Let’s change the `area` function that has a `Rectangle` instance as a parameter
|
||||
and instead make an `area` method defined on the `Rectangle` struct, as shown
|
||||
in Listing 5-13:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
#[derive(Debug)]
|
||||
struct Rectangle {
|
||||
width: u32,
|
||||
height: u32,
|
||||
}
|
||||
|
||||
impl Rectangle {
|
||||
fn area(&self) -> u32 {
|
||||
self.width * self.height
|
||||
}
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let rect1 = Rectangle { width: 30, height: 50 };
|
||||
|
||||
println!(
|
||||
"The area of the rectangle is {} square pixels.",
|
||||
rect1.area()
|
||||
);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-13: Defining an `area` method on the
|
||||
`Rectangle` struct</span>
|
||||
|
||||
To define the function within the context of `Rectangle`, we start an `impl`
|
||||
(implementation) block. Then we move the `area` function within the `impl`
|
||||
curly brackets and change the first (and in this case, only) parameter to be
|
||||
`self` in the signature and everywhere within the body. In `main`, where we
|
||||
called the `area` function and passed `rect1` as an argument, we can instead
|
||||
use *method syntax* to call the `area` method on our `Rectangle` instance.
|
||||
The method syntax goes after an instance: we add a dot followed by the method
|
||||
name, parentheses, and any arguments.
|
||||
|
||||
In the signature for `area`, we use `&self` instead of `rectangle: &Rectangle`
|
||||
because Rust knows the type of `self` is `Rectangle` due to this method’s being
|
||||
inside the `impl Rectangle` context. Note that we still need to use the `&`
|
||||
before `self`, just as we did in `&Rectangle`. Methods can take ownership of
|
||||
`self`, borrow `self` immutably as we’ve done here, or borrow `self` mutably,
|
||||
just as they can any other parameter.
|
||||
|
||||
We’ve chosen `&self` here for the same reason we used `&Rectangle` in the
|
||||
function version: we don’t want to take ownership, and we just want to read the
|
||||
data in the struct, not write to it. If we wanted to change the instance that
|
||||
we’ve called the method on as part of what the method does, we’d use `&mut
|
||||
self` as the first parameter. Having a method that takes ownership of the
|
||||
instance by using just `self` as the first parameter is rare; this technique is
|
||||
usually used when the method transforms `self` into something else and you want
|
||||
to prevent the caller from using the original instance after the transformation.
|
||||
|
||||
The main benefit of using methods instead of functions, in addition to using
|
||||
method syntax and not having to repeat the type of `self` in every method’s
|
||||
signature, is for organization. We’ve put all the things we can do with an
|
||||
instance of a type in one `impl` block rather than making future users of our
|
||||
code search for capabilities of `Rectangle` in various places in the library we
|
||||
provide.
|
||||
|
||||
> ### Where’s the `->` Operator?
|
||||
>
|
||||
> In C and C++, two different operators are used for calling methods: you use
|
||||
> `.` if you’re calling a method on the object directly and `->` if you’re
|
||||
> calling the method on a pointer to the object and need to dereference the
|
||||
> pointer first. In other words, if `object` is a pointer,
|
||||
> `object->something()` is similar to `(*object).something()`.
|
||||
>
|
||||
> Rust doesn’t have an equivalent to the `->` operator; instead, Rust has a
|
||||
> feature called *automatic referencing and dereferencing*. Calling methods is
|
||||
> one of the few places in Rust that has this behavior.
|
||||
>
|
||||
> Here’s how it works: when you call a method with `object.something()`, Rust
|
||||
> automatically adds in `&`, `&mut`, or `*` so `object` matches the signature of
|
||||
> the method. In other words, the following are the same:
|
||||
>
|
||||
> ```rust
|
||||
> # #[derive(Debug,Copy,Clone)]
|
||||
> # struct Point {
|
||||
> # x: f64,
|
||||
> # y: f64,
|
||||
> # }
|
||||
> #
|
||||
> # impl Point {
|
||||
> # fn distance(&self, other: &Point) -> f64 {
|
||||
> # let x_squared = f64::powi(other.x - self.x, 2);
|
||||
> # let y_squared = f64::powi(other.y - self.y, 2);
|
||||
> #
|
||||
> # f64::sqrt(x_squared + y_squared)
|
||||
> # }
|
||||
> # }
|
||||
> # let p1 = Point { x: 0.0, y: 0.0 };
|
||||
> # let p2 = Point { x: 5.0, y: 6.5 };
|
||||
> p1.distance(&p2);
|
||||
> (&p1).distance(&p2);
|
||||
> ```
|
||||
>
|
||||
> The first one looks much cleaner. This automatic referencing behavior works
|
||||
> because methods have a clear receiver—the type of `self`. Given the receiver
|
||||
> and name of a method, Rust can figure out definitively whether the method is
|
||||
> reading (`&self`), mutating (`&mut self`), or consuming (`self`). The fact
|
||||
> that Rust makes borrowing implicit for method receivers is a big part of
|
||||
> making ownership ergonomic in practice.
|
||||
|
||||
### Methods with More Parameters
|
||||
|
||||
Let’s practice using methods by implementing a second method on the `Rectangle`
|
||||
struct. This time, we want an instance of `Rectangle` to take another instance
|
||||
of `Rectangle` and return `true` if the second `Rectangle` can fit completely
|
||||
within `self`; otherwise it should return `false`. That is, we want to be able
|
||||
to write the program shown in Listing 5-14, once we’ve defined the `can_hold`
|
||||
method:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let rect1 = Rectangle { width: 30, height: 50 };
|
||||
let rect2 = Rectangle { width: 10, height: 40 };
|
||||
let rect3 = Rectangle { width: 60, height: 45 };
|
||||
|
||||
println!("Can rect1 hold rect2? {}", rect1.can_hold(&rect2));
|
||||
println!("Can rect1 hold rect3? {}", rect1.can_hold(&rect3));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-14: Using the as-yet-unwritten `can_hold`
|
||||
method</span>
|
||||
|
||||
And the expected output would look like the following, because both dimensions
|
||||
of `rect2` are smaller than the dimensions of `rect1` but `rect3` is wider than
|
||||
`rect1`:
|
||||
|
||||
```text
|
||||
Can rect1 hold rect2? true
|
||||
Can rect1 hold rect3? false
|
||||
```
|
||||
|
||||
We know we want to define a method, so it will be within the `impl Rectangle`
|
||||
block. The method name will be `can_hold`, and it will take an immutable borrow
|
||||
of another `Rectangle` as a parameter. We can tell what the type of the
|
||||
parameter will be by looking at the code that calls the method:
|
||||
`rect1.can_hold(&rect2)` passes in `&rect2`, which is an immutable borrow to
|
||||
`rect2`, an instance of `Rectangle`. This makes sense because we only need to
|
||||
read `rect2` (rather than write, which would mean we’d need a mutable borrow),
|
||||
and we want `main` to retain ownership of `rect2` so we can use it again after
|
||||
calling the `can_hold` method. The return value of `can_hold` will be a
|
||||
Boolean, and the implementation will check whether the width and height of
|
||||
`self` are both greater than the width and height of the other `Rectangle`,
|
||||
respectively. Let’s add the new `can_hold` method to the `impl` block from
|
||||
Listing 5-13, shown in Listing 5-15:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# #[derive(Debug)]
|
||||
# struct Rectangle {
|
||||
# width: u32,
|
||||
# height: u32,
|
||||
# }
|
||||
#
|
||||
impl Rectangle {
|
||||
fn area(&self) -> u32 {
|
||||
self.width * self.height
|
||||
}
|
||||
|
||||
fn can_hold(&self, other: &Rectangle) -> bool {
|
||||
self.width > other.width && self.height > other.height
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-15: Implementing the `can_hold` method on
|
||||
`Rectangle` that takes another `Rectangle` instance as a parameter</span>
|
||||
|
||||
When we run this code with the `main` function in Listing 5-14, we’ll get our
|
||||
desired output. Methods can take multiple parameters that we add to the
|
||||
signature after the `self` parameter, and those parameters work just like
|
||||
parameters in functions.
|
||||
|
||||
### Associated Functions
|
||||
|
||||
Another useful feature of `impl` blocks is that we’re allowed to define
|
||||
functions within `impl` blocks that *don’t* take `self` as a parameter. These
|
||||
are called *associated functions* because they’re associated with the struct.
|
||||
They’re still functions, not methods, because they don’t have an instance of
|
||||
the struct to work with. You’ve already used the `String::from` associated
|
||||
function.
|
||||
|
||||
Associated functions are often used for constructors that will return a new
|
||||
instance of the struct. For example, we could provide an associated function
|
||||
that would have one dimension parameter and use that as both width and height,
|
||||
thus making it easier to create a square `Rectangle` rather than having to
|
||||
specify the same value twice:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# #[derive(Debug)]
|
||||
# struct Rectangle {
|
||||
# width: u32,
|
||||
# height: u32,
|
||||
# }
|
||||
#
|
||||
impl Rectangle {
|
||||
fn square(size: u32) -> Rectangle {
|
||||
Rectangle { width: size, height: size }
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
To call this associated function, we use the `::` syntax with the struct name;
|
||||
`let sq = Rectangle::square(3);` is an example. This function is namespaced by
|
||||
the struct: the `::` syntax is used for both associated functions and
|
||||
namespaces created by modules. We’ll discuss modules in Chapter 7.
|
||||
|
||||
### Multiple `impl` Blocks
|
||||
|
||||
Each struct is allowed to have multiple `impl` blocks. For example, Listing
|
||||
5-15 is equivalent to the code shown in Listing 5-16, which has each method
|
||||
in its own `impl` block:
|
||||
|
||||
```rust
|
||||
# #[derive(Debug)]
|
||||
# struct Rectangle {
|
||||
# width: u32,
|
||||
# height: u32,
|
||||
# }
|
||||
#
|
||||
impl Rectangle {
|
||||
fn area(&self) -> u32 {
|
||||
self.width * self.height
|
||||
}
|
||||
}
|
||||
|
||||
impl Rectangle {
|
||||
fn can_hold(&self, other: &Rectangle) -> bool {
|
||||
self.width > other.width && self.height > other.height
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 5-16: Rewriting Listing 5-15 using multiple `impl`
|
||||
blocks</span>
|
||||
|
||||
There’s no reason to separate these methods into multiple `impl` blocks here,
|
||||
but this is valid syntax. We’ll see a case in which multiple `impl` blocks are
|
||||
useful in Chapter 10 where we discuss generic types and traits.
|
||||
|
||||
## Summary
|
||||
|
||||
Structs let you create custom types that are meaningful for your domain. By
|
||||
using structs, you can keep associated pieces of data connected to each other
|
||||
and name each piece to make your code clear. Methods let you specify the
|
||||
behavior that instances of your structs have, and associated functions let you
|
||||
namespace functionality that is particular to your struct without having an
|
||||
instance available.
|
||||
|
||||
But structs aren’t the only way you can create custom types: let’s turn to
|
||||
Rust’s enum feature to add another tool to your toolbox.
|
||||
15
2018-edition/src/ch06-00-enums.md
Normal file
15
2018-edition/src/ch06-00-enums.md
Normal file
@@ -0,0 +1,15 @@
|
||||
# Enums and Pattern Matching
|
||||
|
||||
In this chapter we’ll look at *enumerations*, also referred to as *enums*.
|
||||
Enums allow you to define a type by enumerating its possible values. First,
|
||||
we’ll define and use an enum to show how an enum can encode meaning along with
|
||||
data. Next, we’ll explore a particularly useful enum, called `Option`, which
|
||||
expresses that a value can be either something or nothing. Then we’ll look at
|
||||
how pattern matching in the `match` expression makes it easy to run different
|
||||
code for different values of an enum. Finally, we’ll cover how the `if let`
|
||||
construct is another convenient and concise idiom available to you to handle
|
||||
enums in your code.
|
||||
|
||||
Enums are a feature in many languages, but their capabilities differ in each
|
||||
language. Rust’s enums are most similar to *algebraic data types* in functional
|
||||
languages, such as F#, OCaml, and Haskell.
|
||||
399
2018-edition/src/ch06-01-defining-an-enum.md
Normal file
399
2018-edition/src/ch06-01-defining-an-enum.md
Normal file
@@ -0,0 +1,399 @@
|
||||
## Defining an Enum
|
||||
|
||||
Let’s look at a situation we might want to express in code and see why enums
|
||||
are useful and more appropriate than structs in this case. Say we need to work
|
||||
with IP addresses. Currently, two major standards are used for IP addresses:
|
||||
version four and version six. These are the only possibilities for an IP
|
||||
address that our program will come across: we can *enumerate* all possible
|
||||
values, which is where enumeration gets its name.
|
||||
|
||||
Any IP address can be either a version four or a version six address, but not
|
||||
both at the same time. That property of IP addresses makes the enum data
|
||||
structure appropriate, because enum values can only be one of the variants.
|
||||
Both version four and version six addresses are still fundamentally IP
|
||||
addresses, so they should be treated as the same type when the code is handling
|
||||
situations that apply to any kind of IP address.
|
||||
|
||||
We can express this concept in code by defining an `IpAddrKind` enumeration and
|
||||
listing the possible kinds an IP address can be, `V4` and `V6`. These are known
|
||||
as the *variants* of the enum:
|
||||
|
||||
```rust
|
||||
enum IpAddrKind {
|
||||
V4,
|
||||
V6,
|
||||
}
|
||||
```
|
||||
|
||||
`IpAddrKind` is now a custom data type that we can use elsewhere in our code.
|
||||
|
||||
### Enum Values
|
||||
|
||||
We can create instances of each of the two variants of `IpAddrKind` like this:
|
||||
|
||||
```rust
|
||||
# enum IpAddrKind {
|
||||
# V4,
|
||||
# V6,
|
||||
# }
|
||||
#
|
||||
let four = IpAddrKind::V4;
|
||||
let six = IpAddrKind::V6;
|
||||
```
|
||||
|
||||
Note that the variants of the enum are namespaced under its identifier, and we
|
||||
use a double colon to separate the two. The reason this is useful is that now
|
||||
both values `IpAddrKind::V4` and `IpAddrKind::V6` are of the same type:
|
||||
`IpAddrKind`. We can then, for instance, define a function that takes any
|
||||
`IpAddrKind`:
|
||||
|
||||
```rust
|
||||
# enum IpAddrKind {
|
||||
# V4,
|
||||
# V6,
|
||||
# }
|
||||
#
|
||||
fn route(ip_type: IpAddrKind) { }
|
||||
```
|
||||
|
||||
And we can call this function with either variant:
|
||||
|
||||
```rust
|
||||
# enum IpAddrKind {
|
||||
# V4,
|
||||
# V6,
|
||||
# }
|
||||
#
|
||||
# fn route(ip_type: IpAddrKind) { }
|
||||
#
|
||||
route(IpAddrKind::V4);
|
||||
route(IpAddrKind::V6);
|
||||
```
|
||||
|
||||
Using enums has even more advantages. Thinking more about our IP address type,
|
||||
at the moment we don’t have a way to store the actual IP address *data*; we
|
||||
only know what *kind* it is. Given that you just learned about structs in
|
||||
Chapter 5, you might tackle this problem as shown in Listing 6-1:
|
||||
|
||||
```rust
|
||||
enum IpAddrKind {
|
||||
V4,
|
||||
V6,
|
||||
}
|
||||
|
||||
struct IpAddr {
|
||||
kind: IpAddrKind,
|
||||
address: String,
|
||||
}
|
||||
|
||||
let home = IpAddr {
|
||||
kind: IpAddrKind::V4,
|
||||
address: String::from("127.0.0.1"),
|
||||
};
|
||||
|
||||
let loopback = IpAddr {
|
||||
kind: IpAddrKind::V6,
|
||||
address: String::from("::1"),
|
||||
};
|
||||
```
|
||||
|
||||
<span class="caption">Listing 6-1: Storing the data and `IpAddrKind` variant of
|
||||
an IP address using a `struct`</span>
|
||||
|
||||
Here, we’ve defined a struct `IpAddr` that has two fields: a `kind` field that
|
||||
is of type `IpAddrKind` (the enum we defined previously) and an `address` field
|
||||
of type `String`. We have two instances of this struct. The first, `home`, has
|
||||
the value `IpAddrKind::V4` as its `kind` with associated address data of
|
||||
`127.0.0.1`. The second instance, `loopback`, has the other variant of
|
||||
`IpAddrKind` as its `kind` value, `V6`, and has address `::1` associated with
|
||||
it. We’ve used a struct to bundle the `kind` and `address` values together, so
|
||||
now the variant is associated with the value.
|
||||
|
||||
We can represent the same concept in a more concise way using just an enum,
|
||||
rather than an enum inside a struct, by putting data directly into each enum
|
||||
variant. This new definition of the `IpAddr` enum says that both `V4` and `V6`
|
||||
variants will have associated `String` values:
|
||||
|
||||
```rust
|
||||
enum IpAddr {
|
||||
V4(String),
|
||||
V6(String),
|
||||
}
|
||||
|
||||
let home = IpAddr::V4(String::from("127.0.0.1"));
|
||||
|
||||
let loopback = IpAddr::V6(String::from("::1"));
|
||||
```
|
||||
|
||||
We attach data to each variant of the enum directly, so there is no need for an
|
||||
extra struct.
|
||||
|
||||
There’s another advantage to using an enum rather than a struct: each variant
|
||||
can have different types and amounts of associated data. Version four type IP
|
||||
addresses will always have four numeric components that will have values
|
||||
between 0 and 255. If we wanted to store `V4` addresses as four `u8` values but
|
||||
still express `V6` addresses as one `String` value, we wouldn’t be able to with
|
||||
a struct. Enums handle this case with ease:
|
||||
|
||||
```rust
|
||||
enum IpAddr {
|
||||
V4(u8, u8, u8, u8),
|
||||
V6(String),
|
||||
}
|
||||
|
||||
let home = IpAddr::V4(127, 0, 0, 1);
|
||||
|
||||
let loopback = IpAddr::V6(String::from("::1"));
|
||||
```
|
||||
|
||||
We’ve shown several different ways to define data structures to store version
|
||||
four and version six IP addresses. However, as it turns out, wanting to store
|
||||
IP addresses and encode which kind they are is so common that [the standard
|
||||
library has a definition we can use!][IpAddr]<!-- ignore --> Let’s look at how
|
||||
the standard library defines `IpAddr`: it has the exact enum and variants that
|
||||
we’ve defined and used, but it embeds the address data inside the variants in
|
||||
the form of two different structs, which are defined differently for each
|
||||
variant:
|
||||
|
||||
[IpAddr]: ../../std/net/enum.IpAddr.html
|
||||
|
||||
```rust
|
||||
struct Ipv4Addr {
|
||||
// --snip--
|
||||
}
|
||||
|
||||
struct Ipv6Addr {
|
||||
// --snip--
|
||||
}
|
||||
|
||||
enum IpAddr {
|
||||
V4(Ipv4Addr),
|
||||
V6(Ipv6Addr),
|
||||
}
|
||||
```
|
||||
|
||||
This code illustrates that you can put any kind of data inside an enum variant:
|
||||
strings, numeric types, or structs, for example. You can even include another
|
||||
enum! Also, standard library types are often not much more complicated than
|
||||
what you might come up with.
|
||||
|
||||
Note that even though the standard library contains a definition for `IpAddr`,
|
||||
we can still create and use our own definition without conflict because we
|
||||
haven’t brought the standard library’s definition into our scope. We’ll talk
|
||||
more about bringing types into scope in Chapter 7.
|
||||
|
||||
Let’s look at another example of an enum in Listing 6-2: this one has a wide
|
||||
variety of types embedded in its variants:
|
||||
|
||||
```rust
|
||||
enum Message {
|
||||
Quit,
|
||||
Move { x: i32, y: i32 },
|
||||
Write(String),
|
||||
ChangeColor(i32, i32, i32),
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 6-2: A `Message` enum whose variants each store
|
||||
different amounts and types of values</span>
|
||||
|
||||
This enum has four variants with different types:
|
||||
|
||||
* `Quit` has no data associated with it at all.
|
||||
* `Move` includes an anonymous struct inside it.
|
||||
* `Write` includes a single `String`.
|
||||
* `ChangeColor` includes three `i32` values.
|
||||
|
||||
Defining an enum with variants like the ones in Listing 6-2 is similar to
|
||||
defining different kinds of struct definitions, except the enum doesn’t use the
|
||||
`struct` keyword and all the variants are grouped together under the `Message`
|
||||
type. The following structs could hold the same data that the preceding enum
|
||||
variants hold:
|
||||
|
||||
```rust
|
||||
struct QuitMessage; // unit struct
|
||||
struct MoveMessage {
|
||||
x: i32,
|
||||
y: i32,
|
||||
}
|
||||
struct WriteMessage(String); // tuple struct
|
||||
struct ChangeColorMessage(i32, i32, i32); // tuple struct
|
||||
```
|
||||
|
||||
But if we used the different structs, which each have their own type, we
|
||||
couldn’t as easily define a function to take any of these kinds of messages as
|
||||
we could with the `Message` enum defined in Listing 6-2, which is a single type.
|
||||
|
||||
There is one more similarity between enums and structs: just as we’re able to
|
||||
define methods on structs using `impl`, we’re also able to define methods on
|
||||
enums. Here’s a method named `call` that we could define on our `Message` enum:
|
||||
|
||||
```rust
|
||||
# enum Message {
|
||||
# Quit,
|
||||
# Move { x: i32, y: i32 },
|
||||
# Write(String),
|
||||
# ChangeColor(i32, i32, i32),
|
||||
# }
|
||||
#
|
||||
impl Message {
|
||||
fn call(&self) {
|
||||
// method body would be defined here
|
||||
}
|
||||
}
|
||||
|
||||
let m = Message::Write(String::from("hello"));
|
||||
m.call();
|
||||
```
|
||||
|
||||
The body of the method would use `self` to get the value that we called the
|
||||
method on. In this example, we’ve created a variable `m` that has the value
|
||||
`Message::Write(String::from("hello"))`, and that is what `self` will be in the
|
||||
body of the `call` method when `m.call()` runs.
|
||||
|
||||
Let’s look at another enum in the standard library that is very common and
|
||||
useful: `Option`.
|
||||
|
||||
### The `Option` Enum and Its Advantages Over Null Values
|
||||
|
||||
In the previous section, we looked at how the `IpAddr` enum let us use Rust’s
|
||||
type system to encode more information than just the data into our program.
|
||||
This section explores a case study of `Option`, which is another enum defined
|
||||
by the standard library. The `Option` type is used in many places because it
|
||||
encodes the very common scenario in which a value could be something or it
|
||||
could be nothing. Expressing this concept in terms of the type system means the
|
||||
compiler can check whether you’ve handled all the cases you should be handling;
|
||||
this functionality can prevent bugs that are extremely common in other
|
||||
programming languages.
|
||||
|
||||
Programming language design is often thought of in terms of which features you
|
||||
include, but the features you exclude are important too. Rust doesn’t have the
|
||||
null feature that many other languages have. *Null* is a value that means there
|
||||
is no value there. In languages with null, variables can always be in one of
|
||||
two states: null or not-null.
|
||||
|
||||
In his 2009 presentation “Null References: The Billion Dollar Mistake,” Tony
|
||||
Hoare, the inventor of null, has this to say:
|
||||
|
||||
> I call it my billion-dollar mistake. At that time, I was designing the first
|
||||
> comprehensive type system for references in an object-oriented language. My
|
||||
> goal was to ensure that all use of references should be absolutely safe, with
|
||||
> checking performed automatically by the compiler. But I couldn’t resist the
|
||||
> temptation to put in a null reference, simply because it was so easy to
|
||||
> implement. This has led to innumerable errors, vulnerabilities, and system
|
||||
> crashes, which have probably caused a billion dollars of pain and damage in
|
||||
> the last forty years.
|
||||
|
||||
The problem with null values is that if you try to use a null value as a
|
||||
not-null value, you’ll get an error of some kind. Because this null or not-null
|
||||
property is pervasive, it’s extremely easy to make this kind of error.
|
||||
|
||||
However, the concept that null is trying to express is still a useful one: a
|
||||
null is a value that is currently invalid or absent for some reason.
|
||||
|
||||
The problem isn’t really with the concept but with the particular
|
||||
implementation. As such, Rust does not have nulls, but it does have an enum
|
||||
that can encode the concept of a value being present or absent. This enum is
|
||||
`Option<T>`, and it is [defined by the standard library][option]<!-- ignore -->
|
||||
as follows:
|
||||
|
||||
[option]: ../../std/option/enum.Option.html
|
||||
|
||||
```rust
|
||||
enum Option<T> {
|
||||
Some(T),
|
||||
None,
|
||||
}
|
||||
```
|
||||
|
||||
The `Option<T>` enum is so useful that it’s even included in the prelude; you
|
||||
don’t need to bring it into scope explicitly. In addition, so are its variants:
|
||||
you can use `Some` and `None` directly without the `Option::` prefix. The
|
||||
`Option<T>` enum is still just a regular enum, and `Some(T)` and `None` are
|
||||
still variants of type `Option<T>`.
|
||||
|
||||
The `<T>` syntax is a feature of Rust we haven’t talked about yet. It’s a
|
||||
generic type parameter, and we’ll cover generics in more detail in Chapter 10.
|
||||
For now, all you need to know is that `<T>` means the `Some` variant of the
|
||||
`Option` enum can hold one piece of data of any type. Here are some examples of
|
||||
using `Option` values to hold number types and string types:
|
||||
|
||||
```rust
|
||||
let some_number = Some(5);
|
||||
let some_string = Some("a string");
|
||||
|
||||
let absent_number: Option<i32> = None;
|
||||
```
|
||||
|
||||
If we use `None` rather than `Some`, we need to tell Rust what type of
|
||||
`Option<T>` we have, because the compiler can’t infer the type that the `Some`
|
||||
variant will hold by looking only at a `None` value.
|
||||
|
||||
When we have a `Some` value, we know that a value is present and the value is
|
||||
held within the `Some`. When we have a `None` value, in some sense, it means
|
||||
the same thing as null: we don’t have a valid value. So why is having
|
||||
`Option<T>` any better than having null?
|
||||
|
||||
In short, because `Option<T>` and `T` (where `T` can be any type) are different
|
||||
types, the compiler won’t let us use an `Option<T>` value as if it were
|
||||
definitely a valid value. For example, this code won’t compile because it’s
|
||||
trying to add an `i8` to an `Option<i8>`:
|
||||
|
||||
```rust,ignore
|
||||
let x: i8 = 5;
|
||||
let y: Option<i8> = Some(5);
|
||||
|
||||
let sum = x + y;
|
||||
```
|
||||
|
||||
If we run this code, we get an error message like this:
|
||||
|
||||
```text
|
||||
error[E0277]: the trait bound `i8: std::ops::Add<std::option::Option<i8>>` is
|
||||
not satisfied
|
||||
-->
|
||||
|
|
||||
5 | let sum = x + y;
|
||||
| ^ no implementation for `i8 + std::option::Option<i8>`
|
||||
|
|
||||
```
|
||||
|
||||
Intense! In effect, this error message means that Rust doesn’t understand how
|
||||
to add an `i8` and an `Option<i8>`, because they’re different types. When we
|
||||
have a value of a type like `i8` in Rust, the compiler will ensure that we
|
||||
always have a valid value. We can proceed confidently without having to check
|
||||
for null before using that value. Only when we have an `Option<i8>` (or
|
||||
whatever type of value we’re working with) do we have to worry about possibly
|
||||
not having a value, and the compiler will make sure we handle that case before
|
||||
using the value.
|
||||
|
||||
In other words, you have to convert an `Option<T>` to a `T` before you can
|
||||
perform `T` operations with it. Generally, this helps catch one of the most
|
||||
common issues with null: assuming that something isn’t null when it actually
|
||||
is.
|
||||
|
||||
Not having to worry about incorrectly assuming a not-null value helps you to be
|
||||
more confident in your code. In order to have a value that can possibly be
|
||||
null, you must explicitly opt in by making the type of that value `Option<T>`.
|
||||
Then, when you use that value, you are required to explicitly handle the case
|
||||
when the value is null. Everywhere that a value has a type that isn’t an
|
||||
`Option<T>`, you *can* safely assume that the value isn’t null. This was a
|
||||
deliberate design decision for Rust to limit null’s pervasiveness and increase
|
||||
the safety of Rust code.
|
||||
|
||||
So, how do you get the `T` value out of a `Some` variant when you have a value
|
||||
of type `Option<T>` so you can use that value? The `Option<T>` enum has a large
|
||||
number of methods that are useful in a variety of situations; you can check
|
||||
them out in [its documentation][docs]<!-- ignore -->. Becoming familiar with
|
||||
the methods on `Option<T>` will be extremely useful in your journey with Rust.
|
||||
|
||||
[docs]: ../../std/option/enum.Option.html
|
||||
|
||||
In general, in order to use an `Option<T>` value, you want to have code that
|
||||
will handle each variant. You want some code that will run only when you have a
|
||||
`Some(T)` value, and this code is allowed to use the inner `T`. You want some
|
||||
other code to run if you have a `None` value, and that code doesn’t have a `T`
|
||||
value available. The `match` expression is a control flow construct that does
|
||||
just this when used with enums: it will run different code depending on which
|
||||
variant of the enum it has, and that code can use the data inside the matching
|
||||
value.
|
||||
295
2018-edition/src/ch06-02-match.md
Normal file
295
2018-edition/src/ch06-02-match.md
Normal file
@@ -0,0 +1,295 @@
|
||||
## The `match` Control Flow Operator
|
||||
|
||||
Rust has an extremely powerful control flow operator called `match` that allows
|
||||
you to compare a value against a series of patterns and then execute code based
|
||||
on which pattern matches. Patterns can be made up of literal values, variable
|
||||
names, wildcards, and many other things; Chapter 18 covers all the different
|
||||
kinds of patterns and what they do. The power of `match` comes from the
|
||||
expressiveness of the patterns and the fact that the compiler confirms that all
|
||||
possible cases are handled.
|
||||
|
||||
Think of a `match` expression as being like a coin-sorting machine: coins slide
|
||||
down a track with variously sized holes along it, and each coin falls through
|
||||
the first hole it encounters that it fits into. In the same way, values go
|
||||
through each pattern in a `match`, and at the first pattern the value “fits,”
|
||||
the value falls into the associated code block to be used during execution.
|
||||
|
||||
Because we just mentioned coins, let’s use them as an example using `match`! We
|
||||
can write a function that can take an unknown United States coin and, in a
|
||||
similar way as the counting machine, determine which coin it is and return its
|
||||
value in cents, as shown here in Listing 6-3:
|
||||
|
||||
```rust
|
||||
enum Coin {
|
||||
Penny,
|
||||
Nickel,
|
||||
Dime,
|
||||
Quarter,
|
||||
}
|
||||
|
||||
fn value_in_cents(coin: Coin) -> u32 {
|
||||
match coin {
|
||||
Coin::Penny => 1,
|
||||
Coin::Nickel => 5,
|
||||
Coin::Dime => 10,
|
||||
Coin::Quarter => 25,
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 6-3: An enum and a `match` expression that has
|
||||
the variants of the enum as its patterns</span>
|
||||
|
||||
Let’s break down the `match` in the `value_in_cents` function. First, we list
|
||||
the `match` keyword followed by an expression, which in this case is the value
|
||||
`coin`. This seems very similar to an expression used with `if`, but there’s a
|
||||
big difference: with `if`, the expression needs to return a Boolean value, but
|
||||
here, it can be any type. The type of `coin` in this example is the `Coin` enum
|
||||
that we defined on line 1.
|
||||
|
||||
Next are the `match` arms. An arm has two parts: a pattern and some code. The
|
||||
first arm here has a pattern that is the value `Coin::Penny` and then the `=>`
|
||||
operator that separates the pattern and the code to run. The code in this case
|
||||
is just the value `1`. Each arm is separated from the next with a comma.
|
||||
|
||||
When the `match` expression executes, it compares the resulting value against
|
||||
the pattern of each arm, in order. If a pattern matches the value, the code
|
||||
associated with that pattern is executed. If that pattern doesn’t match the
|
||||
value, execution continues to the next arm, much as in a coin-sorting machine.
|
||||
We can have as many arms as we need: in Listing 6-3, our `match` has four arms.
|
||||
|
||||
The code associated with each arm is an expression, and the resulting value of
|
||||
the expression in the matching arm is the value that gets returned for the
|
||||
entire `match` expression.
|
||||
|
||||
Curly brackets typically aren’t used if the match arm code is short, as it is
|
||||
in Listing 6-3 where each arm just returns a value. If you want to run multiple
|
||||
lines of code in a match arm, you can use curly brackets. For example, the
|
||||
following code would print “Lucky penny!” every time the method was called with
|
||||
a `Coin::Penny` but would still return the last value of the block, `1`:
|
||||
|
||||
```rust
|
||||
# enum Coin {
|
||||
# Penny,
|
||||
# Nickel,
|
||||
# Dime,
|
||||
# Quarter,
|
||||
# }
|
||||
#
|
||||
fn value_in_cents(coin: Coin) -> u32 {
|
||||
match coin {
|
||||
Coin::Penny => {
|
||||
println!("Lucky penny!");
|
||||
1
|
||||
},
|
||||
Coin::Nickel => 5,
|
||||
Coin::Dime => 10,
|
||||
Coin::Quarter => 25,
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
### Patterns that Bind to Values
|
||||
|
||||
Another useful feature of match arms is that they can bind to the parts of the
|
||||
values that match the pattern. This is how we can extract values out of enum
|
||||
variants.
|
||||
|
||||
As an example, let’s change one of our enum variants to hold data inside it.
|
||||
From 1999 through 2008, the United States minted quarters with different
|
||||
designs for each of the 50 states on one side. No other coins got state
|
||||
designs, so only quarters have this extra value. We can add this information to
|
||||
our `enum` by changing the `Quarter` variant to include a `UsState` value stored
|
||||
inside it, which we’ve done here in Listing 6-4:
|
||||
|
||||
```rust
|
||||
#[derive(Debug)] // So we can inspect the state in a minute
|
||||
enum UsState {
|
||||
Alabama,
|
||||
Alaska,
|
||||
// --snip--
|
||||
}
|
||||
|
||||
enum Coin {
|
||||
Penny,
|
||||
Nickel,
|
||||
Dime,
|
||||
Quarter(UsState),
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 6-4: A `Coin` enum in which the `Quarter` variant
|
||||
also holds a `UsState` value</span>
|
||||
|
||||
Let’s imagine that a friend of ours is trying to collect all 50 state quarters.
|
||||
While we sort our loose change by coin type, we’ll also call out the name of
|
||||
the state associated with each quarter so if it’s one our friend doesn’t have,
|
||||
they can add it to their collection.
|
||||
|
||||
In the match expression for this code, we add a variable called `state` to the
|
||||
pattern that matches values of the variant `Coin::Quarter`. When a
|
||||
`Coin::Quarter` matches, the `state` variable will bind to the value of that
|
||||
quarter’s state. Then we can use `state` in the code for that arm, like so:
|
||||
|
||||
```rust
|
||||
# #[derive(Debug)]
|
||||
# enum UsState {
|
||||
# Alabama,
|
||||
# Alaska,
|
||||
# }
|
||||
#
|
||||
# enum Coin {
|
||||
# Penny,
|
||||
# Nickel,
|
||||
# Dime,
|
||||
# Quarter(UsState),
|
||||
# }
|
||||
#
|
||||
fn value_in_cents(coin: Coin) -> u32 {
|
||||
match coin {
|
||||
Coin::Penny => 1,
|
||||
Coin::Nickel => 5,
|
||||
Coin::Dime => 10,
|
||||
Coin::Quarter(state) => {
|
||||
println!("State quarter from {:?}!", state);
|
||||
25
|
||||
},
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
If we were to call `value_in_cents(Coin::Quarter(UsState::Alaska))`, `coin`
|
||||
would be `Coin::Quarter(UsState::Alaska)`. When we compare that value with each
|
||||
of the match arms, none of them match until we reach `Coin::Quarter(state)`. At
|
||||
that point, the binding for `state` will be the value `UsState::Alaska`. We can
|
||||
then use that binding in the `println!` expression, thus getting the inner
|
||||
state value out of the `Coin` enum variant for `Quarter`.
|
||||
|
||||
### Matching with `Option<T>`
|
||||
|
||||
In the previous section, we wanted to get the inner `T` value out of the `Some`
|
||||
case when using `Option<T>`; we can also handle `Option<T>` using `match` as we
|
||||
did with the `Coin` enum! Instead of comparing coins, we’ll compare the
|
||||
variants of `Option<T>`, but the way that the `match` expression works remains
|
||||
the same.
|
||||
|
||||
Let’s say we want to write a function that takes an `Option<i32>` and, if
|
||||
there’s a value inside, adds 1 to that value. If there isn’t a value inside,
|
||||
the function should return the `None` value and not attempt to perform any
|
||||
operations.
|
||||
|
||||
This function is very easy to write, thanks to `match`, and will look like
|
||||
Listing 6-5:
|
||||
|
||||
```rust
|
||||
fn plus_one(x: Option<i32>) -> Option<i32> {
|
||||
match x {
|
||||
None => None,
|
||||
Some(i) => Some(i + 1),
|
||||
}
|
||||
}
|
||||
|
||||
let five = Some(5);
|
||||
let six = plus_one(five);
|
||||
let none = plus_one(None);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 6-5: A function that uses a `match` expression on
|
||||
an `Option<i32>`</span>
|
||||
|
||||
Let’s examine the first execution of `plus_one` in more detail. When we call
|
||||
`plus_one(five)`, the variable `x` in the body of `plus_one` will have the
|
||||
value `Some(5)`. We then compare that against each match arm.
|
||||
|
||||
```rust,ignore
|
||||
None => None,
|
||||
```
|
||||
|
||||
The `Some(5)` value doesn’t match the pattern `None`, so we continue to the
|
||||
next arm.
|
||||
|
||||
```rust,ignore
|
||||
Some(i) => Some(i + 1),
|
||||
```
|
||||
|
||||
Does `Some(5)` match `Some(i)`? Why yes it does! We have the same variant. The
|
||||
`i` binds to the value contained in `Some`, so `i` takes the value `5`. The
|
||||
code in the match arm is then executed, so we add 1 to the value of `i` and
|
||||
create a new `Some` value with our total `6` inside.
|
||||
|
||||
Now let’s consider the second call of `plus_one` in Listing 6-5, where `x` is
|
||||
`None`. We enter the `match` and compare to the first arm.
|
||||
|
||||
```rust,ignore
|
||||
None => None,
|
||||
```
|
||||
|
||||
It matches! There’s no value to add to, so the program stops and returns the
|
||||
`None` value on the right side of `=>`. Because the first arm matched, no other
|
||||
arms are compared.
|
||||
|
||||
Combining `match` and enums is useful in many situations. You’ll see this
|
||||
pattern a lot in Rust code: `match` against an enum, bind a variable to the
|
||||
data inside, and then execute code based on it. It’s a bit tricky at first, but
|
||||
once you get used to it, you’ll wish you had it in all languages. It’s
|
||||
consistently a user favorite.
|
||||
|
||||
### Matches Are Exhaustive
|
||||
|
||||
There’s one other aspect of `match` we need to discuss. Consider this version
|
||||
of our `plus_one` function that has a bug and won’t compile:
|
||||
|
||||
```rust,ignore
|
||||
fn plus_one(x: Option<i32>) -> Option<i32> {
|
||||
match x {
|
||||
Some(i) => Some(i + 1),
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
We didn’t handle the `None` case, so this code will cause a bug. Luckily, it’s
|
||||
a bug Rust knows how to catch. If we try to compile this code, we’ll get this
|
||||
error:
|
||||
|
||||
```text
|
||||
error[E0004]: non-exhaustive patterns: `None` not covered
|
||||
-->
|
||||
|
|
||||
6 | match x {
|
||||
| ^ pattern `None` not covered
|
||||
```
|
||||
|
||||
Rust knows that we didn’t cover every possible case and even knows which
|
||||
pattern we forgot! Matches in Rust are *exhaustive*: we must exhaust every last
|
||||
possibility in order for the code to be valid. Especially in the case of
|
||||
`Option<T>`, when Rust prevents us from forgetting to explicitly handle the
|
||||
`None` case, it protects us from assuming that we have a value when we might
|
||||
have null, thus making the billion-dollar mistake discussed earlier.
|
||||
|
||||
### The `_` Placeholder
|
||||
|
||||
Rust also has a pattern we can use when we don’t want to list all possible
|
||||
values. For example, a `u8` can have valid values of 0 through 255. If we only
|
||||
care about the values 1, 3, 5, and 7, we don’t want to have to list out 0, 2,
|
||||
4, 6, 8, 9 all the way up to 255. Fortunately, we don’t have to: we can use the
|
||||
special pattern `_` instead:
|
||||
|
||||
```rust
|
||||
let some_u8_value = 0u8;
|
||||
match some_u8_value {
|
||||
1 => println!("one"),
|
||||
3 => println!("three"),
|
||||
5 => println!("five"),
|
||||
7 => println!("seven"),
|
||||
_ => (),
|
||||
}
|
||||
```
|
||||
|
||||
The `_` pattern will match any value. By putting it after our other arms, the
|
||||
`_` will match all the possible cases that aren’t specified before it. The `()`
|
||||
is just the unit value, so nothing will happen in the `_` case. As a result, we
|
||||
can say that we want to do nothing for all the possible values that we don’t
|
||||
list before the `_` placeholder.
|
||||
|
||||
However, the `match` expression can be a bit wordy in a situation in which we
|
||||
only care about *one* of the cases. For this situation, Rust provides `if let`.
|
||||
118
2018-edition/src/ch06-03-if-let.md
Normal file
118
2018-edition/src/ch06-03-if-let.md
Normal file
@@ -0,0 +1,118 @@
|
||||
## Concise Control Flow with `if let`
|
||||
|
||||
The `if let` syntax lets you combine `if` and `let` into a less verbose way to
|
||||
handle values that match one pattern while ignoring the rest. Consider the
|
||||
program in Listing 6-6 that matches on an `Option<u8>` value but only wants to
|
||||
execute code if the value is 3:
|
||||
|
||||
```rust
|
||||
let some_u8_value = Some(0u8);
|
||||
match some_u8_value {
|
||||
Some(3) => println!("three"),
|
||||
_ => (),
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 6-6: A `match` that only cares about executing
|
||||
code when the value is `Some(3)`</span>
|
||||
|
||||
We want to do something with the `Some(3)` match but do nothing with any other
|
||||
`Some<u8>` value or the `None` value. To satisfy the `match` expression, we
|
||||
have to add `_ => ()` after processing just one variant, which is a lot of
|
||||
boilerplate code to add.
|
||||
|
||||
Instead, we could write this in a shorter way using `if let`. The following
|
||||
code behaves the same as the `match` in Listing 6-6:
|
||||
|
||||
```rust
|
||||
# let some_u8_value = Some(0u8);
|
||||
if let Some(3) = some_u8_value {
|
||||
println!("three");
|
||||
}
|
||||
```
|
||||
|
||||
The syntax `if let` takes a pattern and an expression separated by an `=`. It
|
||||
works the same way as a `match`, where the expression is given to the `match`
|
||||
and the pattern is its first arm.
|
||||
|
||||
Using `if let` means you have less typing, less indentation, and less
|
||||
boilerplate code. However, you lose the exhaustive checking that `match`
|
||||
enforces. Choosing between `match` and `if let` depends on what you’re doing in
|
||||
your particular situation and whether gaining conciseness is an appropriate
|
||||
trade-off for losing exhaustive checking.
|
||||
|
||||
In other words, you can think of `if let` as syntax sugar for a `match` that
|
||||
runs code when the value matches one pattern and then ignores all other values.
|
||||
|
||||
We can include an `else` with an `if let`. The block of code that goes with the
|
||||
`else` is the same as the block of code that would go with the `_` case in the
|
||||
`match` expression that is equivalent to the `if let` and `else`. Recall the
|
||||
`Coin` enum definition in Listing 6-4, where the `Quarter` variant also held a
|
||||
`UsState` value. If we wanted to count all non-quarter coins we see while also
|
||||
announcing the state of the quarters, we could do that with a `match`
|
||||
expression like this:
|
||||
|
||||
```rust
|
||||
# #[derive(Debug)]
|
||||
# enum UsState {
|
||||
# Alabama,
|
||||
# Alaska,
|
||||
# }
|
||||
#
|
||||
# enum Coin {
|
||||
# Penny,
|
||||
# Nickel,
|
||||
# Dime,
|
||||
# Quarter(UsState),
|
||||
# }
|
||||
# let coin = Coin::Penny;
|
||||
let mut count = 0;
|
||||
match coin {
|
||||
Coin::Quarter(state) => println!("State quarter from {:?}!", state),
|
||||
_ => count += 1,
|
||||
}
|
||||
```
|
||||
|
||||
Or we could use an `if let` and `else` expression like this:
|
||||
|
||||
```rust
|
||||
# #[derive(Debug)]
|
||||
# enum UsState {
|
||||
# Alabama,
|
||||
# Alaska,
|
||||
# }
|
||||
#
|
||||
# enum Coin {
|
||||
# Penny,
|
||||
# Nickel,
|
||||
# Dime,
|
||||
# Quarter(UsState),
|
||||
# }
|
||||
# let coin = Coin::Penny;
|
||||
let mut count = 0;
|
||||
if let Coin::Quarter(state) = coin {
|
||||
println!("State quarter from {:?}!", state);
|
||||
} else {
|
||||
count += 1;
|
||||
}
|
||||
```
|
||||
|
||||
If you have a situation in which your program has logic that is too verbose to
|
||||
express using a `match`, remember that `if let` is in your Rust toolbox as well.
|
||||
|
||||
## Summary
|
||||
|
||||
We’ve now covered how to use enums to create custom types that can be one of a
|
||||
set of enumerated values. We’ve shown how the standard library’s `Option<T>`
|
||||
type helps you use the type system to prevent errors. When enum values have
|
||||
data inside them, you can use `match` or `if let` to extract and use those
|
||||
values, depending on how many cases you need to handle.
|
||||
|
||||
Your Rust programs can now express concepts in your domain using structs and
|
||||
enums. Creating custom types to use in your API ensures type safety: the
|
||||
compiler will make certain your functions get only values of the type each
|
||||
function expects.
|
||||
|
||||
In order to provide a well-organized API to your users that is straightforward
|
||||
to use and only exposes exactly what your users will need, let’s now turn to
|
||||
Rust’s modules.
|
||||
24
2018-edition/src/ch07-00-modules.md
Normal file
24
2018-edition/src/ch07-00-modules.md
Normal file
@@ -0,0 +1,24 @@
|
||||
# Using Modules to Reuse and Organize Code
|
||||
|
||||
When you start writing programs in Rust, your code might live solely in the
|
||||
`main` function. As your code grows, you’ll eventually move functionality into
|
||||
other functions for reuse and better organization. By splitting your code into
|
||||
smaller chunks, you make each chunk easier to understand on its own. But what
|
||||
happens if you have too many functions? Rust has a module system that enables
|
||||
the reuse of code in an organized fashion.
|
||||
|
||||
In the same way that you extract lines of code into a function, you can extract
|
||||
functions (and other code, like structs and enums) into different modules. A
|
||||
*module* is a namespace that contains definitions of functions or types, and
|
||||
you can choose whether those definitions are visible outside their module
|
||||
(public) or not (private). Here’s an overview of how modules work:
|
||||
|
||||
* The `mod` keyword declares a new module. Code within the module appears
|
||||
either immediately following this declaration within curly brackets or in
|
||||
another file.
|
||||
* By default, functions, types, constants, and modules are private. The `pub`
|
||||
keyword makes an item public and therefore visible outside its namespace.
|
||||
* The `use` keyword brings modules, or the definitions inside modules, into
|
||||
scope so it’s easier to refer to them.
|
||||
|
||||
We’ll look at each of these parts to see how they fit into the whole.
|
||||
481
2018-edition/src/ch07-01-mod-and-the-filesystem.md
Normal file
481
2018-edition/src/ch07-01-mod-and-the-filesystem.md
Normal file
@@ -0,0 +1,481 @@
|
||||
## `mod` and the Filesystem
|
||||
|
||||
We’ll start our module example by making a new project with Cargo, but instead
|
||||
of creating a binary crate, we’ll make a library crate: a project that other
|
||||
people can pull into their projects as a dependency. For example, the `rand`
|
||||
crate discussed in Chapter 2 is a library crate that we used as a dependency in
|
||||
the guessing game project.
|
||||
|
||||
We’ll create a skeleton of a library that provides some general networking
|
||||
functionality; we’ll concentrate on the organization of the modules and
|
||||
functions, but we won’t worry about what code goes in the function bodies.
|
||||
We’ll call our library `communicator`. To create a library, pass the `--lib`
|
||||
option instead of `--bin`:
|
||||
|
||||
```text
|
||||
$ cargo new communicator --lib
|
||||
$ cd communicator
|
||||
```
|
||||
|
||||
Notice that Cargo generated *src/lib.rs* instead of *src/main.rs*. Inside
|
||||
*src/lib.rs* we’ll find the following:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
#[test]
|
||||
fn it_works() {
|
||||
assert_eq!(2 + 2, 4);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Cargo creates an example test to help us get our library started, rather than
|
||||
the “Hello, world!” binary that we get when we use the `--bin` option. We’ll
|
||||
look at the `#[]` and `mod tests` syntax in the “Using `super` to Access a
|
||||
Parent Module” section later in this chapter, but for now, leave this code at
|
||||
the bottom of *src/lib.rs*.
|
||||
|
||||
Because we don’t have a *src/main.rs* file, there’s nothing for Cargo to
|
||||
execute with the `cargo run` command. Therefore, we’ll use the `cargo build`
|
||||
command to compile our library crate’s code.
|
||||
|
||||
We’ll look at different options for organizing your library’s code that will be
|
||||
suitable in a variety of situations, depending on the intent of the code.
|
||||
|
||||
### Module Definitions
|
||||
|
||||
For our `communicator` networking library, we’ll first define a module named
|
||||
`network` that contains the definition of a function called `connect`. Every
|
||||
module definition in Rust starts with the `mod` keyword. Add this code to the
|
||||
beginning of the *src/lib.rs* file, above the test code:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
mod network {
|
||||
fn connect() {
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
After the `mod` keyword, we put the name of the module, `network`, and then a
|
||||
block of code in curly brackets. Everything inside this block is inside the
|
||||
namespace `network`. In this case, we have a single function, `connect`. If we
|
||||
wanted to call this function from code outside the `network` module, we
|
||||
would need to specify the module and use the namespace syntax `::` like so:
|
||||
`network::connect()`.
|
||||
|
||||
We can also have multiple modules, side by side, in the same *src/lib.rs* file.
|
||||
For example, to also have a `client` module that has a function named
|
||||
`connect`, we can add it as shown in Listing 7-1:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
mod network {
|
||||
fn connect() {
|
||||
}
|
||||
}
|
||||
|
||||
mod client {
|
||||
fn connect() {
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 7-1: The `network` module and the `client` module
|
||||
defined side by side in *src/lib.rs*</span>
|
||||
|
||||
Now we have a `network::connect` function and a `client::connect` function.
|
||||
These can have completely different functionality, and the function names do
|
||||
not conflict with each other because they’re in different modules.
|
||||
|
||||
In this case, because we’re building a library, the file that serves as the
|
||||
entry point for building our library is *src/lib.rs*. However, in respect to
|
||||
creating modules, there’s nothing special about *src/lib.rs*. We could also
|
||||
create modules in *src/main.rs* for a binary crate in the same way as we’re
|
||||
creating modules in *src/lib.rs* for the library crate. In fact, we can put
|
||||
modules inside of modules, which can be useful as your modules grow to keep
|
||||
related functionality organized together and separate functionality apart. The
|
||||
way you choose to organize your code depends on how you think about the
|
||||
relationship between the parts of your code. For instance, the `client` code
|
||||
and its `connect` function might make more sense to users of our library if
|
||||
they were inside the `network` namespace instead, as in Listing 7-2:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
mod network {
|
||||
fn connect() {
|
||||
}
|
||||
|
||||
mod client {
|
||||
fn connect() {
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 7-2: Moving the `client` module inside the
|
||||
`network` module</span>
|
||||
|
||||
In your *src/lib.rs* file, replace the existing `mod network` and `mod client`
|
||||
definitions with the ones in Listing 7-2, which have the `client` module as an
|
||||
inner module of `network`. The functions `network::connect` and
|
||||
`network::client::connect` are both named `connect`, but they don’t conflict
|
||||
with each other because they’re in different namespaces.
|
||||
|
||||
In this way, modules form a hierarchy. The contents of *src/lib.rs* are at the
|
||||
topmost level, and the submodules are at lower levels. Here’s what the
|
||||
organization of our example in Listing 7-1 looks like when thought of as a
|
||||
hierarchy:
|
||||
|
||||
```text
|
||||
communicator
|
||||
├── network
|
||||
└── client
|
||||
```
|
||||
|
||||
And here’s the hierarchy corresponding to the example in Listing 7-2:
|
||||
|
||||
```text
|
||||
communicator
|
||||
└── network
|
||||
└── client
|
||||
```
|
||||
|
||||
The hierarchy shows that in Listing 7-2, `client` is a child of the `network`
|
||||
module rather than a sibling. More complicated projects can have many modules,
|
||||
and they’ll need to be organized logically in order for you to keep track of
|
||||
them. What “logically” means in your project is up to you and depends on how
|
||||
you and your library’s users think about your project’s domain. Use the
|
||||
techniques shown here to create side-by-side modules and nested modules in
|
||||
whatever structure you would like.
|
||||
|
||||
### Moving Modules to Other Files
|
||||
|
||||
Modules form a hierarchical structure, much like another structure in computing
|
||||
that you’re used to: filesystems! We can use Rust’s module system along with
|
||||
multiple files to split up Rust projects so not everything lives in
|
||||
*src/lib.rs* or *src/main.rs*. For this example, let’s start with the code in
|
||||
Listing 7-3:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
mod client {
|
||||
fn connect() {
|
||||
}
|
||||
}
|
||||
|
||||
mod network {
|
||||
fn connect() {
|
||||
}
|
||||
|
||||
mod server {
|
||||
fn connect() {
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 7-3: Three modules, `client`, `network`, and
|
||||
`network::server`, all defined in *src/lib.rs*</span>
|
||||
|
||||
The file *src/lib.rs* has this module hierarchy:
|
||||
|
||||
```text
|
||||
communicator
|
||||
├── client
|
||||
└── network
|
||||
└── server
|
||||
```
|
||||
|
||||
If these modules had many functions, and those functions were becoming lengthy,
|
||||
it would be difficult to scroll through this file to find the code we wanted to
|
||||
work with. Because the functions are nested inside one or more `mod` blocks,
|
||||
the lines of code inside the functions will start getting lengthy as well.
|
||||
These would be good reasons to separate the `client`, `network`, and `server`
|
||||
modules from *src/lib.rs* and place them into their own files.
|
||||
|
||||
First, let’s replace the `client` module code with only the declaration of the
|
||||
`client` module so that *src/lib.rs* looks like code shown in Listing 7-4:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
mod client;
|
||||
|
||||
mod network {
|
||||
fn connect() {
|
||||
}
|
||||
|
||||
mod server {
|
||||
fn connect() {
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 7-4: Extracting the contents of the `client` module but leaving the declaration in *src/lib.rs*</span>
|
||||
|
||||
We’re still *declaring* the `client` module here, but by replacing the block
|
||||
with a semicolon, we’re telling Rust to look in another location for the code
|
||||
defined within the scope of the `client` module. In other words, the line `mod
|
||||
client;` means this:
|
||||
|
||||
```rust,ignore
|
||||
mod client {
|
||||
// contents of client.rs
|
||||
}
|
||||
```
|
||||
|
||||
Now we need to create the external file with that module name. Create a
|
||||
*client.rs* file in your *src/* directory and open it. Then enter the
|
||||
following, which is the `connect` function in the `client` module that we
|
||||
removed in the previous step:
|
||||
|
||||
<span class="filename">Filename: src/client.rs</span>
|
||||
|
||||
```rust
|
||||
fn connect() {
|
||||
}
|
||||
```
|
||||
|
||||
Note that we don’t need a `mod` declaration in this file because we already
|
||||
declared the `client` module with `mod` in *src/lib.rs*. This file just
|
||||
provides the *contents* of the `client` module. If we put a `mod client` here,
|
||||
we’d be giving the `client` module its own submodule named `client`!
|
||||
|
||||
Rust only knows to look in *src/lib.rs* by default. If we want to add more
|
||||
files to our project, we need to tell Rust in *src/lib.rs* to look in other
|
||||
files; this is why `mod client` needs to be defined in *src/lib.rs* and can’t
|
||||
be defined in *src/client.rs*.
|
||||
|
||||
Now the project should compile successfully, although you’ll get a few
|
||||
warnings. Remember to use `cargo build` instead of `cargo run` because we have
|
||||
a library crate rather than a binary crate:
|
||||
|
||||
```text
|
||||
$ cargo build
|
||||
Compiling communicator v0.1.0 (file:///projects/communicator)
|
||||
warning: function is never used: `connect`
|
||||
--> src/client.rs:1:1
|
||||
|
|
||||
1 | / fn connect() {
|
||||
2 | | }
|
||||
| |_^
|
||||
|
|
||||
= note: #[warn(dead_code)] on by default
|
||||
|
||||
warning: function is never used: `connect`
|
||||
--> src/lib.rs:4:5
|
||||
|
|
||||
4 | / fn connect() {
|
||||
5 | | }
|
||||
| |_____^
|
||||
|
||||
warning: function is never used: `connect`
|
||||
--> src/lib.rs:8:9
|
||||
|
|
||||
8 | / fn connect() {
|
||||
9 | | }
|
||||
| |_________^
|
||||
```
|
||||
|
||||
These warnings tell us that we have functions that are never used. Don’t worry
|
||||
about these warnings for now; we’ll address them later in this chapter in the
|
||||
“Controlling Visibility with `pub`” section. The good news is that they’re just
|
||||
warnings; our project built successfully!
|
||||
|
||||
Next, let’s extract the `network` module into its own file using the same
|
||||
pattern. In *src/lib.rs*, delete the body of the `network` module and add a
|
||||
semicolon to the declaration, like so:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
mod client;
|
||||
|
||||
mod network;
|
||||
```
|
||||
|
||||
Then create a new *src/network.rs* file and enter the following:
|
||||
|
||||
<span class="filename">Filename: src/network.rs</span>
|
||||
|
||||
```rust
|
||||
fn connect() {
|
||||
}
|
||||
|
||||
mod server {
|
||||
fn connect() {
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Notice that we still have a `mod` declaration within this module file; this is
|
||||
because we still want `server` to be a submodule of `network`.
|
||||
|
||||
Run `cargo build` again. Success! We have one more module to extract: `server`.
|
||||
Because it’s a submodule—that is, a module within a module—our current tactic
|
||||
of extracting a module into a file named after that module won’t work. We’ll
|
||||
try anyway so you can see the error. First, change *src/network.rs* to have
|
||||
`mod server;` instead of the `server` module’s contents:
|
||||
|
||||
<span class="filename">Filename: src/network.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn connect() {
|
||||
}
|
||||
|
||||
mod server;
|
||||
```
|
||||
|
||||
Then create a *src/server.rs* file and enter the contents of the `server`
|
||||
module that we extracted:
|
||||
|
||||
<span class="filename">Filename: src/server.rs</span>
|
||||
|
||||
```rust
|
||||
fn connect() {
|
||||
}
|
||||
```
|
||||
|
||||
When we try to `cargo build`, we’ll get the error shown in Listing 7-5:
|
||||
|
||||
```text
|
||||
$ cargo build
|
||||
Compiling communicator v0.1.0 (file:///projects/communicator)
|
||||
error: cannot declare a new module at this location
|
||||
--> src/network.rs:4:5
|
||||
|
|
||||
4 | mod server;
|
||||
| ^^^^^^
|
||||
|
|
||||
note: maybe move this module `src/network.rs` to its own directory via `src/network/mod.rs`
|
||||
--> src/network.rs:4:5
|
||||
|
|
||||
4 | mod server;
|
||||
| ^^^^^^
|
||||
note: ... or maybe `use` the module `server` instead of possibly redeclaring it
|
||||
--> src/network.rs:4:5
|
||||
|
|
||||
4 | mod server;
|
||||
| ^^^^^^
|
||||
```
|
||||
|
||||
<span class="caption">Listing 7-5: Error when trying to extract the `server`
|
||||
submodule into *src/server.rs*</span>
|
||||
|
||||
The error says we `cannot declare a new module at this location` and is
|
||||
pointing to the `mod server;` line in *src/network.rs*. So *src/network.rs* is
|
||||
different than *src/lib.rs* somehow: keep reading to understand why.
|
||||
|
||||
The note in the middle of Listing 7-5 is actually very helpful because it
|
||||
points out something we haven’t yet talked about doing:
|
||||
|
||||
```text
|
||||
note: maybe move this module `network` to its own directory via
|
||||
`network/mod.rs`
|
||||
```
|
||||
|
||||
Instead of continuing to follow the same file-naming pattern we used
|
||||
previously, we can do what the note suggests:
|
||||
|
||||
1. Make a new *directory* named *network*, the parent module’s name.
|
||||
2. Move the *src/network.rs* file into the new *network* directory and
|
||||
rename it *src/network/mod.rs*.
|
||||
3. Move the submodule file *src/server.rs* into the *network* directory.
|
||||
|
||||
Here are commands to carry out these steps:
|
||||
|
||||
```text
|
||||
$ mkdir src/network
|
||||
$ mv src/network.rs src/network/mod.rs
|
||||
$ mv src/server.rs src/network
|
||||
```
|
||||
|
||||
Now when we try to run `cargo build`, compilation will work (we’ll still have
|
||||
warnings though). Our module layout still looks exactly the same as it did when
|
||||
we had all the code in *src/lib.rs* in Listing 7-3:
|
||||
|
||||
```text
|
||||
communicator
|
||||
├── client
|
||||
└── network
|
||||
└── server
|
||||
```
|
||||
|
||||
The corresponding file layout now looks like this:
|
||||
|
||||
```text
|
||||
└── src
|
||||
├── client.rs
|
||||
├── lib.rs
|
||||
└── network
|
||||
├── mod.rs
|
||||
└── server.rs
|
||||
```
|
||||
|
||||
So when we wanted to extract the `network::server` module, why did we have to
|
||||
also change the *src/network.rs* file to the *src/network/mod.rs* file and put
|
||||
the code for `network::server` in the *network* directory in
|
||||
*src/network/server.rs*? Why couldn’t we just extract the `network::server`
|
||||
module into *src/server.rs*? The reason is that Rust wouldn’t be able to
|
||||
recognize that `server` was supposed to be a submodule of `network` if the
|
||||
*server.rs* file was in the *src* directory. To clarify Rust’s behavior here,
|
||||
let’s consider a different example with the following module hierarchy, where
|
||||
all the definitions are in *src/lib.rs*:
|
||||
|
||||
```text
|
||||
communicator
|
||||
├── client
|
||||
└── network
|
||||
└── client
|
||||
```
|
||||
|
||||
In this example, we have three modules again: `client`, `network`, and
|
||||
`network::client`. Following the same steps we did earlier for extracting
|
||||
modules into files, we would create *src/client.rs* for the `client` module.
|
||||
For the `network` module, we would create *src/network.rs*. But we wouldn’t be
|
||||
able to extract the `network::client` module into a *src/client.rs* file
|
||||
because that already exists for the top-level `client` module! If we could put
|
||||
the code for *both* the `client` and `network::client` modules in the
|
||||
*src/client.rs* file, Rust wouldn’t have any way to know whether the code was
|
||||
for `client` or for `network::client`.
|
||||
|
||||
Therefore, in order to extract a file for the `network::client` submodule of
|
||||
the `network` module, we needed to create a directory for the `network` module
|
||||
instead of a *src/network.rs* file. The code that is in the `network` module
|
||||
then goes into the *src/network/mod.rs* file, and the submodule
|
||||
`network::client` can have its own *src/network/client.rs* file. Now the
|
||||
top-level *src/client.rs* is unambiguously the code that belongs to the
|
||||
`client` module.
|
||||
|
||||
### Rules of Module Filesystems
|
||||
|
||||
Let’s summarize the rules of modules with regard to files:
|
||||
|
||||
* If a module named `foo` has no submodules, you should put the declarations
|
||||
for `foo` in a file named *foo.rs*.
|
||||
* If a module named `foo` does have submodules, you should put the declarations
|
||||
for `foo` in a file named *foo/mod.rs*.
|
||||
|
||||
These rules apply recursively, so if a module named `foo` has a submodule named
|
||||
`bar` and `bar` does not have submodules, you should have the following files
|
||||
in your *src* directory:
|
||||
|
||||
```text
|
||||
└── foo
|
||||
├── bar.rs (contains the declarations in `foo::bar`)
|
||||
└── mod.rs (contains the declarations in `foo`, including `mod bar`)
|
||||
```
|
||||
|
||||
The modules should be declared in their parent module’s file using the `mod`
|
||||
keyword.
|
||||
|
||||
Next, we’ll talk about the `pub` keyword and get rid of those warnings!
|
||||
288
2018-edition/src/ch07-02-controlling-visibility-with-pub.md
Normal file
288
2018-edition/src/ch07-02-controlling-visibility-with-pub.md
Normal file
@@ -0,0 +1,288 @@
|
||||
## Controlling Visibility with `pub`
|
||||
|
||||
We resolved the error messages shown in Listing 7-5 by moving the `network` and
|
||||
`network::server` code into the *src/network/mod.rs* and
|
||||
*src/network/server.rs* files, respectively. At that point, `cargo build` was
|
||||
able to build our project, but we still get warning messages about the
|
||||
`client::connect`, `network::connect`, and `network::server::connect` functions
|
||||
not being used.
|
||||
|
||||
So why are we receiving these warnings? After all, we’re building a library
|
||||
with functions that are intended to be used by our *users*, not necessarily by
|
||||
us within our own project, so it shouldn’t matter that these `connect`
|
||||
functions go unused. The point of creating them is that they will be used by
|
||||
another project, not our own.
|
||||
|
||||
To understand why this program invokes these warnings, let’s try using the
|
||||
`connect` library from another project, calling it externally. To do that,
|
||||
we’ll create a binary crate in the same directory as our library crate by
|
||||
making a *src/main.rs* file containing this code:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate communicator;
|
||||
|
||||
fn main() {
|
||||
communicator::client::connect();
|
||||
}
|
||||
```
|
||||
|
||||
We use the `extern crate` command to bring the `communicator` library crate
|
||||
into scope. Our package now contains *two* crates. Cargo treats *src/main.rs*
|
||||
as the root file of a binary crate, which is separate from the existing library
|
||||
crate whose root file is *src/lib.rs*. This pattern is quite common for
|
||||
executable projects: most functionality is in a library crate, and the binary
|
||||
crate uses that library crate. As a result, other programs can also use the
|
||||
library crate, and it’s a nice separation of concerns.
|
||||
|
||||
From the point of view of a crate outside the `communicator` library looking
|
||||
in, all the modules we’ve been creating are within a module that has the same
|
||||
name as the crate, `communicator`. We call the top-level module of a crate the
|
||||
*root module*.
|
||||
|
||||
Also note that even if we’re using an external crate within a submodule of our
|
||||
project, the `extern crate` should go in our root module (so in *src/main.rs*
|
||||
or *src/lib.rs*). Then, in our submodules, we can refer to items from external
|
||||
crates as if the items are top-level modules.
|
||||
|
||||
Right now, our binary crate just calls our library’s `connect` function from
|
||||
the `client` module. However, invoking `cargo build` will now give us an error
|
||||
after the warnings:
|
||||
|
||||
```text
|
||||
error[E0603]: module `client` is private
|
||||
--> src/main.rs:4:5
|
||||
|
|
||||
4 | communicator::client::connect();
|
||||
| ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
```
|
||||
|
||||
Ah ha! This error tells us that the `client` module is private, which is the
|
||||
crux of the warnings. It’s also the first time we’ve run into the concepts of
|
||||
*public* and *private* in the context of Rust. The default state of all code in
|
||||
Rust is private: no one else is allowed to use the code. If you don’t use a
|
||||
private function within your program, because your program is the only code
|
||||
allowed to use that function, Rust will warn you that the function has gone
|
||||
unused.
|
||||
|
||||
After you specify that a function such as `client::connect` is public, not only
|
||||
will your call to that function from your binary crate be allowed, but also the
|
||||
warning that the function is unused will go away. Marking a function as public
|
||||
lets Rust know that the function will be used by code outside of your program.
|
||||
Rust considers the theoretical external usage that’s now possible as the
|
||||
function “being used.” Thus, when a function is marked public, Rust will not
|
||||
require that it be used in your program and will stop warning that the function
|
||||
is unused.
|
||||
|
||||
### Making a Function Public
|
||||
|
||||
To tell Rust to make a function public, we add the `pub` keyword to the start
|
||||
of the declaration. We’ll focus on fixing the warning that indicates
|
||||
`client::connect` has gone unused for now, as well as the `` module `client` is
|
||||
private `` error from our binary crate. Modify *src/lib.rs* to make the
|
||||
`client` module public, like so:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub mod client;
|
||||
|
||||
mod network;
|
||||
```
|
||||
|
||||
The `pub` keyword is placed right before `mod`. Let’s try building again:
|
||||
|
||||
```text
|
||||
error[E0603]: function `connect` is private
|
||||
--> src/main.rs:4:5
|
||||
|
|
||||
4 | communicator::client::connect();
|
||||
| ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
```
|
||||
|
||||
Hooray! We have a different error! Yes, different error messages are a cause
|
||||
for celebration. The new error shows `` function `connect` is private ``, so
|
||||
let’s edit *src/client.rs* to make `client::connect` public too:
|
||||
|
||||
<span class="filename">Filename: src/client.rs</span>
|
||||
|
||||
```rust
|
||||
pub fn connect() {
|
||||
}
|
||||
```
|
||||
|
||||
Now run `cargo build` again:
|
||||
|
||||
```text
|
||||
warning: function is never used: `connect`
|
||||
--> src/network/mod.rs:1:1
|
||||
|
|
||||
1 | / fn connect() {
|
||||
2 | | }
|
||||
| |_^
|
||||
|
|
||||
= note: #[warn(dead_code)] on by default
|
||||
|
||||
warning: function is never used: `connect`
|
||||
--> src/network/server.rs:1:1
|
||||
|
|
||||
1 | / fn connect() {
|
||||
2 | | }
|
||||
| |_^
|
||||
```
|
||||
|
||||
The code compiled, and the warning that `client::connect` is not being used is
|
||||
gone!
|
||||
|
||||
Unused code warnings don’t always indicate that an item in your code needs to
|
||||
be made public: if you *didn’t* want these functions to be part of your public
|
||||
API, unused code warnings could be alerting you to code you no longer need that
|
||||
you can safely delete. They could also be alerting you to a bug if you had just
|
||||
accidentally removed all places within your library where this function is
|
||||
called.
|
||||
|
||||
But in this case, we *do* want the other two functions to be part of our
|
||||
crate’s public API, so let’s mark them as `pub` as well to get rid of the
|
||||
remaining warnings. Modify *src/network/mod.rs* to look like the following:
|
||||
|
||||
<span class="filename">Filename: src/network/mod.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub fn connect() {
|
||||
}
|
||||
|
||||
mod server;
|
||||
```
|
||||
|
||||
Then compile the code:
|
||||
|
||||
```text
|
||||
warning: function is never used: `connect`
|
||||
--> src/network/mod.rs:1:1
|
||||
|
|
||||
1 | / pub fn connect() {
|
||||
2 | | }
|
||||
| |_^
|
||||
|
|
||||
= note: #[warn(dead_code)] on by default
|
||||
|
||||
warning: function is never used: `connect`
|
||||
--> src/network/server.rs:1:1
|
||||
|
|
||||
1 | / fn connect() {
|
||||
2 | | }
|
||||
| |_^
|
||||
```
|
||||
|
||||
Hmmm, we’re still getting an unused function warning, even though
|
||||
`network::connect` is set to `pub`. The reason is that the function is public
|
||||
within the module, but the `network` module that the function resides in is not
|
||||
public. We’re working from the interior of the library out this time, whereas
|
||||
with `client::connect` we worked from the outside in. We need to change
|
||||
*src/lib.rs* to make `network` public too, like so:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub mod client;
|
||||
|
||||
pub mod network;
|
||||
```
|
||||
|
||||
Now when we compile, that warning is gone:
|
||||
|
||||
```text
|
||||
warning: function is never used: `connect`
|
||||
--> src/network/server.rs:1:1
|
||||
|
|
||||
1 | / fn connect() {
|
||||
2 | | }
|
||||
| |_^
|
||||
|
|
||||
= note: #[warn(dead_code)] on by default
|
||||
```
|
||||
|
||||
Only one warning is left—try to fix this one on your own!
|
||||
|
||||
### Privacy Rules
|
||||
|
||||
Overall, these are the rules for item visibility:
|
||||
|
||||
- If an item is public, it can be accessed through any of its parent modules.
|
||||
- If an item is private, it can be accessed only by its immediate parent
|
||||
module and any of the parent’s child modules.
|
||||
|
||||
### Privacy Examples
|
||||
|
||||
Let’s look at a few more privacy examples to get some practice. Create a new
|
||||
library project and enter the code in Listing 7-6 into your new project’s
|
||||
*src/lib.rs*:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
mod outermost {
|
||||
pub fn middle_function() {}
|
||||
|
||||
fn middle_secret_function() {}
|
||||
|
||||
mod inside {
|
||||
pub fn inner_function() {}
|
||||
|
||||
fn secret_function() {}
|
||||
}
|
||||
}
|
||||
|
||||
fn try_me() {
|
||||
outermost::middle_function();
|
||||
outermost::middle_secret_function();
|
||||
outermost::inside::inner_function();
|
||||
outermost::inside::secret_function();
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 7-6: Examples of private and public functions,
|
||||
some of which are incorrect</span>
|
||||
|
||||
Before you try to compile this code, make a guess about which lines in the
|
||||
`try_me` function will have errors. Then, try compiling the code to see whether
|
||||
you were right—and read on for the discussion of the errors!
|
||||
|
||||
#### Looking at the Errors
|
||||
|
||||
The `try_me` function is in the root module of our project. The module named
|
||||
`outermost` is private, but the second privacy rule states that the `try_me`
|
||||
function is allowed to access the `outermost` module because `outermost` is in
|
||||
the current (root) module, as is `try_me`.
|
||||
|
||||
The call to `outermost::middle_function` will work because `middle_function` is
|
||||
public and `try_me` is accessing `middle_function` through its parent module
|
||||
`outermost`. We determined in the previous paragraph that this module is
|
||||
accessible.
|
||||
|
||||
The call to `outermost::middle_secret_function` will cause a compilation error.
|
||||
Because `middle_secret_function` is private, the second rule applies. The root
|
||||
module is neither the current module of `middle_secret_function` (`outermost`
|
||||
is), nor is it a child module of the current module of `middle_secret_function`.
|
||||
|
||||
The module named `inside` is private and has no child modules, so it can be
|
||||
accessed only by its current module `outermost`. That means the `try_me`
|
||||
function is not allowed to call `outermost::inside::inner_function` or
|
||||
`outermost::inside::secret_function`.
|
||||
|
||||
#### Fixing the Errors
|
||||
|
||||
Here are some suggestions for changing the code in an attempt to fix the
|
||||
errors. Make a guess as to whether it will fix the errors before you try each
|
||||
one. Then compile the code to see whether or not you’re right, using the
|
||||
privacy rules to understand why. Feel free to design more experiments and try
|
||||
them out!
|
||||
|
||||
* What if the `inside` module were public?
|
||||
* What if `outermost` were public and `inside` were private?
|
||||
* What if, in the body of `inner_function`, you called
|
||||
`::outermost::middle_secret_function()`? (The two colons at the beginning mean
|
||||
that we want to refer to the modules starting from the root module.)
|
||||
|
||||
Next, let’s talk about bringing items into scope with the `use` keyword.
|
||||
271
2018-edition/src/ch07-03-importing-names-with-use.md
Normal file
271
2018-edition/src/ch07-03-importing-names-with-use.md
Normal file
@@ -0,0 +1,271 @@
|
||||
## Referring to Names in Different Modules
|
||||
|
||||
We’ve covered how to call functions defined within a module using the module
|
||||
name as part of the call, as in the call to the `nested_modules` function shown
|
||||
here in Listing 7-7:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
pub mod a {
|
||||
pub mod series {
|
||||
pub mod of {
|
||||
pub fn nested_modules() {}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
fn main() {
|
||||
a::series::of::nested_modules();
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 7-7: Calling a function by fully specifying its
|
||||
enclosing module’s path</span>
|
||||
|
||||
As you can see, referring to the fully qualified name can get quite lengthy.
|
||||
Fortunately, Rust has a keyword to make these calls more concise.
|
||||
|
||||
### Bringing Names into Scope with the `use` Keyword
|
||||
|
||||
Rust’s `use` keyword shortens lengthy function calls by bringing the modules of
|
||||
the function you want to call into scope. Here’s an example of bringing the
|
||||
`a::series::of` module into a binary crate’s root scope:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
pub mod a {
|
||||
pub mod series {
|
||||
pub mod of {
|
||||
pub fn nested_modules() {}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
use a::series::of;
|
||||
|
||||
fn main() {
|
||||
of::nested_modules();
|
||||
}
|
||||
```
|
||||
|
||||
The line `use a::series::of;` means that rather than using the full
|
||||
`a::series::of` path wherever we want to refer to the `of` module, we can use
|
||||
`of`.
|
||||
|
||||
The `use` keyword brings only what we’ve specified into scope: it does not
|
||||
bring children of modules into scope. That’s why we still have to use
|
||||
`of::nested_modules` when we want to call the `nested_modules` function.
|
||||
|
||||
We could have chosen to bring the function into scope by instead specifying the
|
||||
function in the `use` as follows:
|
||||
|
||||
```rust
|
||||
pub mod a {
|
||||
pub mod series {
|
||||
pub mod of {
|
||||
pub fn nested_modules() {}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
use a::series::of::nested_modules;
|
||||
|
||||
fn main() {
|
||||
nested_modules();
|
||||
}
|
||||
```
|
||||
|
||||
Doing so allows us to exclude all the modules and reference the function
|
||||
directly.
|
||||
|
||||
Because enums also form a sort of namespace like modules, we can bring an
|
||||
enum’s variants into scope with `use` as well. For any kind of `use` statement,
|
||||
if you’re bringing multiple items from one namespace into scope, you can list
|
||||
them using curly brackets and commas in the last position, like so:
|
||||
|
||||
```rust
|
||||
enum TrafficLight {
|
||||
Red,
|
||||
Yellow,
|
||||
Green,
|
||||
}
|
||||
|
||||
use TrafficLight::{Red, Yellow};
|
||||
|
||||
fn main() {
|
||||
let red = Red;
|
||||
let yellow = Yellow;
|
||||
let green = TrafficLight::Green;
|
||||
}
|
||||
```
|
||||
|
||||
We’re still specifying the `TrafficLight` namespace for the `Green` variant
|
||||
because we didn’t include `Green` in the `use` statement.
|
||||
|
||||
### Bringing All Names into Scope with a Glob
|
||||
|
||||
To bring all the items in a namespace into scope at once, we can use the `*`
|
||||
syntax, which is called the *glob operator*. This example brings all the
|
||||
variants of an enum into scope without having to list each specifically:
|
||||
|
||||
```rust
|
||||
enum TrafficLight {
|
||||
Red,
|
||||
Yellow,
|
||||
Green,
|
||||
}
|
||||
|
||||
use TrafficLight::*;
|
||||
|
||||
fn main() {
|
||||
let red = Red;
|
||||
let yellow = Yellow;
|
||||
let green = Green;
|
||||
}
|
||||
```
|
||||
|
||||
The `*` will bring into scope all the visible items in the `TrafficLight`
|
||||
namespace. You should use globs sparingly: they are convenient, but a glob
|
||||
might also pull in more items than you expected and cause naming conflicts.
|
||||
|
||||
### Using `super` to Access a Parent Module
|
||||
|
||||
As you saw at the beginning of this chapter, when you create a library crate,
|
||||
Cargo makes a `tests` module for you. Let’s go into more detail about that now.
|
||||
In your `communicator` project, open *src/lib.rs*:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub mod client;
|
||||
|
||||
pub mod network;
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
#[test]
|
||||
fn it_works() {
|
||||
assert_eq!(2 + 2, 4);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Chapter 11 explains more about testing, but parts of this example should make
|
||||
sense now: we have a module named `tests` that lives next to our other modules
|
||||
and contains one function named `it_works`. Even though there are special
|
||||
annotations, the `tests` module is just another module! So our module hierarchy
|
||||
looks like this:
|
||||
|
||||
```text
|
||||
communicator
|
||||
├── client
|
||||
├── network
|
||||
| └── client
|
||||
└── tests
|
||||
```
|
||||
|
||||
Tests are for exercising the code within our library, so let’s try to call our
|
||||
`client::connect` function from this `it_works` function, even though we won’t
|
||||
be checking any functionality right now. This won’t work yet:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
#[test]
|
||||
fn it_works() {
|
||||
client::connect();
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Run the tests by invoking the `cargo test` command:
|
||||
|
||||
```text
|
||||
$ cargo test
|
||||
Compiling communicator v0.1.0 (file:///projects/communicator)
|
||||
error[E0433]: failed to resolve. Use of undeclared type or module `client`
|
||||
--> src/lib.rs:9:9
|
||||
|
|
||||
9 | client::connect();
|
||||
| ^^^^^^ Use of undeclared type or module `client`
|
||||
```
|
||||
|
||||
The compilation failed, but why? We don’t need to place `communicator::` in
|
||||
front of the function, as we did in *src/main.rs*, because we are definitely
|
||||
within the `communicator` library crate here. The reason is that paths are
|
||||
always relative to the current module, which here is `tests`. The only
|
||||
exception is in a `use` statement, where paths are relative to the crate root
|
||||
by default. Our `tests` module needs the `client` module in its scope!
|
||||
|
||||
So how do we get back up one module in the module hierarchy to call the
|
||||
`client::connect` function in the `tests` module? In the `tests` module, we can
|
||||
either use leading colons to let Rust know that we want to start from the root
|
||||
and list the whole path, like this:
|
||||
|
||||
```rust,ignore
|
||||
::client::connect();
|
||||
```
|
||||
|
||||
Or, we can use `super` to move up one module in the hierarchy from our current
|
||||
module, like this:
|
||||
|
||||
```rust,ignore
|
||||
super::client::connect();
|
||||
```
|
||||
|
||||
These two options don’t look that different in this example, but if you’re
|
||||
deeper in a module hierarchy, starting from the root every time would make your
|
||||
code lengthy. In those cases, using `super` to get from the current module to
|
||||
sibling modules is a good shortcut. Plus, if you’ve specified the path from the
|
||||
root in many places in your code and then rearrange your modules by moving a
|
||||
subtree to another place, you’ll end up needing to update the path in several
|
||||
places, which would be tedious.
|
||||
|
||||
It would also be annoying to have to type `super::` in each test, but you’ve
|
||||
already seen the tool for that solution: `use`! The `super::` functionality
|
||||
changes the path you give to `use` so it is relative to the parent module
|
||||
instead of to the root module.
|
||||
|
||||
For these reasons, in the `tests` module especially, `use super::something` is
|
||||
usually the best solution. So now our test looks like this:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::client;
|
||||
|
||||
#[test]
|
||||
fn it_works() {
|
||||
client::connect();
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
When we run `cargo test` again, the test will pass, and the first part of the
|
||||
test result output will be the following:
|
||||
|
||||
```text
|
||||
$ cargo test
|
||||
Compiling communicator v0.1.0 (file:///projects/communicator)
|
||||
Running target/debug/communicator-92007ddb5330fa5a
|
||||
|
||||
running 1 test
|
||||
test tests::it_works ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
## Summary
|
||||
|
||||
Now you know some new techniques for organizing your code! Use these techniques
|
||||
to group related functionality together, keep files from becoming too long, and
|
||||
present a tidy public API to your library users.
|
||||
|
||||
Next, we’ll look at some collection data structures in the standard library
|
||||
that you can use in your nice, neat code.
|
||||
25
2018-edition/src/ch08-00-common-collections.md
Normal file
25
2018-edition/src/ch08-00-common-collections.md
Normal file
@@ -0,0 +1,25 @@
|
||||
# Common Collections
|
||||
|
||||
Rust’s standard library includes a number of very useful data structures called
|
||||
*collections*. Most other data types represent one specific value, but
|
||||
collections can contain multiple values. Unlike the built-in array and tuple
|
||||
types, the data these collections point to is stored on the heap, which means
|
||||
the amount of data does not need to be known at compile time and can grow or
|
||||
shrink as the program runs. Each kind of collection has different capabilities
|
||||
and costs, and choosing an appropriate one for your current situation is a
|
||||
skill you’ll develop over time. In this chapter, we’ll discuss three
|
||||
collections that are used very often in Rust programs:
|
||||
|
||||
* A *vector* allows you to store a variable number of values next to each other.
|
||||
* A *string* is a collection of characters. We’ve mentioned the `String` type
|
||||
previously, but in this chapter we’ll talk about it in depth.
|
||||
* A *hash map* allows you to associate a value with a particular key. It’s a
|
||||
particular implementation of the more general data structure called a *map*.
|
||||
|
||||
To learn about the other kinds of collections provided by the standard library,
|
||||
see [the documentation][collections].
|
||||
|
||||
[collections]: ../../std/collections/index.html
|
||||
|
||||
We’ll discuss how to create and update vectors, strings, and hash maps, as well
|
||||
as what makes each special.
|
||||
280
2018-edition/src/ch08-01-vectors.md
Normal file
280
2018-edition/src/ch08-01-vectors.md
Normal file
@@ -0,0 +1,280 @@
|
||||
## Storing Lists of Values with Vectors
|
||||
|
||||
The first collection type we’ll look at is `Vec<T>`, also known as a *vector*.
|
||||
Vectors allow you to store more than one value in a single data structure that
|
||||
puts all the values next to each other in memory. Vectors can only store values
|
||||
of the same type. They are useful when you have a list of items, such as the
|
||||
lines of text in a file or the prices of items in a shopping cart.
|
||||
|
||||
### Creating a New Vector
|
||||
|
||||
To create a new, empty vector, we can call the `Vec::new` function, as shown in
|
||||
Listing 8-1:
|
||||
|
||||
```rust
|
||||
let v: Vec<i32> = Vec::new();
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-1: Creating a new, empty vector to hold values
|
||||
of type `i32`</span>
|
||||
|
||||
Note that we added a type annotation here. Because we aren’t inserting any
|
||||
values into this vector, Rust doesn’t know what kind of elements we intend to
|
||||
store. This is an important point. Vectors are implemented using generics;
|
||||
we’ll cover how to use generics with your own types in Chapter 10. For now,
|
||||
know that the `Vec<T>` type provided by the standard library can hold any type,
|
||||
and when a specific vector holds a specific type, the type is specified within
|
||||
angle brackets. In Listing 8-1, we’ve told Rust that the `Vec<T>` in `v` will
|
||||
hold elements of the `i32` type.
|
||||
|
||||
In more realistic code, Rust can often infer the type of value you want to
|
||||
store once you insert values, so you rarely need to do this type annotation.
|
||||
It’s more common to create a `Vec<T>` that has initial values, and Rust
|
||||
provides the `vec!` macro for convenience. The macro will create a new vector
|
||||
that holds the values you give it. Listing 8-2 creates a new `Vec<i32>` that
|
||||
holds the values `1`, `2`, and `3`:
|
||||
|
||||
```rust
|
||||
let v = vec![1, 2, 3];
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-2: Creating a new vector containing
|
||||
values</span>
|
||||
|
||||
Because we’ve given initial `i32` values, Rust can infer that the type of `v`
|
||||
is `Vec<i32>`, and the type annotation isn’t necessary. Next, we’ll look at how
|
||||
to modify a vector.
|
||||
|
||||
### Updating a Vector
|
||||
|
||||
To create a vector and then add elements to it, we can use the `push` method,
|
||||
as shown in Listing 8-3:
|
||||
|
||||
```rust
|
||||
let mut v = Vec::new();
|
||||
|
||||
v.push(5);
|
||||
v.push(6);
|
||||
v.push(7);
|
||||
v.push(8);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-3: Using the `push` method to add values to a
|
||||
vector</span>
|
||||
|
||||
As with any variable, if we want to be able to change its value, we need to
|
||||
make it mutable using the `mut` keyword, as discussed in Chapter 3. The numbers
|
||||
we place inside are all of type `i32`, and Rust infers this from the data, so
|
||||
we don’t need the `Vec<i32>` annotation.
|
||||
|
||||
### Dropping a Vector Drops Its Elements
|
||||
|
||||
Like any other `struct`, a vector is freed when it goes out of scope, as
|
||||
annotated in Listing 8-4:
|
||||
|
||||
```rust
|
||||
{
|
||||
let v = vec![1, 2, 3, 4];
|
||||
|
||||
// do stuff with v
|
||||
|
||||
} // <- v goes out of scope and is freed here
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-4: Showing where the vector and its elements
|
||||
are dropped</span>
|
||||
|
||||
When the vector gets dropped, all of its contents are also dropped, meaning
|
||||
those integers it holds will be cleaned up. This may seem like a
|
||||
straightforward point but can get a bit more complicated when you start to
|
||||
introduce references to the elements of the vector. Let’s tackle that next!
|
||||
|
||||
### Reading Elements of Vectors
|
||||
|
||||
Now that you know how to create, update, and destroy vectors, knowing how to
|
||||
read their contents is a good next step. There are two ways to reference a
|
||||
value stored in a vector. In the examples, we’ve annotated the types of the
|
||||
values that are returned from these functions for extra clarity.
|
||||
|
||||
Listing 8-5 shows both methods of accessing a value in a vector, either with
|
||||
indexing syntax or the `get` method:
|
||||
|
||||
```rust
|
||||
let v = vec![1, 2, 3, 4, 5];
|
||||
|
||||
let third: &i32 = &v[2];
|
||||
let third: Option<&i32> = v.get(2);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-5: Using indexing syntax or the `get` method to
|
||||
access an item in a vector</span>
|
||||
|
||||
Note two details here. First, we use the index value of `2` to get the third
|
||||
element: vectors are indexed by number, starting at zero. Second, the two ways
|
||||
to get the third element are by using `&` and `[]`, which gives us a reference,
|
||||
or by using the `get` method with the index passed as an argument, which gives
|
||||
us an `Option<&T>`.
|
||||
|
||||
Rust has two ways to reference an element so you can choose how the program
|
||||
behaves when you try to use an index value that the vector doesn’t have an
|
||||
element for. As an example, let’s see what a program will do if it has a vector
|
||||
that holds five elements and then tries to access an element at index 100, as
|
||||
shown in Listing 8-6:
|
||||
|
||||
```rust,should_panic
|
||||
let v = vec![1, 2, 3, 4, 5];
|
||||
|
||||
let does_not_exist = &v[100];
|
||||
let does_not_exist = v.get(100);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-6: Attempting to access the element at index
|
||||
100 in a vector containing five elements</span>
|
||||
|
||||
When we run this code, the first `[]` method will cause the program to panic
|
||||
because it references a nonexistent element. This method is best used when you
|
||||
want your program to crash if there’s an attempt to access an element past the
|
||||
end of the vector.
|
||||
|
||||
When the `get` method is passed an index that is outside the vector, it returns
|
||||
`None` without panicking. You would use this method if accessing an element
|
||||
beyond the range of the vector happens occasionally under normal circumstances.
|
||||
Your code will then have logic to handle having either `Some(&element)` or
|
||||
`None`, as discussed in Chapter 6. For example, the index could be coming from
|
||||
a person entering a number. If they accidentally enter a number that’s too
|
||||
large and the program gets a `None` value, you could tell the user how many
|
||||
items are in the current vector and give them another chance to enter a valid
|
||||
value. That would be more user-friendly than crashing the program due to a typo!
|
||||
|
||||
When the program has a valid reference, the borrow checker enforces the
|
||||
ownership and borrowing rules (covered in Chapter 4) to ensure this reference
|
||||
and any other references to the contents of the vector remain valid. Recall the
|
||||
rule that states you can’t have mutable and immutable references in the same
|
||||
scope. That rule applies in Listing 8-7, where we hold an immutable reference to
|
||||
the first element in a vector and try to add an element to the end, which won’t
|
||||
work:
|
||||
|
||||
```rust,ignore
|
||||
let mut v = vec![1, 2, 3, 4, 5];
|
||||
|
||||
let first = &v[0];
|
||||
|
||||
v.push(6);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-7: Attempting to add an element to a vector
|
||||
while holding a reference to an item</span>
|
||||
|
||||
Compiling this code will result in this error:
|
||||
|
||||
```text
|
||||
error[E0502]: cannot borrow `v` as mutable because it is also borrowed as immutable
|
||||
-->
|
||||
|
|
||||
4 | let first = &v[0];
|
||||
| - immutable borrow occurs here
|
||||
5 |
|
||||
6 | v.push(6);
|
||||
| ^ mutable borrow occurs here
|
||||
7 |
|
||||
8 | }
|
||||
| - immutable borrow ends here
|
||||
```
|
||||
|
||||
The code in Listing 8-7 might look like it should work: why should a reference
|
||||
to the first element care about what changes at the end of the vector? This
|
||||
error is due to the way vectors work: adding a new element onto the end of the
|
||||
vector might require allocating new memory and copying the old elements to the
|
||||
new space, if there isn’t enough room to put all the elements next to each
|
||||
other where the vector currently is. In that case, the reference to the first
|
||||
element would be pointing to deallocated memory. The borrowing rules prevent
|
||||
programs from ending up in that situation.
|
||||
|
||||
> Note: For more on the implementation details of the `Vec<T>` type, see “The
|
||||
> Rustonomicon” at https://doc.rust-lang.org/stable/nomicon/vec.html.
|
||||
|
||||
### Iterating over the Values in a Vector
|
||||
|
||||
If we want to access each element in a vector in turn, we can iterate through
|
||||
all of the elements rather than use indexes to access one at a time. Listing
|
||||
8-8 shows how to use a `for` loop to get immutable references to each element
|
||||
in a vector of `i32` values and print them:
|
||||
|
||||
```rust
|
||||
let v = vec![100, 32, 57];
|
||||
for i in &v {
|
||||
println!("{}", i);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-8: Printing each element in a vector by
|
||||
iterating over the elements using a `for` loop</span>
|
||||
|
||||
We can also iterate over mutable references to each element in a mutable vector
|
||||
in order to make changes to all the elements. The `for` loop in Listing 8-9
|
||||
will add `50` to each element:
|
||||
|
||||
```rust
|
||||
let mut v = vec![100, 32, 57];
|
||||
for i in &mut v {
|
||||
*i += 50;
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-9: Iterating over mutable references to
|
||||
elements in a vector</span>
|
||||
|
||||
To change the value that the mutable reference refers to, we have to use the
|
||||
dereference operator (`*`) to get to the value in `i` before we can use the
|
||||
`+=` operator .
|
||||
|
||||
### Using an Enum to Store Multiple Types
|
||||
|
||||
At the beginning of this chapter, we said that vectors can only store values
|
||||
that are the same type. This can be inconvenient; there are definitely use
|
||||
cases for needing to store a list of items of different types. Fortunately, the
|
||||
variants of an enum are defined under the same enum type, so when we need to
|
||||
store elements of a different type in a vector, we can define and use an enum!
|
||||
|
||||
For example, say we want to get values from a row in a spreadsheet in which
|
||||
some of the columns in the row contain integers, some floating-point numbers,
|
||||
and some strings. We can define an enum whose variants will hold the different
|
||||
value types, and then all the enum variants will be considered the same type:
|
||||
that of the enum. Then we can create a vector that holds that enum and so,
|
||||
ultimately, holds different types. We’ve demonstrated this in Listing 8-10:
|
||||
|
||||
```rust
|
||||
enum SpreadsheetCell {
|
||||
Int(i32),
|
||||
Float(f64),
|
||||
Text(String),
|
||||
}
|
||||
|
||||
let row = vec![
|
||||
SpreadsheetCell::Int(3),
|
||||
SpreadsheetCell::Text(String::from("blue")),
|
||||
SpreadsheetCell::Float(10.12),
|
||||
];
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-10: Defining an `enum` to store values of
|
||||
different types in one vector</span>
|
||||
|
||||
Rust needs to know what types will be in the vector at compile time so it knows
|
||||
exactly how much memory on the heap will be needed to store each element. A
|
||||
secondary advantage is that we can be explicit about what types are allowed in
|
||||
this vector. If Rust allowed a vector to hold any type, there would be a chance
|
||||
that one or more of the types would cause errors with the operations performed
|
||||
on the elements of the vector. Using an enum plus a `match` expression means
|
||||
that Rust will ensure at compile time that every possible case is handled, as
|
||||
discussed in Chapter 6.
|
||||
|
||||
When you’re writing a program, if you don’t know the exhaustive set of types
|
||||
the program will get at runtime to store in a vector, the enum technique won’t
|
||||
work. Instead, you can use a trait object, which we’ll cover in Chapter 17.
|
||||
|
||||
Now that we’ve discussed some of the most common ways to use vectors, be sure
|
||||
to review the API documentation for all the many useful methods defined on
|
||||
`Vec<T>` by the standard library. For example, in addition to `push`, a `pop`
|
||||
method removes and returns the last element. Let’s move on to the next
|
||||
collection type: `String`!
|
||||
452
2018-edition/src/ch08-02-strings.md
Normal file
452
2018-edition/src/ch08-02-strings.md
Normal file
@@ -0,0 +1,452 @@
|
||||
## Storing UTF-8 Encoded Text with Strings
|
||||
|
||||
We talked about strings in Chapter 4, but we’ll look at them in more depth now.
|
||||
New Rustaceans commonly get stuck on strings due to a combination of three
|
||||
reasons: Rust’s propensity for exposing possible errors, strings being a more
|
||||
complicated data structure than many programmers give them credit for, and
|
||||
UTF-8. These factors combine in a way that can seem difficult when you’re
|
||||
coming from other programming languages.
|
||||
|
||||
It’s useful to discuss strings in the context of collections because strings
|
||||
are implemented as a collection of bytes, plus some methods to provide useful
|
||||
functionality when those bytes are interpreted as text. In this section, we’ll
|
||||
talk about the operations on `String` that every collection type has, such as
|
||||
creating, updating, and reading. We’ll also discuss the ways in which `String`
|
||||
is different from the other collections, namely how indexing into a `String` is
|
||||
complicated by the differences between how people and computers interpret
|
||||
`String` data.
|
||||
|
||||
### What Is a String?
|
||||
|
||||
We’ll first define what we mean by the term *string*. Rust has only one string
|
||||
type in the core language, which is the string slice `str` that is usually seen
|
||||
in its borrowed form `&str`. In Chapter 4, we talked about *string slices*,
|
||||
which are references to some UTF-8 encoded string data stored elsewhere. String
|
||||
literals, for example, are stored in the binary output of the program and are
|
||||
therefore string slices.
|
||||
|
||||
The `String` type, which is provided by Rust’s standard library rather than
|
||||
coded into the core language, is a growable, mutable, owned, UTF-8 encoded
|
||||
string type. When Rustaceans refer to “strings” in Rust, they usually mean the
|
||||
`String` and the string slice `&str` types, not just one of those types.
|
||||
Although this section is largely about `String`, both types are used heavily in
|
||||
Rust’s standard library, and both `String` and string slices are UTF-8 encoded.
|
||||
|
||||
Rust’s standard library also includes a number of other string types, such as
|
||||
`OsString`, `OsStr`, `CString`, and `CStr`. Library crates can provide even
|
||||
more options for storing string data. See how those names all end in `String`
|
||||
or `Str`? They refer to owned and borrowed variants, just like the `String` and
|
||||
`str` types you’ve seen previously. These string types can store text in
|
||||
different encodings or be represented in memory in a different way, for
|
||||
example. We won’t discuss these other string types in this chapter; see their
|
||||
API documentation for more about how to use them and when each is appropriate.
|
||||
|
||||
### Creating a New String
|
||||
|
||||
Many of the same operations available with `Vec<T>` are available with `String`
|
||||
as well, starting with the `new` function to create a string, shown in Listing
|
||||
8-11:
|
||||
|
||||
```rust
|
||||
let mut s = String::new();
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-11: Creating a new, empty `String`</span>
|
||||
|
||||
This line creates a new empty string called `s`, which we can then load data
|
||||
into. Often, we’ll have some initial data that we want to start the string
|
||||
with. For that, we use the `to_string` method, which is available on any type
|
||||
that implements the `Display` trait, as string literals do. Listing 8-12 shows
|
||||
two examples:
|
||||
|
||||
```rust
|
||||
let data = "initial contents";
|
||||
|
||||
let s = data.to_string();
|
||||
|
||||
// the method also works on a literal directly:
|
||||
let s = "initial contents".to_string();
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-12: Using the `to_string` method to create a
|
||||
`String` from a string literal</span>
|
||||
|
||||
This code creates a string containing `initial contents`.
|
||||
|
||||
We can also use the function `String::from` to create a `String` from a string
|
||||
literal. The code in Listing 8-13 is equivalent to the code from Listing 8-12
|
||||
that uses `to_string`:
|
||||
|
||||
```rust
|
||||
let s = String::from("initial contents");
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-13: Using the `String::from` function to create
|
||||
a `String` from a string literal</span>
|
||||
|
||||
Because strings are used for so many things, we can use many different generic
|
||||
APIs for strings, providing us with a lot of options. Some of them can seem
|
||||
redundant, but they all have their place! In this case, `String::from` and
|
||||
`to_string` do the same thing, so which you choose is a matter of style.
|
||||
|
||||
Remember that strings are UTF-8 encoded, so we can include any properly encoded
|
||||
data in them, as shown in Listing 8-14:
|
||||
|
||||
```rust
|
||||
let hello = String::from("السلام عليكم");
|
||||
let hello = String::from("Dobrý den");
|
||||
let hello = String::from("Hello");
|
||||
let hello = String::from("שָׁלוֹם");
|
||||
let hello = String::from("नमस्ते");
|
||||
let hello = String::from("こんにちは");
|
||||
let hello = String::from("안녕하세요");
|
||||
let hello = String::from("你好");
|
||||
let hello = String::from("Olá");
|
||||
let hello = String::from("Здравствуйте");
|
||||
let hello = String::from("Hola");
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-14: Storing greetings in different languages in
|
||||
strings</span>
|
||||
|
||||
All of these are valid `String` values.
|
||||
|
||||
### Updating a String
|
||||
|
||||
A `String` can grow in size and its contents can change, just like the contents
|
||||
of a `Vec<T>`, if you push more data into it. In addition, you can conveniently
|
||||
use the `+` operator or the `format!` macro to concatenate `String` values.
|
||||
|
||||
#### Appending to a String with `push_str` and `push`
|
||||
|
||||
We can grow a `String` by using the `push_str` method to append a string slice,
|
||||
as shown in Listing 8-15:
|
||||
|
||||
```rust
|
||||
let mut s = String::from("foo");
|
||||
s.push_str("bar");
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-15: Appending a string slice to a `String`
|
||||
using the `push_str` method</span>
|
||||
|
||||
After these two lines, `s` will contain `foobar`. The `push_str` method takes a
|
||||
string slice because we don’t necessarily want to take ownership of the
|
||||
parameter. For example, the code in Listing 8-16 shows that it would be
|
||||
unfortunate if we weren’t able to use `s2` after appending its contents to `s1`:
|
||||
|
||||
```rust
|
||||
let mut s1 = String::from("foo");
|
||||
let s2 = "bar";
|
||||
s1.push_str(s2);
|
||||
println!("s2 is {}", s2);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-16: Using a string slice after appending its
|
||||
contents to a `String`</span>
|
||||
|
||||
If the `push_str` method took ownership of `s2`, we wouldn’t be able to print
|
||||
its value on the last line. However, this code works as we’d expect!
|
||||
|
||||
The `push` method takes a single character as a parameter and adds it to the
|
||||
`String`. Listing 8-17 shows code that adds the letter l to a `String` using
|
||||
the `push` method:
|
||||
|
||||
```rust
|
||||
let mut s = String::from("lo");
|
||||
s.push('l');
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-17: Adding one character to a `String` value
|
||||
using `push`</span>
|
||||
|
||||
As a result of this code, `s` will contain `lol`.
|
||||
|
||||
#### Concatenation with the `+` Operator or the `format!` Macro
|
||||
|
||||
Often, you’ll want to combine two existing strings. One way is to use the `+`
|
||||
operator, as shown in Listing 8-18:
|
||||
|
||||
```rust
|
||||
let s1 = String::from("Hello, ");
|
||||
let s2 = String::from("world!");
|
||||
let s3 = s1 + &s2; // Note s1 has been moved here and can no longer be used
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-18: Using the `+` operator to combine two
|
||||
`String` values into a new `String` value</span>
|
||||
|
||||
The string `s3` will contain `Hello, world!` as a result of this code. The
|
||||
reason `s1` is no longer valid after the addition and the reason we used a
|
||||
reference to `s2` has to do with the signature of the method that gets called
|
||||
when we use the `+` operator. The `+` operator uses the `add` method, whose
|
||||
signature looks something like this:
|
||||
|
||||
```rust,ignore
|
||||
fn add(self, s: &str) -> String {
|
||||
```
|
||||
|
||||
This isn’t the exact signature that’s in the standard library: in the standard
|
||||
library, `add` is defined using generics. Here, we’re looking at the signature
|
||||
of `add` with concrete types substituted for the generic ones, which is what
|
||||
happens when we call this method with `String` values. We’ll discuss generics
|
||||
in Chapter 10. This signature gives us the clues we need to understand the
|
||||
tricky bits of the `+` operator.
|
||||
|
||||
First, `s2` has an `&`, meaning that we’re adding a *reference* of the second
|
||||
string to the first string because of the `s` parameter in the `add` function:
|
||||
we can only add a `&str` to a `String`; we can’t add two `String` values
|
||||
together. But wait—the type of `&s2` is `&String`, not `&str`, as specified in
|
||||
the second parameter to `add`. So why does Listing 8-18 compile?
|
||||
|
||||
The reason we’re able to use `&s2` in the call to `add` is that the compiler
|
||||
can *coerce* the `&String` argument into a `&str`. When we call the `add`
|
||||
method, Rust uses a *deref coercion*, which here turns `&s2` into `&s2[..]`.
|
||||
We’ll discuss deref coercion in more depth in Chapter 15. Because `add` does
|
||||
not take ownership of the `s` parameter, `s2` will still be a valid `String`
|
||||
after this operation.
|
||||
|
||||
Second, we can see in the signature that `add` takes ownership of `self`,
|
||||
because `self` does *not* have an `&`. This means `s1` in Listing 8-18 will be
|
||||
moved into the `add` call and no longer be valid after that. So although `let
|
||||
s3 = s1 + &s2;` looks like it will copy both strings and create a new one, this
|
||||
statement actually takes ownership of `s1`, appends a copy of the contents of
|
||||
`s2`, and then returns ownership of the result. In other words, it looks like
|
||||
it’s making a lot of copies but isn’t; the implementation is more efficient
|
||||
than copying.
|
||||
|
||||
If we need to concatenate multiple strings, the behavior of the `+` operator
|
||||
gets unwieldy:
|
||||
|
||||
```rust
|
||||
let s1 = String::from("tic");
|
||||
let s2 = String::from("tac");
|
||||
let s3 = String::from("toe");
|
||||
|
||||
let s = s1 + "-" + &s2 + "-" + &s3;
|
||||
```
|
||||
|
||||
At this point, `s` will be `tic-tac-toe`. With all of the `+` and `"`
|
||||
characters, it’s difficult to see what’s going on. For more complicated string
|
||||
combining, we can use the `format!` macro:
|
||||
|
||||
```rust
|
||||
let s1 = String::from("tic");
|
||||
let s2 = String::from("tac");
|
||||
let s3 = String::from("toe");
|
||||
|
||||
let s = format!("{}-{}-{}", s1, s2, s3);
|
||||
```
|
||||
|
||||
This code also sets `s` to `tic-tac-toe`. The `format!` macro works in the same
|
||||
way as `println!`, but instead of printing the output to the screen, it returns
|
||||
a `String` with the contents. The version of the code using `format!` is much
|
||||
easier to read and doesn’t take ownership of any of its parameters.
|
||||
|
||||
### Indexing into Strings
|
||||
|
||||
In many other programming languages, accessing individual characters in a
|
||||
string by referencing them by index is a valid and common operation. However,
|
||||
if you try to access parts of a `String` using indexing syntax in Rust, you’ll
|
||||
get an error. Consider the invalid code in Listing 8-19:
|
||||
|
||||
```rust,ignore
|
||||
let s1 = String::from("hello");
|
||||
let h = s1[0];
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-19: Attempting to use indexing syntax with a
|
||||
String</span>
|
||||
|
||||
This code will result in the following error:
|
||||
|
||||
```text
|
||||
error[E0277]: the trait bound `std::string::String: std::ops::Index<{integer}>` is not satisfied
|
||||
-->
|
||||
|
|
||||
3 | let h = s1[0];
|
||||
| ^^^^^ the type `std::string::String` cannot be indexed by `{integer}`
|
||||
|
|
||||
= help: the trait `std::ops::Index<{integer}>` is not implemented for `std::string::String`
|
||||
```
|
||||
|
||||
The error and the note tell the story: Rust strings don’t support indexing. But
|
||||
why not? To answer that question, we need to discuss how Rust stores strings in
|
||||
memory.
|
||||
|
||||
#### Internal Representation
|
||||
|
||||
A `String` is a wrapper over a `Vec<u8>`. Let’s look at some of our properly
|
||||
encoded UTF-8 example strings from Listing 8-14. First, this one:
|
||||
|
||||
```rust
|
||||
let len = String::from("Hola").len();
|
||||
```
|
||||
|
||||
In this case, `len` will be 4, which means the vector storing the string “Hola”
|
||||
is 4 bytes long. Each of these letters takes 1 byte when encoded in UTF-8. But
|
||||
what about the following line? (Note that this line begins with the capital
|
||||
Cyrillic letter Ze, not the Arabic number 3.)
|
||||
|
||||
```rust
|
||||
let len = String::from("Здравствуйте").len();
|
||||
```
|
||||
|
||||
Asked how long the string is, you might say 12. However, Rust’s answer is 24:
|
||||
that’s the number of bytes it takes to encode “Здравствуйте” in UTF-8, because
|
||||
each Unicode scalar value takes 2 bytes of storage. Therefore, an index into
|
||||
the string’s bytes will not always correlate to a valid Unicode scalar value.
|
||||
To demonstrate, consider this invalid Rust code:
|
||||
|
||||
```rust,ignore
|
||||
let hello = "Здравствуйте";
|
||||
let answer = &hello[0];
|
||||
```
|
||||
|
||||
What should the value of `answer` be? Should it be `З`, the first letter? When
|
||||
encoded in UTF-8, the first byte of `З` is `208` and the second is `151`, so
|
||||
`answer` should in fact be `208`, but `208` is not a valid character on its
|
||||
own. Returning `208` is likely not what a user would want if they asked for the
|
||||
first letter of this string; however, that’s the only data that Rust has at
|
||||
byte index 0. Users generally don’t want the byte value returned, even if the
|
||||
string contains only Latin letters: if `&"hello"[0]` were valid code that
|
||||
returned the byte value, it would return `104`, not `h`. To avoid returning an
|
||||
unexpected value and causing bugs that might not be discovered immediately,
|
||||
Rust doesn’t compile this code at all and prevents misunderstandings early in
|
||||
the development process.
|
||||
|
||||
#### Bytes and Scalar Values and Grapheme Clusters! Oh My!
|
||||
|
||||
Another point about UTF-8 is that there are actually three relevant ways to
|
||||
look at strings from Rust’s perspective: as bytes, scalar values, and grapheme
|
||||
clusters (the closest thing to what we would call *letters*).
|
||||
|
||||
If we look at the Hindi word “नमस्ते” written in the Devanagari script, it is
|
||||
stored as a vector of `u8` values that looks like this:
|
||||
|
||||
```text
|
||||
[224, 164, 168, 224, 164, 174, 224, 164, 184, 224, 165, 141, 224, 164, 164,
|
||||
224, 165, 135]
|
||||
```
|
||||
|
||||
That’s 18 bytes and is how computers ultimately store this data. If we look at
|
||||
them as Unicode scalar values, which are what Rust’s `char` type is, those
|
||||
bytes look like this:
|
||||
|
||||
```text
|
||||
['न', 'म', 'स', '्', 'त', 'े']
|
||||
```
|
||||
|
||||
There are six `char` values here, but the fourth and sixth are not letters:
|
||||
they’re diacritics that don’t make sense on their own. Finally, if we look at
|
||||
them as grapheme clusters, we’d get what a person would call the four letters
|
||||
that make up the Hindi word:
|
||||
|
||||
```text
|
||||
["न", "म", "स्", "ते"]
|
||||
```
|
||||
|
||||
Rust provides different ways of interpreting the raw string data that computers
|
||||
store so that each program can choose the interpretation it needs, no matter
|
||||
what human language the data is in.
|
||||
|
||||
A final reason Rust doesn’t allow us to index into a `String` to get a
|
||||
character is that indexing operations are expected to always take constant time
|
||||
(O(1)). But it isn’t possible to guarantee that performance with a `String`,
|
||||
because Rust would have to walk through the contents from the beginning to the
|
||||
index to determine how many valid characters there were.
|
||||
|
||||
### Slicing Strings
|
||||
|
||||
Indexing into a string is often a bad idea because it’s not clear what the
|
||||
return type of the string-indexing operation should be: a byte value, a
|
||||
character, a grapheme cluster, or a string slice. Therefore, Rust asks you to
|
||||
be more specific if you really need to use indices to create string slices. To
|
||||
be more specific in your indexing and indicate that you want a string slice,
|
||||
rather than indexing using `[]` with a single number, you can use `[]` with a
|
||||
range to create a string slice containing particular bytes:
|
||||
|
||||
```rust
|
||||
let hello = "Здравствуйте";
|
||||
|
||||
let s = &hello[0..4];
|
||||
```
|
||||
|
||||
Here, `s` will be a `&str` that contains the first 4 bytes of the string.
|
||||
Earlier, we mentioned that each of these characters was 2 bytes, which means
|
||||
`s` will be `Зд`.
|
||||
|
||||
What would happen if we used `&hello[0..1]`? The answer: Rust would panic at
|
||||
runtime in the same way as if an invalid index were accessed in a vector:
|
||||
|
||||
```text
|
||||
thread 'main' panicked at 'byte index 1 is not a char boundary; it is inside 'З' (bytes 0..2) of `Здравствуйте`', src/libcore/str/mod.rs:2188:4
|
||||
```
|
||||
|
||||
You should use ranges to create string slices with caution, because doing so
|
||||
can crash your program.
|
||||
|
||||
### Methods for Iterating Over Strings
|
||||
|
||||
Fortunately, you can access elements in a string in other ways.
|
||||
|
||||
If you need to perform operations on individual Unicode scalar values, the best
|
||||
way to do so is to use the `chars` method. Calling `chars` on “नमस्ते” separates
|
||||
out and returns six values of type `char`, and you can iterate over the result
|
||||
in order to access each element:
|
||||
|
||||
```rust
|
||||
for c in "नमस्ते".chars() {
|
||||
println!("{}", c);
|
||||
}
|
||||
```
|
||||
|
||||
This code will print the following:
|
||||
|
||||
```text
|
||||
न
|
||||
म
|
||||
स
|
||||
्
|
||||
त
|
||||
े
|
||||
```
|
||||
|
||||
The `bytes` method returns each raw byte, which might be appropriate for your
|
||||
domain:
|
||||
|
||||
```rust
|
||||
for b in "नमस्ते".bytes() {
|
||||
println!("{}", b);
|
||||
}
|
||||
```
|
||||
|
||||
This code will print the 18 bytes that make up this `String`:
|
||||
|
||||
```text
|
||||
224
|
||||
164
|
||||
// --snip--
|
||||
165
|
||||
135
|
||||
```
|
||||
|
||||
But be sure to remember that valid Unicode scalar values may be made up of more
|
||||
than 1 byte.
|
||||
|
||||
Getting grapheme clusters from strings is complex, so this functionality is not
|
||||
provided by the standard library. Crates are available on
|
||||
[crates.io](https://crates.io) if this is the functionality you need.
|
||||
|
||||
### Strings Are Not So Simple
|
||||
|
||||
To summarize, strings are complicated. Different programming languages make
|
||||
different choices about how to present this complexity to the programmer. Rust
|
||||
has chosen to make the correct handling of `String` data the default behavior
|
||||
for all Rust programs, which means programmers have to put more thought into
|
||||
handling UTF-8 data upfront. This trade-off exposes more of the complexity of
|
||||
strings than is apparent in other programming languages, but it prevents you
|
||||
from having to handle errors involving non-ASCII characters later in your
|
||||
development life cycle.
|
||||
|
||||
Let’s switch to something a bit less complex: hash maps!
|
||||
299
2018-edition/src/ch08-03-hash-maps.md
Normal file
299
2018-edition/src/ch08-03-hash-maps.md
Normal file
@@ -0,0 +1,299 @@
|
||||
## Storing Keys with Associated Values in Hash Maps
|
||||
|
||||
The last of our common collections is the *hash map*. The type `HashMap<K, V>`
|
||||
stores a mapping of keys of type `K` to values of type `V`. It does this via a
|
||||
*hashing function*, which determines how it places these keys and values into
|
||||
memory. Many programming languages support this kind of data structure, but
|
||||
they often use a different name, such as hash, map, object, hash table, or
|
||||
associative array, just to name a few.
|
||||
|
||||
Hash maps are useful when you want to look up data not by using an index, as
|
||||
you can with vectors, but by using a key that can be of any type. For example,
|
||||
in a game, you could keep track of each team’s score in a hash map in which
|
||||
each key is a team’s name and the values are each team’s score. Given a team
|
||||
name, you can retrieve its score.
|
||||
|
||||
We’ll go over the basic API of hash maps in this section, but many more goodies
|
||||
are hiding in the functions defined on `HashMap<K, V>` by the standard library.
|
||||
As always, check the standard library documentation for more information.
|
||||
|
||||
### Creating a New Hash Map
|
||||
|
||||
You can create an empty hash map with `new` and add elements with `insert`. In
|
||||
Listing 8-20, we’re keeping track of the scores of two teams whose names are
|
||||
Blue and Yellow. The Blue team starts with 10 points, and the Yellow team
|
||||
starts with 50:
|
||||
|
||||
```rust
|
||||
use std::collections::HashMap;
|
||||
|
||||
let mut scores = HashMap::new();
|
||||
|
||||
scores.insert(String::from("Blue"), 10);
|
||||
scores.insert(String::from("Yellow"), 50);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-20: Creating a new hash map and inserting some
|
||||
keys and values</span>
|
||||
|
||||
Note that we need to first `use` the `HashMap` from the collections portion of
|
||||
the standard library. Of our three common collections, this one is the least
|
||||
often used, so it’s not included in the features brought into scope
|
||||
automatically in the prelude. Hash maps also have less support from the
|
||||
standard library; there’s no built-in macro to construct them, for example.
|
||||
|
||||
Just like vectors, hash maps store their data on the heap. This `HashMap` has
|
||||
keys of type `String` and values of type `i32`. Like vectors, hash maps are
|
||||
homogeneous: all of the keys must have the same type, and all of the values
|
||||
must have the same type.
|
||||
|
||||
Another way of constructing a hash map is by using the `collect` method on a
|
||||
vector of tuples, where each tuple consists of a key and its value. The
|
||||
`collect` method gathers data into a number of collection types, including
|
||||
`HashMap`. For example, if we had the team names and initial scores in two
|
||||
separate vectors, we could use the `zip` method to create a vector of tuples
|
||||
where “Blue” is paired with 10, and so forth. Then we could use the `collect`
|
||||
method to turn that vector of tuples into a hash map, as shown in Listing 8-21:
|
||||
|
||||
```rust
|
||||
use std::collections::HashMap;
|
||||
|
||||
let teams = vec![String::from("Blue"), String::from("Yellow")];
|
||||
let initial_scores = vec![10, 50];
|
||||
|
||||
let scores: HashMap<_, _> = teams.iter().zip(initial_scores.iter()).collect();
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-21: Creating a hash map from a list of teams
|
||||
and a list of scores</span>
|
||||
|
||||
The type annotation `HashMap<_, _>` is needed here because it’s possible to
|
||||
`collect` into many different data structures and Rust doesn’t know which you
|
||||
want unless you specify. For the parameters for the key and value types,
|
||||
however, we use underscores, and Rust can infer the types that the hash map
|
||||
contains based on the types of the data in the vectors.
|
||||
|
||||
### Hash Maps and Ownership
|
||||
|
||||
For types that implement the `Copy` trait, like `i32`, the values are copied
|
||||
into the hash map. For owned values like `String`, the values will be moved and
|
||||
the hash map will be the owner of those values, as demonstrated in Listing 8-22:
|
||||
|
||||
```rust
|
||||
use std::collections::HashMap;
|
||||
|
||||
let field_name = String::from("Favorite color");
|
||||
let field_value = String::from("Blue");
|
||||
|
||||
let mut map = HashMap::new();
|
||||
map.insert(field_name, field_value);
|
||||
// field_name and field_value are invalid at this point, try using them and
|
||||
// see what compiler error you get!
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-22: Showing that keys and values are owned by
|
||||
the hash map once they’re inserted</span>
|
||||
|
||||
We aren’t able to use the variables `field_name` and `field_value` after
|
||||
they’ve been moved into the hash map with the call to `insert`.
|
||||
|
||||
If we insert references to values into the hash map, the values won’t be moved
|
||||
into the hash map. The values that the references point to must be valid for at
|
||||
least as long as the hash map is valid. We’ll talk more about these issues in
|
||||
the “Validating References with Lifetimes” section in Chapter 10.
|
||||
|
||||
### Accessing Values in a Hash Map
|
||||
|
||||
We can get a value out of the hash map by providing its key to the `get`
|
||||
method, as shown in Listing 8-23:
|
||||
|
||||
```rust
|
||||
use std::collections::HashMap;
|
||||
|
||||
let mut scores = HashMap::new();
|
||||
|
||||
scores.insert(String::from("Blue"), 10);
|
||||
scores.insert(String::from("Yellow"), 50);
|
||||
|
||||
let team_name = String::from("Blue");
|
||||
let score = scores.get(&team_name);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-23: Accessing the score for the Blue team
|
||||
stored in the hash map</span>
|
||||
|
||||
Here, `score` will have the value that’s associated with the Blue team, and the
|
||||
result will be `Some(&10)`. The result is wrapped in `Some` because `get`
|
||||
returns an `Option<&V>`; if there’s no value for that key in the hash map,
|
||||
`get` will return `None`. The program will need to handle the `Option` in one
|
||||
of the ways that we covered in Chapter 6.
|
||||
|
||||
We can iterate over each key/value pair in a hash map in a similar manner as we
|
||||
do with vectors, using a `for` loop:
|
||||
|
||||
```rust
|
||||
use std::collections::HashMap;
|
||||
|
||||
let mut scores = HashMap::new();
|
||||
|
||||
scores.insert(String::from("Blue"), 10);
|
||||
scores.insert(String::from("Yellow"), 50);
|
||||
|
||||
for (key, value) in &scores {
|
||||
println!("{}: {}", key, value);
|
||||
}
|
||||
```
|
||||
|
||||
This code will print each pair in an arbitrary order:
|
||||
|
||||
```text
|
||||
Yellow: 50
|
||||
Blue: 10
|
||||
```
|
||||
|
||||
### Updating a Hash Map
|
||||
|
||||
Although the number of keys and values is growable, each key can only have one
|
||||
value associated with it at a time. When you want to change the data in a hash
|
||||
map, you have to decide how to handle the case when a key already has a value
|
||||
assigned. You could replace the old value with the new value, completely
|
||||
disregarding the old value. You could keep the old value and ignore the new
|
||||
value, only adding the new value if the key *doesn’t* already have a value. Or
|
||||
you could combine the old value and the new value. Let’s look at how to do each
|
||||
of these!
|
||||
|
||||
#### Overwriting a Value
|
||||
|
||||
If we insert a key and a value into a hash map and then insert that same key
|
||||
with a different value, the value associated with that key will be replaced.
|
||||
Even though the code in Listing 8-24 calls `insert` twice, the hash map will
|
||||
only contain one key/value pair because we’re inserting the value for the Blue
|
||||
team’s key both times:
|
||||
|
||||
```rust
|
||||
use std::collections::HashMap;
|
||||
|
||||
let mut scores = HashMap::new();
|
||||
|
||||
scores.insert(String::from("Blue"), 10);
|
||||
scores.insert(String::from("Blue"), 25);
|
||||
|
||||
println!("{:?}", scores);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-24: Replacing a value stored with a particular
|
||||
key</span>
|
||||
|
||||
This code will print `{"Blue": 25}`. The original value of `10` has been
|
||||
overwritten.
|
||||
|
||||
#### Only Inserting a Value If the Key Has No Value
|
||||
|
||||
It’s common to check whether a particular key has a value and, if it doesn’t,
|
||||
insert a value for it. Hash maps have a special API for this called `entry`
|
||||
that takes the key you want to check as a parameter. The return value of the
|
||||
`entry` function is an enum called `Entry` that represents a value that might
|
||||
or might not exist. Let’s say we want to check whether the key for the Yellow
|
||||
team has a value associated with it. If it doesn’t, we want to insert the value
|
||||
50, and the same for the Blue team. Using the `entry` API, the code looks like
|
||||
Listing 8-25:
|
||||
|
||||
```rust
|
||||
use std::collections::HashMap;
|
||||
|
||||
let mut scores = HashMap::new();
|
||||
scores.insert(String::from("Blue"), 10);
|
||||
|
||||
scores.entry(String::from("Yellow")).or_insert(50);
|
||||
scores.entry(String::from("Blue")).or_insert(50);
|
||||
|
||||
println!("{:?}", scores);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-25: Using the `entry` method to only insert if
|
||||
the key does not already have a value</span>
|
||||
|
||||
The `or_insert` method on `Entry` is defined to return a mutable reference to
|
||||
the value for the corresponding `Entry` key if that key exists, and if not,
|
||||
inserts the parameter as the new value for this key and returns a mutable
|
||||
reference to the new value. This technique is much cleaner than writing the
|
||||
logic ourselves and, in addition, plays more nicely with the borrow checker.
|
||||
|
||||
Running the code in Listing 8-25 will print `{"Yellow": 50, "Blue": 10}`. The
|
||||
first call to `entry` will insert the key for the Yellow team with the value
|
||||
`50` because the Yellow team doesn’t have a value already. The second call to
|
||||
`entry` will not change the hash map because the Blue team already has the
|
||||
value `10`.
|
||||
|
||||
#### Updating a Value Based on the Old Value
|
||||
|
||||
Another common use case for hash maps is to look up a key’s value and then
|
||||
update it based on the old value. For instance, Listing 8-26 shows code that
|
||||
counts how many times each word appears in some text. We use a hash map with
|
||||
the words as keys and increment the value to keep track of how many times we’ve
|
||||
seen that word. If it’s the first time we’ve seen a word, we’ll first insert
|
||||
the value `0`:
|
||||
|
||||
```rust
|
||||
use std::collections::HashMap;
|
||||
|
||||
let text = "hello world wonderful world";
|
||||
|
||||
let mut map = HashMap::new();
|
||||
|
||||
for word in text.split_whitespace() {
|
||||
let count = map.entry(word).or_insert(0);
|
||||
*count += 1;
|
||||
}
|
||||
|
||||
println!("{:?}", map);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 8-26: Counting occurrences of words using a hash
|
||||
map that stores words and counts</span>
|
||||
|
||||
This code will print `{"world": 2, "hello": 1, "wonderful": 1}`. The
|
||||
`or_insert` method actually returns a mutable reference (`&mut V`) to the value
|
||||
for this key. Here we store that mutable reference in the `count` variable, so
|
||||
in order to assign to that value, we must first dereference `count` using the
|
||||
asterisk (`*`). The mutable reference goes out of scope at the end of the `for`
|
||||
loop, so all of these changes are safe and allowed by the borrowing rules.
|
||||
|
||||
### Hashing Functions
|
||||
|
||||
By default, `HashMap` uses a cryptographically secure hashing function that can
|
||||
provide resistance to Denial of Service (DoS) attacks. This is not the fastest
|
||||
hashing algorithm available, but the trade-off for better security that comes
|
||||
with the drop in performance is worth it. If you profile your code and find
|
||||
that the default hash function is too slow for your purposes, you can switch to
|
||||
another function by specifying a different *hasher*. A hasher is a type that
|
||||
implements the `BuildHasher` trait. We’ll talk about traits and how to
|
||||
implement them in Chapter 10. You don’t necessarily have to implement your own
|
||||
hasher from scratch; [crates.io](https://crates.io) has libraries shared by
|
||||
other Rust users that provide hashers implementing many common hashing
|
||||
algorithms.
|
||||
|
||||
## Summary
|
||||
|
||||
Vectors, strings, and hash maps will provide a large amount of functionality
|
||||
necessary in programs when you need to store, access, and modify data. Here are
|
||||
some exercises you should now be equipped to solve:
|
||||
|
||||
* Given a list of integers, use a vector and return the mean (the average
|
||||
value), median (when sorted, the value in the middle position), and mode (the
|
||||
value that occurs most often; a hash map will be helpful here) of the list.
|
||||
* Convert strings to pig latin. The first consonant of each word is moved to
|
||||
the end of the word and “ay” is added, so “first” becomes “irst-fay.” Words
|
||||
that start with a vowel have “hay” added to the end instead (“apple” becomes
|
||||
“apple-hay”). Keep in mind the details about UTF-8 encoding!
|
||||
* Using a hash map and vectors, create a text interface to allow a user to add
|
||||
employee names to a department in a company. For example, “Add Sally to
|
||||
Engineering” or “Add Amir to Sales.” Then let the user retrieve a list of all
|
||||
people in a department or all people in the company by department, sorted
|
||||
alphabetically.
|
||||
|
||||
The standard library API documentation describes methods that vectors, strings,
|
||||
and hash maps have that will be helpful for these exercises!
|
||||
|
||||
We’re getting into more complex programs in which operations can fail, so, it’s
|
||||
a perfect time to discuss error handling. We’ll do that next!
|
||||
24
2018-edition/src/ch09-00-error-handling.md
Normal file
24
2018-edition/src/ch09-00-error-handling.md
Normal file
@@ -0,0 +1,24 @@
|
||||
# Error Handling
|
||||
|
||||
Rust’s commitment to reliability extends to error handling. Errors are a fact
|
||||
of life in software, so Rust has a number of features for handling situations
|
||||
in which something goes wrong. In many cases, Rust requires you to acknowledge
|
||||
the possibility of an error and take some action before your code will compile.
|
||||
This requirement makes your program more robust by ensuring that you’ll
|
||||
discover errors and handle them appropriately before you’ve deployed your code
|
||||
to production!
|
||||
|
||||
Rust groups errors into two major categories: *recoverable* and *unrecoverable*
|
||||
errors. For a recoverable error, such as a file not found error, it’s
|
||||
reasonable to report the problem to the user and retry the operation.
|
||||
Unrecoverable errors are always symptoms of bugs, like trying to access a
|
||||
location beyond the end of an array.
|
||||
|
||||
Most languages don’t distinguish between these two kinds of errors and handle
|
||||
both in the same way, using mechanisms such as exceptions. Rust doesn’t have
|
||||
exceptions. Instead, it has the type `Result<T, E>` for recoverable errors and
|
||||
the `panic!` macro that stops execution when the program encounters an
|
||||
unrecoverable error. This chapter covers calling `panic!` first and then talks
|
||||
about returning `Result<T, E>` values. Additionally, we’ll explore
|
||||
considerations when deciding whether to try to recover from an error or to stop
|
||||
execution.
|
||||
191
2018-edition/src/ch09-01-unrecoverable-errors-with-panic.md
Normal file
191
2018-edition/src/ch09-01-unrecoverable-errors-with-panic.md
Normal file
@@ -0,0 +1,191 @@
|
||||
## Unrecoverable Errors with `panic!`
|
||||
|
||||
Sometimes, bad things happen in your code, and there’s nothing you can do about
|
||||
it. In these cases, Rust has the `panic!` macro. When the `panic!` macro
|
||||
executes, your program will print a failure message, unwind and clean up the
|
||||
stack, and then quit. This most commonly occurs when a bug of some kind has
|
||||
been detected and it’s not clear to the programmer how to handle the error.
|
||||
|
||||
> ### Unwinding the Stack or Aborting in Response to a Panic
|
||||
>
|
||||
> By default, when a panic occurs, the program starts *unwinding*, which
|
||||
> means Rust walks back up the stack and cleans up the data from each function
|
||||
> it encounters. But this walking back and cleanup is a lot of work. The
|
||||
> alternative is to immediately *abort*, which ends the program without
|
||||
> cleaning up. Memory that the program was using will then need to be cleaned
|
||||
> up by the operating system. If in your project you need to make the resulting
|
||||
> binary as small as possible, you can switch from unwinding to aborting upon a
|
||||
> panic by adding `panic = 'abort'` to the appropriate `[profile]` sections in
|
||||
> your *Cargo.toml* file. For example, if you want to abort on panic in release
|
||||
> mode, add this:
|
||||
>
|
||||
> ```toml
|
||||
> [profile.release]
|
||||
> panic = 'abort'
|
||||
> ```
|
||||
|
||||
Let’s try calling `panic!` in a simple program:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
fn main() {
|
||||
panic!("crash and burn");
|
||||
}
|
||||
```
|
||||
|
||||
When you run the program, you’ll see something like this:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling panic v0.1.0 (file:///projects/panic)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.25 secs
|
||||
Running `target/debug/panic`
|
||||
thread 'main' panicked at 'crash and burn', src/main.rs:2:4
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
```
|
||||
|
||||
The call to `panic!` causes the error message contained in the last three
|
||||
lines. The first line shows our panic message and the place in our source code
|
||||
where the panic occurred: *src/main.rs:2:4* indicates that it’s the second
|
||||
line, fourth character of our *src/main.rs* file.
|
||||
|
||||
In this case, the line indicated is part of our code, and if we go to that
|
||||
line, we see the `panic!` macro call. In other cases, the `panic!` call might
|
||||
be in code that our code calls, and the filename and line number reported by
|
||||
the error message will be someone else’s code where the `panic!` macro is
|
||||
called, not the line of our code that eventually led to the `panic!` call. We
|
||||
can use the backtrace of the functions the `panic!` call came from to figure
|
||||
out the part of our code that is causing the problem. We’ll discuss what a
|
||||
backtrace is in more detail next.
|
||||
|
||||
### Using a `panic!` Backtrace
|
||||
|
||||
Let’s look at another example to see what it’s like when a `panic!` call comes
|
||||
from a library because of a bug in our code instead of from our code calling
|
||||
the macro directly. Listing 9-1 has some code that attempts to access an
|
||||
element by index in a vector:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
fn main() {
|
||||
let v = vec![1, 2, 3];
|
||||
|
||||
v[99];
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-1: Attempting to access an element beyond the
|
||||
end of a vector, which will cause a `panic!`</span>
|
||||
|
||||
Here, we’re attempting to access the hundredth element of our vector (which is
|
||||
at index 99 because indexing starts at zero), but it has only three elements.
|
||||
In this situation, Rust will panic. Using `[]` is supposed to return an
|
||||
element, but if you pass an invalid index, there’s no element that Rust could
|
||||
return here that would be correct.
|
||||
|
||||
Other languages, like C, will attempt to give you exactly what you asked for in
|
||||
this situation, even though it isn’t what you want: you’ll get whatever is at
|
||||
the location in memory that would correspond to that element in the vector,
|
||||
even though the memory doesn’t belong to the vector. This is called a *buffer
|
||||
overread* and can lead to security vulnerabilities if an attacker is able to
|
||||
manipulate the index in such a way as to read data they shouldn’t be allowed to
|
||||
that is stored after the array.
|
||||
|
||||
To protect your program from this sort of vulnerability, if you try to read an
|
||||
element at an index that doesn’t exist, Rust will stop execution and refuse to
|
||||
continue. Let’s try it and see:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling panic v0.1.0 (file:///projects/panic)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.27 secs
|
||||
Running `target/debug/panic`
|
||||
thread 'main' panicked at 'index out of bounds: the len is 3 but the index is
|
||||
99', /checkout/src/liballoc/vec.rs:1555:10
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
```
|
||||
|
||||
This error points at a file we didn’t write, *vec.rs*. That’s the
|
||||
implementation of `Vec<T>` in the standard library. The code that gets run when
|
||||
we use `[]` on our vector `v` is in *vec.rs*, and that is where the `panic!` is
|
||||
actually happening.
|
||||
|
||||
The next note line tells us that we can set the `RUST_BACKTRACE` environment
|
||||
variable to get a backtrace of exactly what happened to cause the error. A
|
||||
*backtrace* is a list of all the functions that have been called to get to this
|
||||
point. Backtraces in Rust work as they do in other languages: the key to
|
||||
reading the backtrace is to start from the top and read until you see files you
|
||||
wrote. That’s the spot where the problem originated. The lines above the lines
|
||||
mentioning your files are code that your code called; the lines below are code
|
||||
that called your code. These lines might include core Rust code, standard
|
||||
library code, or crates that you’re using. Let’s try getting a backtrace by
|
||||
setting the `RUST_BACKTRACE` environment variable to any value except 0.
|
||||
Listing 9-2 shows output similar to what you’ll see:
|
||||
|
||||
```text
|
||||
$ RUST_BACKTRACE=1 cargo run
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/panic`
|
||||
thread 'main' panicked at 'index out of bounds: the len is 3 but the index is 99', /checkout/src/liballoc/vec.rs:1555:10
|
||||
stack backtrace:
|
||||
0: std::sys::imp::backtrace::tracing::imp::unwind_backtrace
|
||||
at /checkout/src/libstd/sys/unix/backtrace/tracing/gcc_s.rs:49
|
||||
1: std::sys_common::backtrace::_print
|
||||
at /checkout/src/libstd/sys_common/backtrace.rs:71
|
||||
2: std::panicking::default_hook::{{closure}}
|
||||
at /checkout/src/libstd/sys_common/backtrace.rs:60
|
||||
at /checkout/src/libstd/panicking.rs:381
|
||||
3: std::panicking::default_hook
|
||||
at /checkout/src/libstd/panicking.rs:397
|
||||
4: std::panicking::rust_panic_with_hook
|
||||
at /checkout/src/libstd/panicking.rs:611
|
||||
5: std::panicking::begin_panic
|
||||
at /checkout/src/libstd/panicking.rs:572
|
||||
6: std::panicking::begin_panic_fmt
|
||||
at /checkout/src/libstd/panicking.rs:522
|
||||
7: rust_begin_unwind
|
||||
at /checkout/src/libstd/panicking.rs:498
|
||||
8: core::panicking::panic_fmt
|
||||
at /checkout/src/libcore/panicking.rs:71
|
||||
9: core::panicking::panic_bounds_check
|
||||
at /checkout/src/libcore/panicking.rs:58
|
||||
10: <alloc::vec::Vec<T> as core::ops::index::Index<usize>>::index
|
||||
at /checkout/src/liballoc/vec.rs:1555
|
||||
11: panic::main
|
||||
at src/main.rs:4
|
||||
12: __rust_maybe_catch_panic
|
||||
at /checkout/src/libpanic_unwind/lib.rs:99
|
||||
13: std::rt::lang_start
|
||||
at /checkout/src/libstd/panicking.rs:459
|
||||
at /checkout/src/libstd/panic.rs:361
|
||||
at /checkout/src/libstd/rt.rs:61
|
||||
14: main
|
||||
15: __libc_start_main
|
||||
16: <unknown>
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-2: The backtrace generated by a call to
|
||||
`panic!` displayed when the environment variable `RUST_BACKTRACE` is set</span>
|
||||
|
||||
That’s a lot of output! The exact output you see might be different depending
|
||||
on your operating system and Rust version. In order to get backtraces with this
|
||||
information, debug symbols must be enabled. Debug symbols are enabled by
|
||||
default when using `cargo build` or `cargo run` without the `--release` flag,
|
||||
as we have here.
|
||||
|
||||
In the output in Listing 9-2, line 11 of the backtrace points to the line in
|
||||
our project that’s causing the problem: line 4 of *src/main.rs*. If we don’t
|
||||
want our program to panic, the location pointed to by the first line mentioning
|
||||
a file we wrote is where we should start investigating. In Listing 9-1, where
|
||||
we deliberately wrote code that would panic in order to demonstrate how to use
|
||||
backtraces, the way to fix the panic is to not request an element at index 99
|
||||
from a vector that only contains 3 items. When your code panics in the future,
|
||||
you’ll need to figure out what action the code is taking with what values to
|
||||
cause the panic and what the code should do instead.
|
||||
|
||||
We’ll come back to `panic!` and when we should and should not use `panic!` to
|
||||
handle error conditions in the “To `panic!` or Not to `panic!`” section later
|
||||
in this chapter. Next, we’ll look at how to recover from an error using
|
||||
`Result`.
|
||||
478
2018-edition/src/ch09-02-recoverable-errors-with-result.md
Normal file
478
2018-edition/src/ch09-02-recoverable-errors-with-result.md
Normal file
@@ -0,0 +1,478 @@
|
||||
## Recoverable Errors with `Result`
|
||||
|
||||
Most errors aren’t serious enough to require the program to stop entirely.
|
||||
Sometimes, when a function fails, it’s for a reason that you can easily
|
||||
interpret and respond to. For example, if you try to open a file and that
|
||||
operation fails because the file doesn’t exist, you might want to create the
|
||||
file instead of terminating the process.
|
||||
|
||||
Recall from “[Handling Potential Failure with the `Result`
|
||||
Type][handle_failure]<!-- ignore -->” in Chapter 2 that the `Result` enum is
|
||||
defined as having two variants, `Ok` and `Err`, as follows:
|
||||
|
||||
[handle_failure]: ch02-00-guessing-game-tutorial.html#handling-potential-failure-with-the-result-type
|
||||
|
||||
```rust
|
||||
enum Result<T, E> {
|
||||
Ok(T),
|
||||
Err(E),
|
||||
}
|
||||
```
|
||||
|
||||
The `T` and `E` are generic type parameters: we’ll discuss generics in more
|
||||
detail in Chapter 10. What you need to know right now is that `T` represents
|
||||
the type of the value that will be returned in a success case within the `Ok`
|
||||
variant, and `E` represents the type of the error that will be returned in a
|
||||
failure case within the `Err` variant. Because `Result` has these generic type
|
||||
parameters, we can use the `Result` type and the functions that the standard
|
||||
library has defined on it in many different situations where the successful
|
||||
value and error value we want to return may differ.
|
||||
|
||||
Let’s call a function that returns a `Result` value because the function could
|
||||
fail. In Listing 9-3 we try to open a file:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::fs::File;
|
||||
|
||||
fn main() {
|
||||
let f = File::open("hello.txt");
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-3: Opening a file</span>
|
||||
|
||||
How do we know `File::open` returns a `Result`? We could look at the standard
|
||||
library API documentation, or we could ask the compiler! If we give `f` a type
|
||||
annotation that we know is *not* the return type of the function and then try
|
||||
to compile the code, the compiler will tell us that the types don’t match. The
|
||||
error message will then tell us what the type of `f` *is*. Let’s try it! We
|
||||
know that the return type of `File::open` isn’t of type `u32`, so let’s change
|
||||
the `let f` statement to this:
|
||||
|
||||
```rust,ignore
|
||||
let f: u32 = File::open("hello.txt");
|
||||
```
|
||||
|
||||
Attempting to compile now gives us the following output:
|
||||
|
||||
```text
|
||||
error[E0308]: mismatched types
|
||||
--> src/main.rs:4:18
|
||||
|
|
||||
4 | let f: u32 = File::open("hello.txt");
|
||||
| ^^^^^^^^^^^^^^^^^^^^^^^ expected u32, found enum
|
||||
`std::result::Result`
|
||||
|
|
||||
= note: expected type `u32`
|
||||
found type `std::result::Result<std::fs::File, std::io::Error>`
|
||||
```
|
||||
|
||||
This tells us the return type of the `File::open` function is a `Result<T, E>`.
|
||||
The generic parameter `T` has been filled in here with the type of the success
|
||||
value, `std::fs::File`, which is a file handle. The type of `E` used in the
|
||||
error value is `std::io::Error`.
|
||||
|
||||
This return type means the call to `File::open` might succeed and return a file
|
||||
handle that we can read from or write to. The function call also might fail:
|
||||
for example, the file might not exist, or we might not have permission to
|
||||
access the file. The `File::open` function needs to have a way to tell us
|
||||
whether it succeeded or failed and at the same time give us either the file
|
||||
handle or error information. This information is exactly what the `Result` enum
|
||||
conveys.
|
||||
|
||||
In the case where `File::open` succeeds, the value in the variable `f` will be
|
||||
an instance of `Ok` that contains a file handle. In the case where it fails,
|
||||
the value in `f` will be an instance of `Err` that contains more information
|
||||
about the kind of error that happened.
|
||||
|
||||
We need to add to the code in Listing 9-3 to take different actions depending
|
||||
on the value `File::open` returns. Listing 9-4 shows one way to handle the
|
||||
`Result` using a basic tool, the `match` expression that we discussed in
|
||||
Chapter 6.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
use std::fs::File;
|
||||
|
||||
fn main() {
|
||||
let f = File::open("hello.txt");
|
||||
|
||||
let f = match f {
|
||||
Ok(file) => file,
|
||||
Err(error) => {
|
||||
panic!("There was a problem opening the file: {:?}", error)
|
||||
},
|
||||
};
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-4: Using a `match` expression to handle the
|
||||
`Result` variants that might be returned</span>
|
||||
|
||||
Note that, like the `Option` enum, the `Result` enum and its variants have been
|
||||
imported in the prelude, so we don’t need to specify `Result::` before the `Ok`
|
||||
and `Err` variants in the `match` arms.
|
||||
|
||||
Here we tell Rust that when the result is `Ok`, return the inner `file` value
|
||||
out of the `Ok` variant, and we then assign that file handle value to the
|
||||
variable `f`. After the `match`, we can use the file handle for reading or
|
||||
writing.
|
||||
|
||||
The other arm of the `match` handles the case where we get an `Err` value from
|
||||
`File::open`. In this example, we’ve chosen to call the `panic!` macro. If
|
||||
there’s no file named *hello.txt* in our current directory and we run this
|
||||
code, we’ll see the following output from the `panic!` macro:
|
||||
|
||||
```text
|
||||
thread 'main' panicked at 'There was a problem opening the file: Error { repr:
|
||||
Os { code: 2, message: "No such file or directory" } }', src/main.rs:9:12
|
||||
```
|
||||
|
||||
As usual, this output tells us exactly what has gone wrong.
|
||||
|
||||
### Matching on Different Errors
|
||||
|
||||
The code in Listing 9-4 will `panic!` no matter why `File::open` failed. What
|
||||
we want to do instead is take different actions for different failure reasons:
|
||||
if `File::open` failed because the file doesn’t exist, we want to create the
|
||||
file and return the handle to the new file. If `File::open` failed for any
|
||||
other reason—for example, because we didn’t have permission to open the file—we
|
||||
still want the code to `panic!` in the same way as it did in Listing 9-4. Look
|
||||
at Listing 9-5, which adds another arm to the `match`:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
<!-- ignore this test because otherwise it creates hello.txt which causes other
|
||||
tests to fail lol -->
|
||||
|
||||
```rust,ignore
|
||||
use std::fs::File;
|
||||
use std::io::ErrorKind;
|
||||
|
||||
fn main() {
|
||||
let f = File::open("hello.txt");
|
||||
|
||||
let f = match f {
|
||||
Ok(file) => file,
|
||||
Err(ref error) if error.kind() == ErrorKind::NotFound => {
|
||||
match File::create("hello.txt") {
|
||||
Ok(fc) => fc,
|
||||
Err(e) => {
|
||||
panic!(
|
||||
"Tried to create file but there was a problem: {:?}",
|
||||
e
|
||||
)
|
||||
},
|
||||
}
|
||||
},
|
||||
Err(error) => {
|
||||
panic!(
|
||||
"There was a problem opening the file: {:?}",
|
||||
error
|
||||
)
|
||||
},
|
||||
};
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-5: Handling different kinds of errors in
|
||||
different ways</span>
|
||||
|
||||
The type of the value that `File::open` returns inside the `Err` variant is
|
||||
`io::Error`, which is a struct provided by the standard library. This struct
|
||||
has a method `kind` that we can call to get an `io::ErrorKind` value. The enum
|
||||
`io::ErrorKind` is provided by the standard library and has variants
|
||||
representing the different kinds of errors that might result from an `io`
|
||||
operation. The variant we want to use is `ErrorKind::NotFound`, which indicates
|
||||
the file we’re trying to open doesn’t exist yet.
|
||||
|
||||
The condition `if error.kind() == ErrorKind::NotFound` is called a *match
|
||||
guard*: it’s an extra condition on a `match` arm that further refines the arm’s
|
||||
pattern. This condition must be true for that arm’s code to be run; otherwise,
|
||||
the pattern matching will move on to consider the next arm in the `match`. The
|
||||
`ref` in the pattern is needed so `error` is not moved into the guard condition
|
||||
but is merely referenced by it. The reason you use `ref` to create a reference
|
||||
in a pattern instead of `&` will be covered in detail in Chapter 18. In short,
|
||||
in the context of a pattern, `&` matches a reference and gives you its value,
|
||||
but `ref` matches a value and gives you a reference to it.
|
||||
|
||||
The condition we want to check in the match guard is whether the value returned
|
||||
by `error.kind()` is the `NotFound` variant of the `ErrorKind` enum. If it is,
|
||||
we try to create the file with `File::create`. However, because `File::create`
|
||||
could also fail, we need to add an inner `match` statement as well. When the
|
||||
file can’t be opened, a different error message will be printed. The last arm
|
||||
of the outer `match` stays the same so the program panics on any error besides
|
||||
the missing file error.
|
||||
|
||||
### Shortcuts for Panic on Error: `unwrap` and `expect`
|
||||
|
||||
Using `match` works well enough, but it can be a bit verbose and doesn’t always
|
||||
communicate intent well. The `Result<T, E>` type has many helper methods
|
||||
defined on it to do various tasks. One of those methods, called `unwrap`, is a
|
||||
shortcut method that is implemented just like the `match` statement we wrote in
|
||||
Listing 9-4. If the `Result` value is the `Ok` variant, `unwrap` will return
|
||||
the value inside the `Ok`. If the `Result` is the `Err` variant, `unwrap` will
|
||||
call the `panic!` macro for us. Here is an example of `unwrap` in action:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
use std::fs::File;
|
||||
|
||||
fn main() {
|
||||
let f = File::open("hello.txt").unwrap();
|
||||
}
|
||||
```
|
||||
|
||||
If we run this code without a *hello.txt* file, we’ll see an error message from
|
||||
the `panic!` call that the `unwrap` method makes:
|
||||
|
||||
```text
|
||||
thread 'main' panicked at 'called `Result::unwrap()` on an `Err` value: Error {
|
||||
repr: Os { code: 2, message: "No such file or directory" } }',
|
||||
src/libcore/result.rs:906:4
|
||||
```
|
||||
|
||||
Another method, `expect`, which is similar to `unwrap`, lets us also choose the
|
||||
`panic!` error message. Using `expect` instead of `unwrap` and providing good
|
||||
error messages can convey your intent and make tracking down the source of a
|
||||
panic easier. The syntax of `expect` looks like this:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
use std::fs::File;
|
||||
|
||||
fn main() {
|
||||
let f = File::open("hello.txt").expect("Failed to open hello.txt");
|
||||
}
|
||||
```
|
||||
|
||||
We use `expect` in the same way as `unwrap`: to return the file handle or call
|
||||
the `panic!` macro. The error message used by `expect` in its call to `panic!`
|
||||
will be the parameter that we pass to `expect`, rather than the default
|
||||
`panic!` message that `unwrap` uses. Here’s what it looks like:
|
||||
|
||||
```text
|
||||
thread 'main' panicked at 'Failed to open hello.txt: Error { repr: Os { code:
|
||||
2, message: "No such file or directory" } }', src/libcore/result.rs:906:4
|
||||
```
|
||||
|
||||
Because this error message starts with the text we specified, `Failed to open
|
||||
hello.txt`, it will be easier to find where in the code this error message is
|
||||
coming from. If we use `unwrap` in multiple places, it can take more time to
|
||||
figure out exactly which `unwrap` is causing the panic because all `unwrap`
|
||||
calls that panic print the same message.
|
||||
|
||||
### Propagating Errors
|
||||
|
||||
When you’re writing a function whose implementation calls something that might
|
||||
fail, instead of handling the error within this function, you can return the
|
||||
error to the calling code so that it can decide what to do. This is known as
|
||||
*propagating* the error and gives more control to the calling code, where there
|
||||
might be more information or logic that dictates how the error should be
|
||||
handled than what you have available in the context of your code.
|
||||
|
||||
For example, Listing 9-6 shows a function that reads a username from a file. If
|
||||
the file doesn’t exist or can’t be read, this function will return those errors
|
||||
to the code that called this function:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::io;
|
||||
use std::io::Read;
|
||||
use std::fs::File;
|
||||
|
||||
fn read_username_from_file() -> Result<String, io::Error> {
|
||||
let f = File::open("hello.txt");
|
||||
|
||||
let mut f = match f {
|
||||
Ok(file) => file,
|
||||
Err(e) => return Err(e),
|
||||
};
|
||||
|
||||
let mut s = String::new();
|
||||
|
||||
match f.read_to_string(&mut s) {
|
||||
Ok(_) => Ok(s),
|
||||
Err(e) => Err(e),
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-6: A function that returns errors to the
|
||||
calling code using `match`</span>
|
||||
|
||||
Let’s look at the return type of the function first: `Result<String,
|
||||
io::Error>`. This means the function is returning a value of the type
|
||||
`Result<T, E>` where the generic parameter `T` has been filled in with the
|
||||
concrete type `String`, and the generic type `E` has been filled in with the
|
||||
concrete type `io::Error`. If this function succeeds without any problems, the
|
||||
code that calls this function will receive an `Ok` value that holds a
|
||||
`String`—the username that this function read from the file. If this function
|
||||
encounters any problems, the code that calls this function will receive an
|
||||
`Err` value that holds an instance of `io::Error` that contains more
|
||||
information about what the problems were. We chose `io::Error` as the return
|
||||
type of this function because that happens to be the type of the error value
|
||||
returned from both of the operations we’re calling in this function’s body that
|
||||
might fail: the `File::open` function and the `read_to_string` method.
|
||||
|
||||
The body of the function starts by calling the `File::open` function. Then we
|
||||
handle the `Result` value returned with a `match` similar to the `match` in
|
||||
Listing 9-4, only instead of calling `panic!` in the `Err` case, we return
|
||||
early from this function and pass the error value from `File::open` back to the
|
||||
calling code as this function’s error value. If `File::open` succeeds, we store
|
||||
the file handle in the variable `f` and continue.
|
||||
|
||||
Then we create a new `String` in variable `s` and call the `read_to_string`
|
||||
method on the file handle in `f` to read the contents of the file into `s`. The
|
||||
`read_to_string` method also returns a `Result` because it might fail, even
|
||||
though `File::open` succeeded. So we need another `match` to handle that
|
||||
`Result`: if `read_to_string` succeeds, then our function has succeeded, and we
|
||||
return the username from the file that’s now in `s` wrapped in an `Ok`. If
|
||||
`read_to_string` fails, we return the error value in the same way that we
|
||||
returned the error value in the `match` that handled the return value of
|
||||
`File::open`. However, we don’t need to explicitly say `return`, because this
|
||||
is the last expression in the function.
|
||||
|
||||
The code that calls this code will then handle getting either an `Ok` value
|
||||
that contains a username or an `Err` value that contains an `io::Error`. We
|
||||
don’t know what the calling code will do with those values. If the calling code
|
||||
gets an `Err` value, it could call `panic!` and crash the program, use a
|
||||
default username, or look up the username from somewhere other than a file, for
|
||||
example. We don’t have enough information on what the calling code is actually
|
||||
trying to do, so we propagate all the success or error information upward for
|
||||
it to handle appropriately.
|
||||
|
||||
This pattern of propagating errors is so common in Rust that Rust provides the
|
||||
question mark operator `?` to make this easier.
|
||||
|
||||
#### A Shortcut for Propagating Errors: the `?` Operator
|
||||
|
||||
Listing 9-7 shows an implementation of `read_username_from_file` that has the
|
||||
same functionality as it had in Listing 9-6, but this implementation uses the
|
||||
question mark operator:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::io;
|
||||
use std::io::Read;
|
||||
use std::fs::File;
|
||||
|
||||
fn read_username_from_file() -> Result<String, io::Error> {
|
||||
let mut f = File::open("hello.txt")?;
|
||||
let mut s = String::new();
|
||||
f.read_to_string(&mut s)?;
|
||||
Ok(s)
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-7: A function that returns errors to the
|
||||
calling code using `?`</span>
|
||||
|
||||
The `?` placed after a `Result` value is defined to work in almost the same way
|
||||
as the `match` expressions we defined to handle the `Result` values in Listing
|
||||
9-6. If the value of the `Result` is an `Ok`, the value inside the `Ok` will
|
||||
get returned from this expression, and the program will continue. If the value
|
||||
is an `Err`, the value inside the `Err` will be returned from the whole
|
||||
function as if we had used the `return` keyword so the error value gets
|
||||
propagated to the calling code.
|
||||
|
||||
There is a difference between what the `match` expression from Listing 9-6 and
|
||||
`?` do: error values used with `?` go through the `from` function, defined in
|
||||
the `From` trait in the standard library, which is used to convert errors from
|
||||
one type into another. When `?` calls the `from` function, the error type
|
||||
received is converted into the error type defined in the return type of the
|
||||
current function. This is useful when a function returns one error type to
|
||||
represent all the ways a function might fail, even if parts might fail for many
|
||||
different reasons. As long as each error type implements the `from` function to
|
||||
define how to convert itself to the returned error type, `?` takes care of the
|
||||
conversion automatically.
|
||||
|
||||
In the context of Listing 9-7, the `?` at the end of the `File::open` call will
|
||||
return the value inside an `Ok` to the variable `f`. If an error occurs, `?`
|
||||
will return early out of the whole function and give any `Err` value to the
|
||||
calling code. The same thing applies to the `?` at the end of the
|
||||
`read_to_string` call.
|
||||
|
||||
The `?` operator eliminates a lot of boilerplate and makes this function’s
|
||||
implementation simpler. We could even shorten this code further by chaining
|
||||
method calls immediately after the `?`, as shown in Listing 9-8:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::io;
|
||||
use std::io::Read;
|
||||
use std::fs::File;
|
||||
|
||||
fn read_username_from_file() -> Result<String, io::Error> {
|
||||
let mut s = String::new();
|
||||
|
||||
File::open("hello.txt")?.read_to_string(&mut s)?;
|
||||
|
||||
Ok(s)
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-8: Chaining method calls after `?`</span>
|
||||
|
||||
We’ve moved the creation of the new `String` in `s` to the beginning of the
|
||||
function; that part hasn’t changed. Instead of creating a variable `f`, we’ve
|
||||
chained the call to `read_to_string` directly onto the result of
|
||||
`File::open("hello.txt")?`. We still have a `?` at the end of the
|
||||
`read_to_string` call, and we still return an `Ok` value containing the
|
||||
username in `s` when both `File::open` and `read_to_string` succeed rather than
|
||||
returning errors. The functionality is again the same as in Listing 9-6 and
|
||||
Listing 9-7; this is just a different, more ergonomic way to write it.
|
||||
|
||||
#### The `?` Operator Can Only Be Used in Functions That Return `Result`
|
||||
|
||||
The `?` operator can only be used in functions that have a return type of
|
||||
`Result`, because it is defined to work in the same way as the `match`
|
||||
expression we defined in Listing 9-6. The part of the `match` that requires a
|
||||
return type of `Result` is `return Err(e)`, so the return type of the function
|
||||
must be a `Result` to be compatible with this `return`.
|
||||
|
||||
Let’s look at what happens if we use `?` in the `main` function, which you’ll
|
||||
recall has a return type of `()`:
|
||||
|
||||
```rust,ignore
|
||||
use std::fs::File;
|
||||
|
||||
fn main() {
|
||||
let f = File::open("hello.txt")?;
|
||||
}
|
||||
```
|
||||
|
||||
When we compile this code, we get the following error message:
|
||||
|
||||
```text
|
||||
error[E0277]: the trait bound `(): std::ops::Try` is not satisfied
|
||||
--> src/main.rs:4:13
|
||||
|
|
||||
4 | let f = File::open("hello.txt")?;
|
||||
| ------------------------
|
||||
| |
|
||||
| the `?` operator can only be used in a function that returns
|
||||
`Result` (or another type that implements `std::ops::Try`)
|
||||
| in this macro invocation
|
||||
|
|
||||
= help: the trait `std::ops::Try` is not implemented for `()`
|
||||
= note: required by `std::ops::Try::from_error`
|
||||
```
|
||||
|
||||
This error points out that we’re only allowed to use `?` in a function that
|
||||
returns `Result`. In functions that don’t return `Result`, when you call other
|
||||
functions that return `Result`, you’ll need to use a `match` or one of the
|
||||
`Result` methods to handle the `Result` instead of using `?` to potentially
|
||||
propagate the error to the calling code.
|
||||
|
||||
Now that we’ve discussed the details of calling `panic!` or returning `Result`,
|
||||
let’s return to the topic of how to decide which is appropriate to use in which
|
||||
cases.
|
||||
243
2018-edition/src/ch09-03-to-panic-or-not-to-panic.md
Normal file
243
2018-edition/src/ch09-03-to-panic-or-not-to-panic.md
Normal file
@@ -0,0 +1,243 @@
|
||||
## To `panic!` or Not to `panic!`
|
||||
|
||||
So how do you decide when you should call `panic!` and when you should return
|
||||
`Result`? When code panics, there’s no way to recover. You could call `panic!`
|
||||
for any error situation, whether there’s a possible way to recover or not, but
|
||||
then you’re making the decision on behalf of the code calling your code that a
|
||||
situation is unrecoverable. When you choose to return a `Result` value, you
|
||||
give the calling code options rather than making the decision for it. The
|
||||
calling code could choose to attempt to recover in a way that’s appropriate for
|
||||
its situation, or it could decide that an `Err` value in this case is
|
||||
unrecoverable, so it can call `panic!` and turn your recoverable error into an
|
||||
unrecoverable one. Therefore, returning `Result` is a good default choice when
|
||||
you’re defining a function that might fail.
|
||||
|
||||
In rare situations, it’s more appropriate to write code that panics instead of
|
||||
returning a `Result`. Let’s explore why it’s appropriate to panic in examples,
|
||||
prototype code, and tests. Then we’ll discuss situations in which the compiler
|
||||
can’t tell that failure is impossible, but you as a human can. The chapter will
|
||||
conclude with some general guidelines on how to decide whether to panic in
|
||||
library code.
|
||||
|
||||
### Examples, Prototype Code, and Tests
|
||||
|
||||
When you’re writing an example to illustrate some concept, having robust
|
||||
error-handling code in the example as well can make the example less clear. In
|
||||
examples, it’s understood that a call to a method like `unwrap` that could
|
||||
panic is meant as a placeholder for the way you’d want your application to
|
||||
handle errors, which can differ based on what the rest of your code is doing.
|
||||
|
||||
Similarly, the `unwrap` and `expect` methods are very handy when prototyping,
|
||||
before you’re ready to decide how to handle errors. They leave clear markers in
|
||||
your code for when you’re ready to make your program more robust.
|
||||
|
||||
If a method call fails in a test, you’d want the whole test to fail, even if
|
||||
that method isn’t the functionality under test. Because `panic!` is how a test
|
||||
is marked as a failure, calling `unwrap` or `expect` is exactly what should
|
||||
happen.
|
||||
|
||||
### Cases in Which You Have More Information Than the Compiler
|
||||
|
||||
It would also be appropriate to call `unwrap` when you have some other logic
|
||||
that ensures the `Result` will have an `Ok` value, but the logic isn’t
|
||||
something the compiler understands. You’ll still have a `Result` value that you
|
||||
need to handle: whatever operation you’re calling still has the possibility of
|
||||
failing in general, even though it’s logically impossible in your particular
|
||||
situation. If you can ensure by manually inspecting the code that you’ll never
|
||||
have an `Err` variant, it’s perfectly acceptable to call `unwrap`. Here’s an
|
||||
example:
|
||||
|
||||
```rust
|
||||
use std::net::IpAddr;
|
||||
|
||||
let home: IpAddr = "127.0.0.1".parse().unwrap();
|
||||
```
|
||||
|
||||
We’re creating an `IpAddr` instance by parsing a hardcoded string. We can see
|
||||
that `127.0.0.1` is a valid IP address, so it’s acceptable to use `unwrap`
|
||||
here. However, having a hardcoded, valid string doesn’t change the return type
|
||||
of the `parse` method: we still get a `Result` value, and the compiler will
|
||||
still make us handle the `Result` as if the `Err` variant is a possibility
|
||||
because the compiler isn’t smart enough to see that this string is always a
|
||||
valid IP address. If the IP address string came from a user rather than being
|
||||
hardcoded into the program and therefore *did* have a possibility of failure,
|
||||
we’d definitely want to handle the `Result` in a more robust way instead.
|
||||
|
||||
### Guidelines for Error Handling
|
||||
|
||||
It’s advisable to have your code panic when it’s possible that your code
|
||||
could end up in a bad state. In this context, a *bad state* is when some
|
||||
assumption, guarantee, contract, or invariant has been broken, such as when
|
||||
invalid values, contradictory values, or missing values are passed to your
|
||||
code—plus one or more of the following:
|
||||
|
||||
* The bad state is not something that’s *expected* to happen occasionally.
|
||||
* Your code after this point needs to rely on not being in this bad state.
|
||||
* There’s not a good way to encode this information in the types you use.
|
||||
|
||||
If someone calls your code and passes in values that don’t make sense, the best
|
||||
choice might be to call `panic!` and alert the person using your library to the
|
||||
bug in their code so they can fix it during development. Similarly, `panic!` is
|
||||
often appropriate if you’re calling external code that is out of your control
|
||||
and it returns an invalid state that you have no way of fixing.
|
||||
|
||||
When a bad state is reached, but it’s expected to happen no matter how well you
|
||||
write your code, it’s still more appropriate to return a `Result` rather than
|
||||
to make a `panic!` call. Examples include a parser being given malformed data
|
||||
or an HTTP request returning a status that indicates you have hit a rate limit.
|
||||
In these cases, you should indicate that failure is an expected possibility by
|
||||
returning a `Result` to propagate these bad states upward so the calling code
|
||||
can decide how to handle the problem. To call `panic!` wouldn’t be the best way
|
||||
to handle these cases.
|
||||
|
||||
When your code performs operations on values, your code should verify the
|
||||
values are valid first and panic if the values aren’t valid. This is mostly for
|
||||
safety reasons: attempting to operate on invalid data can expose your code to
|
||||
vulnerabilities. This is the main reason the standard library will call
|
||||
`panic!` if you attempt an out-of-bounds memory access: trying to access memory
|
||||
that doesn’t belong to the current data structure is a common security problem.
|
||||
Functions often have *contracts*: their behavior is only guaranteed if the
|
||||
inputs meet particular requirements. Panicking when the contract is violated
|
||||
makes sense because a contract violation always indicates a caller-side bug and
|
||||
it’s not a kind of error you want the calling code to have to explicitly
|
||||
handle. In fact, there’s no reasonable way for calling code to recover; the
|
||||
calling *programmers* need to fix the code. Contracts for a function,
|
||||
especially when a violation will cause a panic, should be explained in the API
|
||||
documentation for the function.
|
||||
|
||||
However, having lots of error checks in all of your functions would be verbose
|
||||
and annoying. Fortunately, you can use Rust’s type system (and thus the type
|
||||
checking the compiler does) to do many of the checks for you. If your function
|
||||
has a particular type as a parameter, you can proceed with your code’s logic
|
||||
knowing that the compiler has already ensured you have a valid value. For
|
||||
example, if you have a type rather than an `Option`, your program expects to
|
||||
have *something* rather than *nothing*. Your code then doesn’t have to handle
|
||||
two cases for the `Some` and `None` variants: it will only have one case for
|
||||
definitely having a value. Code trying to pass nothing to your function won’t
|
||||
even compile, so your function doesn’t have to check for that case at runtime.
|
||||
Another example is using an unsigned integer type such as `u32`, which ensures
|
||||
the parameter is never negative.
|
||||
|
||||
Let’s take the idea of using Rust’s type system to ensure we have a valid value
|
||||
one step further and look at creating a custom type for validation. Recall the
|
||||
guessing game in Chapter 2 in which our code asked the user to guess a number
|
||||
between 1 and 100. We never validated that the user’s guess was between those
|
||||
numbers before checking it against our secret number; we only validated that
|
||||
the guess was positive. In this case, the consequences were not very dire: our
|
||||
output of “Too high” or “Too low” would still be correct. But it would be a
|
||||
useful enhancement to guide the user toward valid guesses and have different
|
||||
behavior when a user guesses a number that’s out of range versus when a user
|
||||
types, for example, letters instead.
|
||||
|
||||
One way to do this would be to parse the guess as an `i32` instead of only a
|
||||
`u32` to allow potentially negative numbers, and then add a check for the
|
||||
number being in range, like so:
|
||||
|
||||
```rust,ignore
|
||||
loop {
|
||||
// --snip--
|
||||
|
||||
let guess: i32 = match guess.trim().parse() {
|
||||
Ok(num) => num,
|
||||
Err(_) => continue,
|
||||
};
|
||||
|
||||
if guess < 1 || guess > 100 {
|
||||
println!("The secret number will be between 1 and 100.");
|
||||
continue;
|
||||
}
|
||||
|
||||
match guess.cmp(&secret_number) {
|
||||
// --snip--
|
||||
}
|
||||
```
|
||||
|
||||
The `if` expression checks whether our value is out of range, tells the user
|
||||
about the problem, and calls `continue` to start the next iteration of the loop
|
||||
and ask for another guess. After the `if` expression, we can proceed with the
|
||||
comparisons between `guess` and the secret number knowing that `guess` is
|
||||
between 1 and 100.
|
||||
|
||||
However, this is not an ideal solution: if it was absolutely critical that the
|
||||
program only operated on values between 1 and 100, and it had many functions
|
||||
with this requirement, having a check like this in every function would be
|
||||
tedious (and might impact performance).
|
||||
|
||||
Instead, we can make a new type and put the validations in a function to create
|
||||
an instance of the type rather than repeating the validations everywhere. That
|
||||
way, it’s safe for functions to use the new type in their signatures and
|
||||
confidently use the values they receive. Listing 9-9 shows one way to define a
|
||||
`Guess` type that will only create an instance of `Guess` if the `new` function
|
||||
receives a value between 1 and 100:
|
||||
|
||||
```rust
|
||||
pub struct Guess {
|
||||
value: u32,
|
||||
}
|
||||
|
||||
impl Guess {
|
||||
pub fn new(value: u32) -> Guess {
|
||||
if value < 1 || value > 100 {
|
||||
panic!("Guess value must be between 1 and 100, got {}.", value);
|
||||
}
|
||||
|
||||
Guess {
|
||||
value
|
||||
}
|
||||
}
|
||||
|
||||
pub fn value(&self) -> u32 {
|
||||
self.value
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 9-9: A `Guess` type that will only continue with
|
||||
values between 1 and 100</span>
|
||||
|
||||
First, we define a struct named `Guess` that has a field named `value` that
|
||||
holds a `u32`. This is where the number will be stored.
|
||||
|
||||
Then we implement an associated function named `new` on `Guess` that creates
|
||||
instances of `Guess` values. The `new` function is defined to have one
|
||||
parameter named `value` of type `u32` and to return a `Guess`. The code in the
|
||||
body of the `new` function tests `value` to make sure it’s between 1 and 100.
|
||||
If `value` doesn’t pass this test, we make a `panic!` call, which will alert
|
||||
the programmer who is writing the calling code that they have a bug they need
|
||||
to fix, because creating a `Guess` with a `value` outside this range would
|
||||
violate the contract that `Guess::new` is relying on. The conditions in which
|
||||
`Guess::new` might panic should be discussed in its public-facing API
|
||||
documentation; we’ll cover documentation conventions indicating the possibility
|
||||
of a `panic!` in the API documentation that you create in Chapter 14. If
|
||||
`value` does pass the test, we create a new `Guess` with its `value` field set
|
||||
to the `value` parameter and return the `Guess`.
|
||||
|
||||
Next, we implement a method named `value` that borrows `self`, doesn’t have any
|
||||
other parameters, and returns a `u32`. This kind of method is sometimes called
|
||||
a *getter*, because its purpose is to get some data from its fields and return
|
||||
it. This public method is necessary because the `value` field of the `Guess`
|
||||
struct is private. It’s important that the `value` field be private so code
|
||||
using the `Guess` struct is not allowed to set `value` directly: code outside
|
||||
the module *must* use the `Guess::new` function to create an instance of
|
||||
`Guess`, thereby ensuring there’s no way for a `Guess` to have a `value` that
|
||||
hasn’t been checked by the conditions in the `Guess::new` function.
|
||||
|
||||
A function that has a parameter or returns only numbers between 1 and 100 could
|
||||
then declare in its signature that it takes or returns a `Guess` rather than a
|
||||
`u32` and wouldn’t need to do any additional checks in its body.
|
||||
|
||||
## Summary
|
||||
|
||||
Rust’s error handling features are designed to help you write more robust code.
|
||||
The `panic!` macro signals that your program is in a state it can’t handle and
|
||||
lets you tell the process to stop instead of trying to proceed with invalid or
|
||||
incorrect values. The `Result` enum uses Rust’s type system to indicate that
|
||||
operations might fail in a way that your code could recover from. You can use
|
||||
`Result` to tell code that calls your code that it needs to handle potential
|
||||
success or failure as well. Using `panic!` and `Result` in the appropriate
|
||||
situations will make your code more reliable in the face of inevitable problems.
|
||||
|
||||
Now that you’ve seen useful ways that the standard library uses generics with
|
||||
the `Option` and `Result` enums, we’ll talk about how generics work and how you
|
||||
can use them in your code.
|
||||
|
||||
175
2018-edition/src/ch10-00-generics.md
Normal file
175
2018-edition/src/ch10-00-generics.md
Normal file
@@ -0,0 +1,175 @@
|
||||
# Generic Types, Traits, and Lifetimes
|
||||
|
||||
Every programming language has tools for effectively handling the duplication
|
||||
of concepts. In Rust, one such tool is *generics*. Generics are abstract
|
||||
stand-ins for concrete types or other properties. When we’re writing code, we
|
||||
can express the behavior of generics or how they relate to other generics
|
||||
without knowing what will be in their place when compiling and running the code.
|
||||
|
||||
Similar to the way a function takes parameters with unknown values to run the
|
||||
same code on multiple concrete values, functions can take parameters of some
|
||||
generic type instead of a concrete type, like `i32` or `String`. In fact, we’ve
|
||||
already used generics in Chapter 6 with `Option<T>`, Chapter 8 with `Vec<T>`
|
||||
and `HashMap<K, V>`, and Chapter 9 with `Result<T, E>`. In this chapter, you’ll
|
||||
explore how to define your own types, functions, and methods with generics!
|
||||
|
||||
First, we’ll review how to extract a function to reduce code duplication. Next,
|
||||
we’ll use the same technique to make a generic function from two functions that
|
||||
only differ in the types of their parameters. We’ll also explain how to use
|
||||
generic types in struct and enum definitions.
|
||||
|
||||
Then you’ll learn how to use *traits* to define behavior in a generic way. You
|
||||
can then combine traits with generic types to constrain a generic type to only
|
||||
those types that have a particular behavior, as opposed to just any type.
|
||||
|
||||
Finally, we’ll discuss *lifetimes*, a variety of generics that give the
|
||||
compiler information about how references relate to each other. Lifetimes allow
|
||||
us to borrow values in many situations while still enabling the compiler to
|
||||
check that the references are valid.
|
||||
|
||||
## Removing Duplication by Extracting a Function
|
||||
|
||||
Before diving into generics syntax, let’s first look at how to remove
|
||||
duplication that doesn’t involve generic types by extracting a function. Then
|
||||
we’ll apply this technique to extract a generic function! In the same way that
|
||||
you recognize duplicated code to extract into a function, you’ll start to
|
||||
recognize duplicated code that can use generics.
|
||||
|
||||
Consider a short program that finds the largest number in a list, as shown in
|
||||
Listing 10-1:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let number_list = vec![34, 50, 25, 100, 65];
|
||||
|
||||
let mut largest = number_list[0];
|
||||
|
||||
for number in number_list {
|
||||
if number > largest {
|
||||
largest = number;
|
||||
}
|
||||
}
|
||||
|
||||
println!("The largest number is {}", largest);
|
||||
# assert_eq!(largest, 100);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-1: Code to find the largest number in a list
|
||||
of numbers</span>
|
||||
|
||||
This code stores a list of integers in the variable `number_list` and places
|
||||
the first number in the list in a variable named `largest`. Then it iterates
|
||||
through all the numbers in the list, and if the current number is greater than
|
||||
the number stored in `largest`, it replaces the number in that variable.
|
||||
However, if the current number is less than the largest number seen so far, the
|
||||
variable doesn’t change and the code moves on to the next number in the list.
|
||||
After considering all the numbers in the list, `largest` should hold the
|
||||
largest number, which in this case is 100.
|
||||
|
||||
To find the largest number in two different lists of numbers, we can duplicate
|
||||
the code in Listing 10-1 and use the same logic at two different places in the
|
||||
program, as shown in Listing 10-2:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let number_list = vec![34, 50, 25, 100, 65];
|
||||
|
||||
let mut largest = number_list[0];
|
||||
|
||||
for number in number_list {
|
||||
if number > largest {
|
||||
largest = number;
|
||||
}
|
||||
}
|
||||
|
||||
println!("The largest number is {}", largest);
|
||||
|
||||
let number_list = vec![102, 34, 6000, 89, 54, 2, 43, 8];
|
||||
|
||||
let mut largest = number_list[0];
|
||||
|
||||
for number in number_list {
|
||||
if number > largest {
|
||||
largest = number;
|
||||
}
|
||||
}
|
||||
|
||||
println!("The largest number is {}", largest);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-2: Code to find the largest number in *two*
|
||||
lists of numbers</span>
|
||||
|
||||
Although this code works, duplicating code is tedious and error prone. We also
|
||||
have to update the code in multiple places to change it.
|
||||
|
||||
To eliminate this duplication, we can create an abstraction by defining a
|
||||
function that operates on any list of integers given to it in a parameter. This
|
||||
solution makes our code clearer and lets us express the concept of finding the
|
||||
largest number in a list abstractly.
|
||||
|
||||
In Listing 10-3, we extracted the code that finds the largest number into a
|
||||
function named `largest`. Unlike the code in Listing 10-1, which can find the
|
||||
largest number in only one particular list, this program can find the largest
|
||||
number in two different lists:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn largest(list: &[i32]) -> i32 {
|
||||
let mut largest = list[0];
|
||||
|
||||
for &item in list.iter() {
|
||||
if item > largest {
|
||||
largest = item;
|
||||
}
|
||||
}
|
||||
|
||||
largest
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let number_list = vec![34, 50, 25, 100, 65];
|
||||
|
||||
let result = largest(&number_list);
|
||||
println!("The largest number is {}", result);
|
||||
# assert_eq!(result, 100);
|
||||
|
||||
let number_list = vec![102, 34, 6000, 89, 54, 2, 43, 8];
|
||||
|
||||
let result = largest(&number_list);
|
||||
println!("The largest number is {}", result);
|
||||
# assert_eq!(result, 6000);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-3: Abstracted code to find the largest number
|
||||
in two lists</span>
|
||||
|
||||
The `largest` function has a parameter called `list`, which represents any
|
||||
concrete slice of `i32` values that we might pass into the function. As a
|
||||
result, when we call the function, the code runs on the specific values that we
|
||||
pass in.
|
||||
|
||||
In sum, here are the steps we took to change the code from Listing 10-2 to
|
||||
Listing 10-3:
|
||||
|
||||
1. Identify duplicate code.
|
||||
2. Extract the duplicate code into the body of the function, and specify the
|
||||
inputs and return values of that code in the function signature.
|
||||
3. Update the two instances of duplicated code to call the function instead.
|
||||
|
||||
Next, we’ll use these same steps with generics to reduce code duplication in
|
||||
different ways. In the same way that the function body can operate on an
|
||||
abstract `list` instead of specific values, generics allow code to operate on
|
||||
abstract types.
|
||||
|
||||
For example, say we had two functions: one that finds the largest item in a
|
||||
slice of `i32` values and one that finds the largest item in a slice of `char`
|
||||
values. How would we eliminate that duplication? Let’s find out!
|
||||
462
2018-edition/src/ch10-01-syntax.md
Normal file
462
2018-edition/src/ch10-01-syntax.md
Normal file
@@ -0,0 +1,462 @@
|
||||
## Generic Data Types
|
||||
|
||||
We can use generics to create definitions for items like function signatures or
|
||||
structs, which we can then use with many different concrete data types. Let’s
|
||||
first look at how to define functions, structs, enums, and methods using
|
||||
generics. Then we’ll discuss how generics affect code performance.
|
||||
|
||||
### In Function Definitions
|
||||
|
||||
When defining a function that uses generics, we place the generics in the
|
||||
signature of the function where we would usually specify the data types of the
|
||||
parameters and return value. Doing so makes our code more flexible and provides
|
||||
more functionality to callers of our function while preventing code duplication.
|
||||
|
||||
Continuing with our `largest` function, Listing 10-4 shows two functions that
|
||||
both find the largest value in a slice:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn largest_i32(list: &[i32]) -> i32 {
|
||||
let mut largest = list[0];
|
||||
|
||||
for &item in list.iter() {
|
||||
if item > largest {
|
||||
largest = item;
|
||||
}
|
||||
}
|
||||
|
||||
largest
|
||||
}
|
||||
|
||||
fn largest_char(list: &[char]) -> char {
|
||||
let mut largest = list[0];
|
||||
|
||||
for &item in list.iter() {
|
||||
if item > largest {
|
||||
largest = item;
|
||||
}
|
||||
}
|
||||
|
||||
largest
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let number_list = vec![34, 50, 25, 100, 65];
|
||||
|
||||
let result = largest_i32(&number_list);
|
||||
println!("The largest number is {}", result);
|
||||
# assert_eq!(result, 100);
|
||||
|
||||
let char_list = vec!['y', 'm', 'a', 'q'];
|
||||
|
||||
let result = largest_char(&char_list);
|
||||
println!("The largest char is {}", result);
|
||||
# assert_eq!(result, 'y');
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-4: Two functions that differ only in their
|
||||
names and the types in their signatures</span>
|
||||
|
||||
The `largest_i32` function is the one we extracted in Listing 10-3 that finds
|
||||
the largest `i32` in a slice. The `largest_char` function finds the largest
|
||||
`char` in a slice. The function bodies have the same code, so let’s eliminate
|
||||
the duplication by introducing a generic type parameter in a single function.
|
||||
|
||||
To parameterize the types in the new function we’ll define, we need to name the
|
||||
type parameter, just like we do for the value parameters to a function. You can
|
||||
use any identifier as a type parameter name. But we’ll use `T` because, by
|
||||
convention, parameter names in Rust are short, often just a letter, and Rust’s
|
||||
type naming convention is CamelCase. Short for “type,” `T` is the default
|
||||
choice of most Rust programmers.
|
||||
|
||||
When we use a parameter in the body of the function, we have to declare the
|
||||
parameter name in the signature so that the compiler knows what that name
|
||||
means. Similarly, when we use a type parameter name in a function signature, we
|
||||
have to declare the type parameter name before we use it. To define the generic
|
||||
`largest` function, place type name declarations inside angle brackets (`<>`)
|
||||
between the name of the function and the parameter list, like this:
|
||||
|
||||
```rust,ignore
|
||||
fn largest<T>(list: &[T]) -> T {
|
||||
```
|
||||
|
||||
We read this definition as: the function `largest` is generic over some type
|
||||
`T`. This function has one parameter named `list`, which is a slice of values
|
||||
of type `T`. The `largest` function will return a value of the same type `T`.
|
||||
|
||||
Listing 10-5 shows the combined `largest` function definition using the generic
|
||||
data type in its signature. The listing also shows how we can call the function
|
||||
with either a slice of `i32` values or `char` values. Note that this code won’t
|
||||
compile yet, but we’ll fix it later in this chapter.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn largest<T>(list: &[T]) -> T {
|
||||
let mut largest = list[0];
|
||||
|
||||
for &item in list.iter() {
|
||||
if item > largest {
|
||||
largest = item;
|
||||
}
|
||||
}
|
||||
|
||||
largest
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let number_list = vec![34, 50, 25, 100, 65];
|
||||
|
||||
let result = largest(&number_list);
|
||||
println!("The largest number is {}", result);
|
||||
|
||||
let char_list = vec!['y', 'm', 'a', 'q'];
|
||||
|
||||
let result = largest(&char_list);
|
||||
println!("The largest char is {}", result);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-5: A definition of the `largest` function that
|
||||
uses generic type parameters but doesn’t compile yet</span>
|
||||
|
||||
If we compile this code right now, we’ll get this error:
|
||||
|
||||
```text
|
||||
error[E0369]: binary operation `>` cannot be applied to type `T`
|
||||
--> src/main.rs:5:12
|
||||
|
|
||||
5 | if item > largest {
|
||||
| ^^^^^^^^^^^^^^
|
||||
|
|
||||
= note: an implementation of `std::cmp::PartialOrd` might be missing for `T`
|
||||
```
|
||||
|
||||
The note mentions `std::cmp::PartialOrd`, which is a *trait*. We’ll talk about
|
||||
traits in the next section. For now, this error states that the body of
|
||||
`largest` won’t work for all possible types that `T` could be. Because we want
|
||||
to compare values of type `T` in the body, we can only use types whose values
|
||||
can be ordered. To enable comparisons, the standard library has the
|
||||
`std::cmp::PartialOrd` trait that you can implement on types (see Appendix C,
|
||||
“Derivable Traits,” for more on this trait). You’ll learn how to specify that a
|
||||
generic type has a particular trait in the “Trait Bounds” section, but let’s
|
||||
first explore other ways of using generic type parameters.
|
||||
|
||||
### In Struct Definitions
|
||||
|
||||
We can also define structs to use a generic type parameter in one or more
|
||||
fields using the `<>` syntax. Listing 10-6 shows how to define a `Point<T>`
|
||||
struct to hold `x` and `y` coordinate values of any type:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct Point<T> {
|
||||
x: T,
|
||||
y: T,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let integer = Point { x: 5, y: 10 };
|
||||
let float = Point { x: 1.0, y: 4.0 };
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-6: A `Point<T>` struct that holds `x` and `y`
|
||||
values of type `T`</span>
|
||||
|
||||
The syntax for using generics in struct definitions is similar to that used in
|
||||
function definitions. First, we declare the name of the type parameter inside
|
||||
angle brackets just after the name of the struct. Then we can use the generic
|
||||
type in the struct definition where we would otherwise specify concrete data
|
||||
types.
|
||||
|
||||
Note that because we’ve only used one generic type to define `Point<T>`, this
|
||||
definition says that the `Point<T>` struct is generic over some type `T`, and
|
||||
the fields `x` and `y` are *both* that same type, whatever that type may be. If
|
||||
we create an instance of a `Point<T>` that has values of different types, as in
|
||||
Listing 10-7, our code won’t compile:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
struct Point<T> {
|
||||
x: T,
|
||||
y: T,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let wont_work = Point { x: 5, y: 4.0 };
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-7: The fields `x` and `y` must be the same
|
||||
type because both have the same generic data type `T`</span>
|
||||
|
||||
In this example, when we assign the integer value `5` to `x`, we let the
|
||||
compiler know that the generic type `T` will be an integer for this instance of
|
||||
`Point<T>`. Then when we specify `4.0` for `y`, which we’ve defined to have the
|
||||
same type as `x`, we’ll get a type mismatch error like this:
|
||||
|
||||
```text
|
||||
error[E0308]: mismatched types
|
||||
--> src/main.rs:7:38
|
||||
|
|
||||
7 | let wont_work = Point { x: 5, y: 4.0 };
|
||||
| ^^^ expected integral variable, found
|
||||
floating-point variable
|
||||
|
|
||||
= note: expected type `{integer}`
|
||||
found type `{float}`
|
||||
```
|
||||
|
||||
To define a `Point` struct where `x` and `y` are both generics but could have
|
||||
different types, we can use multiple generic type parameters. For example, in
|
||||
Listing 10-8, we can change the definition of `Point` to be generic over types
|
||||
`T` and `U` where `x` is of type `T` and `y` is of type `U`:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct Point<T, U> {
|
||||
x: T,
|
||||
y: U,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let both_integer = Point { x: 5, y: 10 };
|
||||
let both_float = Point { x: 1.0, y: 4.0 };
|
||||
let integer_and_float = Point { x: 5, y: 4.0 };
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-8: A `Point<T, U>` generic over two types so
|
||||
that `x` and `y` can be values of different types</span>
|
||||
|
||||
Now all the instances of `Point` shown are allowed! You can use as many generic
|
||||
type parameters in a definition as you want, but using more than a few makes
|
||||
your code hard to read. When you need lots of generic types in your code, it
|
||||
could indicate that your code needs restructuring into smaller pieces.
|
||||
|
||||
### In Enum Definitions
|
||||
|
||||
As we did with structs, we can define enums to hold generic data types in their
|
||||
variants. Let’s take another look at the `Option<T>` enum that the standard
|
||||
library provides that we used in Chapter 6:
|
||||
|
||||
```rust
|
||||
enum Option<T> {
|
||||
Some(T),
|
||||
None,
|
||||
}
|
||||
```
|
||||
|
||||
This definition should now make more sense to you. As you can see, `Option<T>`
|
||||
is an enum that is generic over type `T` and has two variants: `Some`, which
|
||||
holds one value of type `T`, and a `None` variant that doesn’t hold any value.
|
||||
By using the `Option<T>` enum, we can express the abstract concept of having an
|
||||
optional value, and because `Option<T>` is generic, we can use this abstraction
|
||||
no matter what the type of the optional value is.
|
||||
|
||||
Enums can use multiple generic types as well. The definition of the `Result`
|
||||
enum that we used in Chapter 9 is one example:
|
||||
|
||||
```rust
|
||||
enum Result<T, E> {
|
||||
Ok(T),
|
||||
Err(E),
|
||||
}
|
||||
```
|
||||
|
||||
The `Result` enum is generic over two types, `T` and `E`, and has two variants:
|
||||
`Ok`, which holds a value of type `T`, and `Err`, which holds a value of type
|
||||
`E`. This definition makes it convenient to use the `Result` enum anywhere we
|
||||
have an operation that might succeed (return a value of some type `T`) or fail
|
||||
(return an error of some type `E`). In fact, this is what we used to open a
|
||||
file in Listing 9-3 where `T` was filled in with the type `std::fs::File` when
|
||||
the file was opened successfully and `E` was filled in with the type
|
||||
`std::io::Error` when there were problems opening the file.
|
||||
|
||||
When you recognize situations in your code with multiple struct or enum
|
||||
definitions that differ only in the types of the values they hold, you can
|
||||
avoid duplication by using generic types instead.
|
||||
|
||||
### In Method Definitions
|
||||
|
||||
As we did in Chapter 5, we can implement methods on structs and enums that have
|
||||
generic types in their definitions. Listing 10-9 shows the `Point<T>` struct we
|
||||
defined in Listing 10-6 with a method named `x` implemented on it:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct Point<T> {
|
||||
x: T,
|
||||
y: T,
|
||||
}
|
||||
|
||||
impl<T> Point<T> {
|
||||
fn x(&self) -> &T {
|
||||
&self.x
|
||||
}
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let p = Point { x: 5, y: 10 };
|
||||
|
||||
println!("p.x = {}", p.x());
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-9: Implementing a method named `x` on the
|
||||
`Point<T>` struct that will return a reference to the `x` field of type
|
||||
`T`</span>
|
||||
|
||||
Here, we’ve defined a method named `x` on `Point<T>` that returns a reference
|
||||
to the data in the field `x`.
|
||||
|
||||
Note that we have to declare `T` just after `impl` so we can use it to specify
|
||||
that we’re implementing methods on the type `Point<T>`. By declaring `T` as a
|
||||
generic type after `impl`, Rust can identify that the type in the angle
|
||||
brackets in `Point` is a generic type rather than a concrete type.
|
||||
|
||||
We could, for example, implement methods only on `Point<f32>` instances rather
|
||||
than on `Point<T>` instances with any generic type. In Listing 10-10 we use the
|
||||
concrete type `f32`, meaning we don’t declare any types after `impl`:
|
||||
|
||||
```rust
|
||||
# struct Point<T> {
|
||||
# x: T,
|
||||
# y: T,
|
||||
# }
|
||||
#
|
||||
impl Point<f32> {
|
||||
fn distance_from_origin(&self) -> f32 {
|
||||
(self.x.powi(2) + self.y.powi(2)).sqrt()
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-10: An `impl` block that only applies to a
|
||||
struct with a particular concrete type for the generic type parameter `T`</span>
|
||||
|
||||
This code means the type `Point<f32>` will have a method named
|
||||
`distance_from_origin`, and other instances of `Point<T>` where `T` is not of
|
||||
type `f32` will not have this method defined. The method measures how far our
|
||||
point is from the point at coordinates (0.0, 0.0) and uses mathematical
|
||||
operations that are only available for floating point types.
|
||||
|
||||
Generic type parameters in a struct definition aren’t always the same as those
|
||||
you use in that struct’s method signatures. For example, Listing 10-11 defines
|
||||
the method `mixup` on the `Point<T, U>` struct from Listing 10-8. The method
|
||||
takes another `Point` as a parameter, which might have different types than the
|
||||
`self` `Point` we’re calling `mixup` on. The method creates a new `Point`
|
||||
instance with the `x` value from the `self` `Point` (of type `T`) and the `y`
|
||||
value from the passed-in `Point` (of type `W`):
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct Point<T, U> {
|
||||
x: T,
|
||||
y: U,
|
||||
}
|
||||
|
||||
impl<T, U> Point<T, U> {
|
||||
fn mixup<V, W>(self, other: Point<V, W>) -> Point<T, W> {
|
||||
Point {
|
||||
x: self.x,
|
||||
y: other.y,
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let p1 = Point { x: 5, y: 10.4 };
|
||||
let p2 = Point { x: "Hello", y: 'c'};
|
||||
|
||||
let p3 = p1.mixup(p2);
|
||||
|
||||
println!("p3.x = {}, p3.y = {}", p3.x, p3.y);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-11: A method that uses different generic types
|
||||
than its struct’s definition</span>
|
||||
|
||||
In `main`, we’ve defined a `Point` that has an `i32` for `x` (with value `5`)
|
||||
and an `f64` for `y` (with value `10.4`). The `p2` variable is a `Point` struct
|
||||
that has a string slice for `x` (with value `"Hello"`) and a `char` for `y`
|
||||
(with value `c`). Calling `mixup` on `p1` with the argument `p2` gives us `p3`,
|
||||
which will have an `i32` for `x`, because `x` came from `p1`. The `p3` variable
|
||||
will have a `char` for `y`, because `y` came from `p2`. The `println!` macro
|
||||
call will print `p3.x = 5, p3.y = c`.
|
||||
|
||||
The purpose of this example is to demonstrate a situation in which some generic
|
||||
parameters are declared with `impl` and some are declared with the method
|
||||
definition. Here, the generic parameters `T` and `U` are declared after `impl`,
|
||||
because they go with the struct definition. The generic parameters `V` and `W`
|
||||
are declared after `fn mixup`, because they’re only relevant to the method.
|
||||
|
||||
### Performance of Code Using Generics
|
||||
|
||||
You might be wondering whether there is a runtime cost when you’re using
|
||||
generic type parameters. The good news is that Rust implements generics in such
|
||||
a way that your code doesn’t run any slower using generic types than it would
|
||||
with concrete types.
|
||||
|
||||
Rust accomplishes this by performing monomorphization of the code that is using
|
||||
generics at compile time. *Monomorphization* is the process of turning generic
|
||||
code into specific code by filling in the concrete types that are used when
|
||||
compiled.
|
||||
|
||||
In this process, the compiler does the opposite of the steps we used to create
|
||||
the generic function in Listing 10-5: the compiler looks at all the places
|
||||
where generic code is called and generates code for the concrete types the
|
||||
generic code is called with.
|
||||
|
||||
Let’s look at how this works with an example that uses the standard library’s
|
||||
`Option<T>` enum:
|
||||
|
||||
```rust
|
||||
let integer = Some(5);
|
||||
let float = Some(5.0);
|
||||
```
|
||||
|
||||
When Rust compiles this code, it performs monomorphization. During that
|
||||
process, the compiler reads the values that have been used in the instances of
|
||||
`Option<T>` and identifies two kinds of `Option<T>`: one is `i32` and the other
|
||||
is `f64`. As such, it expands the generic definition of `Option<T>` into
|
||||
`Option_i32` and `Option_f64`, thereby replacing the generic definition with
|
||||
the specific ones.
|
||||
|
||||
The monomorphized version of the code looks like the following. The generic
|
||||
`Option<T>` is replaced with the specific definitions created by the compiler:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
enum Option_i32 {
|
||||
Some(i32),
|
||||
None,
|
||||
}
|
||||
|
||||
enum Option_f64 {
|
||||
Some(f64),
|
||||
None,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let integer = Option_i32::Some(5);
|
||||
let float = Option_f64::Some(5.0);
|
||||
}
|
||||
```
|
||||
|
||||
Because Rust compiles generic code into code that specifies the type in each
|
||||
instance, we pay no runtime cost for using generics. When the code runs, it
|
||||
performs just like it would if we had duplicated each definition by hand. The
|
||||
process of monomorphization makes Rust’s generics extremely efficient at
|
||||
runtime.
|
||||
510
2018-edition/src/ch10-02-traits.md
Normal file
510
2018-edition/src/ch10-02-traits.md
Normal file
@@ -0,0 +1,510 @@
|
||||
## Traits: Defining Shared Behavior
|
||||
|
||||
A *trait* tells the Rust compiler about functionality a particular type has and
|
||||
can share with other types. We can use traits to define shared behavior in an
|
||||
abstract way. We can use trait bounds to specify that a generic can be any type
|
||||
that has certain behavior.
|
||||
|
||||
> Note: Traits are similar to a feature often called *interfaces* in other
|
||||
> languages, although with some differences.
|
||||
|
||||
### Defining a Trait
|
||||
|
||||
A type’s behavior consists of the methods we can call on that type. Different
|
||||
types share the same behavior if we can call the same methods on all of those
|
||||
types. Trait definitions are a way to group method signatures together to
|
||||
define a set of behaviors necessary to accomplish some purpose.
|
||||
|
||||
For example, let’s say we have multiple structs that hold various kinds and
|
||||
amounts of text: a `NewsArticle` struct that holds a news story filed in a
|
||||
particular location and a `Tweet` that can have at most 280 characters along
|
||||
with metadata that indicates whether it was a new tweet, a retweet, or a reply
|
||||
to another tweet.
|
||||
|
||||
We want to make a media aggregator library that can display summaries of data
|
||||
that might be stored in a `NewsArticle` or `Tweet` instance. To do this, we
|
||||
need a summary from each type, and we need to request that summary by calling a
|
||||
`summarize` method on an instance. Listing 10-12 shows the definition of a
|
||||
`Summary` trait that expresses this behavior:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub trait Summary {
|
||||
fn summarize(&self) -> String;
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-12: A `Summary` trait that consists of the
|
||||
behavior provided by a `summarize` method</span>
|
||||
|
||||
Here, we declare a trait using the `trait` keyword and then the trait’s name,
|
||||
which is `Summary` in this case. Inside the curly brackets we declare the
|
||||
method signatures that describe the behaviors of the types that implement this
|
||||
trait, which in this case is `fn summarize(&self) -> String`.
|
||||
|
||||
After the method signature, instead of providing an implementation within curly
|
||||
brackets, we use a semicolon. Each type implementing this trait must provide
|
||||
its own custom behavior for the body of the method. The compiler will enforce
|
||||
that any type that has the `Summary` trait will have the method `summarize`
|
||||
defined with this signature exactly.
|
||||
|
||||
A trait can have multiple methods in its body: the method signatures are listed
|
||||
one per line and each line ends in a semicolon.
|
||||
|
||||
### Implementing a Trait on a Type
|
||||
|
||||
Now that we’ve defined the desired behavior using the `Summary` trait, we can
|
||||
implement it on the types in our media aggregator. Listing 10-13 shows an
|
||||
implementation of the `Summary` trait on the `NewsArticle` struct that uses the
|
||||
headline, the author, and the location to create the return value of
|
||||
`summarize`. For the `Tweet` struct, we define `summarize` as the username
|
||||
followed by the entire text of the tweet, assuming that tweet content is
|
||||
already limited to 280 characters.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# pub trait Summary {
|
||||
# fn summarize(&self) -> String;
|
||||
# }
|
||||
#
|
||||
pub struct NewsArticle {
|
||||
pub headline: String,
|
||||
pub location: String,
|
||||
pub author: String,
|
||||
pub content: String,
|
||||
}
|
||||
|
||||
impl Summary for NewsArticle {
|
||||
fn summarize(&self) -> String {
|
||||
format!("{}, by {} ({})", self.headline, self.author, self.location)
|
||||
}
|
||||
}
|
||||
|
||||
pub struct Tweet {
|
||||
pub username: String,
|
||||
pub content: String,
|
||||
pub reply: bool,
|
||||
pub retweet: bool,
|
||||
}
|
||||
|
||||
impl Summary for Tweet {
|
||||
fn summarize(&self) -> String {
|
||||
format!("{}: {}", self.username, self.content)
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-13: Implementing the `Summary` trait on the
|
||||
`NewsArticle` and `Tweet` types</span>
|
||||
|
||||
Implementing a trait on a type is similar to implementing regular methods. The
|
||||
difference is that after `impl`, we put the trait name that we want to
|
||||
implement, then use the `for` keyword, and then specify the name of the type we
|
||||
want to implement the trait for. Within the `impl` block, we put the method
|
||||
signatures that the trait definition has defined. Instead of adding a semicolon
|
||||
after each signature, we use curly brackets and fill in the method body with
|
||||
the specific behavior that we want the methods of the trait to have for the
|
||||
particular type.
|
||||
|
||||
After implementing the trait, we can call the methods on instances of
|
||||
`NewsArticle` and `Tweet` in the same way we call regular methods, like this:
|
||||
|
||||
```rust,ignore
|
||||
let tweet = Tweet {
|
||||
username: String::from("horse_ebooks"),
|
||||
content: String::from("of course, as you probably already know, people"),
|
||||
reply: false,
|
||||
retweet: false,
|
||||
};
|
||||
|
||||
println!("1 new tweet: {}", tweet.summarize());
|
||||
```
|
||||
|
||||
This code prints `1 new tweet: horse_ebooks: of course, as you probably already
|
||||
know, people`.
|
||||
|
||||
Note that because we defined the `Summary` trait and the `NewsArticle` and
|
||||
`Tweet` types in the same *lib.rs* in Listing 10-13, they’re all in the same
|
||||
scope. Let’s say this *lib.rs* is for a crate we’ve called `aggregator`, and
|
||||
someone else wants to use our crate’s functionality to implement the `Summary`
|
||||
trait on a struct defined within their library’s scope. They would need to
|
||||
import the trait into their scope first. They would do so by specifying `use
|
||||
aggregator::Summary;`, which then enables them to implement `Summary` for their
|
||||
type. The `Summary` trait would also need to be a public trait for another
|
||||
crate to implement it, which it is because we put the `pub` keyword before
|
||||
`trait` in Listing 10-12.
|
||||
|
||||
One restriction to note with trait implementations is that we can implement a
|
||||
trait on a type only if either the trait or the type is local to our crate.
|
||||
For example, we can implement standard library traits like `Display` on a
|
||||
custom type like `Tweet` as part of our `aggregator` crate functionality,
|
||||
because the type `Tweet` is local to our `aggregator` crate. We can also
|
||||
implement `Summary` on `Vec<T>` in our `aggregator` crate, because the
|
||||
trait `Summary` is local to our `aggregator` crate.
|
||||
|
||||
But we can’t implement external traits on external types. For example, we can’t
|
||||
implement the `Display` trait on `Vec<T>` within our `aggregator` crate,
|
||||
because `Display` and `Vec<T>` are defined in the standard library and aren’t
|
||||
local to our `aggregator` crate. This restriction is part of a property of
|
||||
programs called *coherence*, and more specifically the *orphan rule*, so named
|
||||
because the parent type is not present. This rule ensures that other people’s
|
||||
code can’t break your code and vice versa. Without the rule, two crates could
|
||||
implement the same trait for the same type, and Rust wouldn’t know which
|
||||
implementation to use.
|
||||
|
||||
### Default Implementations
|
||||
|
||||
Sometimes it’s useful to have default behavior for some or all of the methods
|
||||
in a trait instead of requiring implementations for all methods on every type.
|
||||
Then, as we implement the trait on a particular type, we can keep or override
|
||||
each method’s default behavior.
|
||||
|
||||
Listing 10-14 shows how to specify a default string for the `summarize` method
|
||||
of the `Summary` trait instead of only defining the method signature, like we
|
||||
did in Listing 10-12:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub trait Summary {
|
||||
fn summarize(&self) -> String {
|
||||
String::from("(Read more...)")
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-14: Definition of a `Summary` trait with a
|
||||
default implementation of the `summarize` method</span>
|
||||
|
||||
To use a default implementation to summarize instances of `NewsArticle` instead
|
||||
of defining a custom implementation, we specify an empty `impl` block with
|
||||
`impl Summary for NewsArticle {}`.
|
||||
|
||||
Even though we’re no longer defining the `summarize` method on `NewsArticle`
|
||||
directly, we’ve provided a default implementation and specified that
|
||||
`NewsArticle` implements the `Summary` trait. As a result, we can still call
|
||||
the `summarize` method on an instance of `NewsArticle`, like this:
|
||||
|
||||
```rust,ignore
|
||||
let article = NewsArticle {
|
||||
headline: String::from("Penguins win the Stanley Cup Championship!"),
|
||||
location: String::from("Pittsburgh, PA, USA"),
|
||||
author: String::from("Iceburgh"),
|
||||
content: String::from("The Pittsburgh Penguins once again are the best
|
||||
hockey team in the NHL."),
|
||||
};
|
||||
|
||||
println!("New article available! {}", article.summarize());
|
||||
```
|
||||
|
||||
This code prints `New article available! (Read more...)`.
|
||||
|
||||
Creating a default implementation for `summarize` doesn’t require us to change
|
||||
anything about the implementation of `Summary` on `Tweet` in Listing 10-13. The
|
||||
reason is that the syntax for overriding a default implementation is the same
|
||||
as the syntax for implementing a trait method that doesn’t have a default
|
||||
implementation.
|
||||
|
||||
Default implementations can call other methods in the same trait, even if those
|
||||
other methods don’t have a default implementation. In this way, a trait can
|
||||
provide a lot of useful functionality and only require implementors to specify
|
||||
a small part of it. For example, we could define the `Summary` trait to have a
|
||||
`summarize_author` method whose implementation is required, and then define a
|
||||
`summarize` method that has a default implementation that calls the
|
||||
`summarize_author` method:
|
||||
|
||||
```rust
|
||||
pub trait Summary {
|
||||
fn summarize_author(&self) -> String;
|
||||
|
||||
fn summarize(&self) -> String {
|
||||
format!("(Read more from {}...)", self.summarize_author())
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
To use this version of `Summary`, we only need to define `summarize_author`
|
||||
when we implement the trait on a type:
|
||||
|
||||
```rust,ignore
|
||||
impl Summary for Tweet {
|
||||
fn summarize_author(&self) -> String {
|
||||
format!("@{}", self.username)
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
After we define `summarize_author`, we can call `summarize` on instances of the
|
||||
`Tweet` struct, and the default implementation of `summarize` will call the
|
||||
definition of `summarize_author` that we’ve provided. Because we’ve implemented
|
||||
`summarize_author`, the `Summary` trait has given us the behavior of the
|
||||
`summarize` method without requiring us to write any more code.
|
||||
|
||||
```rust,ignore
|
||||
let tweet = Tweet {
|
||||
username: String::from("horse_ebooks"),
|
||||
content: String::from("of course, as you probably already know, people"),
|
||||
reply: false,
|
||||
retweet: false,
|
||||
};
|
||||
|
||||
println!("1 new tweet: {}", tweet.summarize());
|
||||
```
|
||||
|
||||
This code prints `1 new tweet: (Read more from @horse_ebooks...)`.
|
||||
|
||||
Note that it isn’t possible to call the default implementation from an
|
||||
overriding implementation of that same method.
|
||||
|
||||
### Trait Bounds
|
||||
|
||||
Now that you know how to define traits and implement those traits on types, we
|
||||
can explore how to use traits with generic type parameters. We can use *trait
|
||||
bounds* to constrain generic types to ensure the type will be limited to those
|
||||
that implement a particular trait and behavior.
|
||||
|
||||
For example, in Listing 10-13, we implemented the `Summary` trait on the types
|
||||
`NewsArticle` and `Tweet`. We can define a function `notify` that calls the
|
||||
`summarize` method on its parameter `item`, which is of the generic type `T`.
|
||||
To be able to call `summarize` on `item` without getting an error telling us
|
||||
that the generic type `T` doesn’t implement the method `summarize`, we can use
|
||||
trait bounds on `T` to specify that `item` must be of a type that implements
|
||||
the `Summary` trait:
|
||||
|
||||
```rust,ignore
|
||||
pub fn notify<T: Summary>(item: T) {
|
||||
println!("Breaking news! {}", item.summarize());
|
||||
}
|
||||
```
|
||||
|
||||
We place trait bounds with the declaration of the generic type parameter, after
|
||||
a colon and inside angle brackets. Because of the trait bound on `T`, we can
|
||||
call `notify` and pass in any instance of `NewsArticle` or `Tweet`. Code that
|
||||
calls the function with any other type, like a `String` or an `i32`, won’t
|
||||
compile, because those types don’t implement `Summary`.
|
||||
|
||||
We can specify multiple trait bounds on a generic type using the `+` syntax.
|
||||
For example, to use display formatting on the type `T` in a function as well as
|
||||
the `summarize` method, we can use `T: Summary + Display` to say `T` can be any
|
||||
type that implements `Summary` and `Display`.
|
||||
|
||||
However, there are downsides to using too many trait bounds. Each generic has
|
||||
its own trait bounds; so functions with multiple generic type parameters can
|
||||
have lots of trait bound information between a function’s name and its
|
||||
parameter list, making the function signature hard to read. For this reason,
|
||||
Rust has alternate syntax for specifying trait bounds inside a `where` clause
|
||||
after the function signature. So instead of writing this:
|
||||
|
||||
```rust,ignore
|
||||
fn some_function<T: Display + Clone, U: Clone + Debug>(t: T, u: U) -> i32 {
|
||||
```
|
||||
|
||||
we can use a `where` clause, like this:
|
||||
|
||||
```rust,ignore
|
||||
fn some_function<T, U>(t: T, u: U) -> i32
|
||||
where T: Display + Clone,
|
||||
U: Clone + Debug
|
||||
{
|
||||
```
|
||||
|
||||
This function’s signature is less cluttered in that the function name,
|
||||
parameter list, and return type are close together, similar to a function
|
||||
without lots of trait bounds.
|
||||
|
||||
### Fixing the `largest` Function with Trait Bounds
|
||||
|
||||
Now that you know how to specify the behavior you want to use using the generic
|
||||
type parameter’s bounds, let’s return to Listing 10-5 to fix the definition of
|
||||
the `largest` function that uses a generic type parameter! Last time we tried
|
||||
to run that code, we received this error:
|
||||
|
||||
```text
|
||||
error[E0369]: binary operation `>` cannot be applied to type `T`
|
||||
--> src/main.rs:5:12
|
||||
|
|
||||
5 | if item > largest {
|
||||
| ^^^^^^^^^^^^^^
|
||||
|
|
||||
= note: an implementation of `std::cmp::PartialOrd` might be missing for `T`
|
||||
```
|
||||
|
||||
In the body of `largest` we wanted to compare two values of type `T` using the
|
||||
greater-than (`>`) operator. Because that operator is defined as a default
|
||||
method on the standard library trait `std::cmp::PartialOrd`, we need to specify
|
||||
`PartialOrd` in the trait bounds for `T` so the `largest` function can work on
|
||||
slices of any type that we can compare. We don’t need to bring `PartialOrd`
|
||||
into scope because it’s in the prelude. Change the signature of `largest` to
|
||||
look like this:
|
||||
|
||||
```rust,ignore
|
||||
fn largest<T: PartialOrd>(list: &[T]) -> T {
|
||||
```
|
||||
|
||||
This time when we compile the code, we get a different set of errors:
|
||||
|
||||
```text
|
||||
error[E0508]: cannot move out of type `[T]`, a non-copy slice
|
||||
--> src/main.rs:2:23
|
||||
|
|
||||
2 | let mut largest = list[0];
|
||||
| ^^^^^^^
|
||||
| |
|
||||
| cannot move out of here
|
||||
| help: consider using a reference instead: `&list[0]`
|
||||
|
||||
error[E0507]: cannot move out of borrowed content
|
||||
--> src/main.rs:4:9
|
||||
|
|
||||
4 | for &item in list.iter() {
|
||||
| ^----
|
||||
| ||
|
||||
| |hint: to prevent move, use `ref item` or `ref mut item`
|
||||
| cannot move out of borrowed content
|
||||
```
|
||||
|
||||
The key line in this error is `cannot move out of type [T], a non-copy slice`.
|
||||
With our non-generic versions of the `largest` function, we were only trying to
|
||||
find the largest `i32` or `char`. As discussed in the “Stack-Only Data: Copy”
|
||||
section in Chapter 4, types like `i32` and `char` that have a known size can be
|
||||
stored on the stack, so they implement the `Copy` trait. But when we made the
|
||||
`largest` function generic, it became possible for the `list` parameter to have
|
||||
types in it that don’t implement the `Copy` trait. Consequently, we wouldn’t be
|
||||
able to move the value out of `list[0]` and into the `largest` variable,
|
||||
resulting in this error.
|
||||
|
||||
To call this code with only those types that implement the `Copy` trait, we can
|
||||
add `Copy` to the trait bounds of `T`! Listing 10-15 shows the complete code of
|
||||
a generic `largest` function that will compile as long as the types of the
|
||||
values in the slice that we pass into the function implement the `PartialOrd`
|
||||
*and* `Copy` traits, like `i32` and `char` do:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn largest<T: PartialOrd + Copy>(list: &[T]) -> T {
|
||||
let mut largest = list[0];
|
||||
|
||||
for &item in list.iter() {
|
||||
if item > largest {
|
||||
largest = item;
|
||||
}
|
||||
}
|
||||
|
||||
largest
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let number_list = vec![34, 50, 25, 100, 65];
|
||||
|
||||
let result = largest(&number_list);
|
||||
println!("The largest number is {}", result);
|
||||
|
||||
let char_list = vec!['y', 'm', 'a', 'q'];
|
||||
|
||||
let result = largest(&char_list);
|
||||
println!("The largest char is {}", result);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-15: A working definition of the `largest`
|
||||
function that works on any generic type that implements the `PartialOrd` and
|
||||
`Copy` traits</span>
|
||||
|
||||
If we don’t want to restrict the `largest` function to the types that implement
|
||||
the `Copy` trait, we could specify that `T` has the trait bound `Clone` instead
|
||||
of `Copy`. Then we could clone each value in the slice when we want the
|
||||
`largest` function to have ownership. Using the `clone` function means we’re
|
||||
potentially making more heap allocations in the case of types that own heap
|
||||
data like `String`, and heap allocations can be slow if we’re working with
|
||||
large amounts of data.
|
||||
|
||||
Another way we could implement `largest` is for the function to return a
|
||||
reference to a `T` value in the slice. If we change the return type to `&T`
|
||||
instead of `T`, thereby changing the body of the function to return a
|
||||
reference, we wouldn’t need the `Clone` or `Copy` trait bounds and we could
|
||||
avoid heap allocations. Try implementing these alternate solutions on your own!
|
||||
|
||||
### Using Trait Bounds to Conditionally Implement Methods
|
||||
|
||||
By using a trait bound with an `impl` block that uses generic type parameters,
|
||||
we can implement methods conditionally for types that implement the specified
|
||||
traits. For example, the type `Pair<T>` in Listing 10-16 always implements the
|
||||
`new` function. But `Pair<T>` only implements the `cmp_display` method if its
|
||||
inner type `T` implements the `PartialOrd` trait that enables comparison *and*
|
||||
the `Display` trait that enables printing:
|
||||
|
||||
```rust
|
||||
use std::fmt::Display;
|
||||
|
||||
struct Pair<T> {
|
||||
x: T,
|
||||
y: T,
|
||||
}
|
||||
|
||||
impl<T> Pair<T> {
|
||||
fn new(x: T, y: T) -> Self {
|
||||
Self {
|
||||
x,
|
||||
y,
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
impl<T: Display + PartialOrd> Pair<T> {
|
||||
fn cmp_display(&self) {
|
||||
if self.x >= self.y {
|
||||
println!("The largest member is x = {}", self.x);
|
||||
} else {
|
||||
println!("The largest member is y = {}", self.y);
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-16: Conditionally implement methods on a
|
||||
generic type depending on trait bounds</span>
|
||||
|
||||
We can also conditionally implement a trait for any type that implements
|
||||
another trait. Implementations of a trait on any type that satisfies the trait
|
||||
bounds are called *blanket implementations* and are extensively used in the
|
||||
Rust standard library. For example, the standard library implements the
|
||||
`ToString` trait on any type that implements the `Display` trait. The `impl`
|
||||
block in the standard library looks similar to this code:
|
||||
|
||||
```rust,ignore
|
||||
impl<T: Display> ToString for T {
|
||||
// --snip--
|
||||
}
|
||||
```
|
||||
|
||||
Because the standard library has this blanket implementation, we can call the
|
||||
`to_string` method defined by the `ToString` trait on any type that implements
|
||||
the `Display` trait. For example, we can turn integers into their corresponding
|
||||
`String` values like this because integers implement `Display`:
|
||||
|
||||
```rust
|
||||
let s = 3.to_string();
|
||||
```
|
||||
|
||||
Blanket implementations appear in the documentation for the trait in the
|
||||
“Implementors” section.
|
||||
|
||||
Traits and trait bounds let us write code that uses generic type parameters to
|
||||
reduce duplication but also specify to the compiler that we want the generic
|
||||
type to have particular behavior. The compiler can then use the trait bound
|
||||
information to check that all the concrete types used with our code provide the
|
||||
correct behavior. In dynamically typed languages, we would get an error at
|
||||
runtime if we called a method on a type that the type didn’t implement. But
|
||||
Rust moves these errors to compile time so we’re forced to fix the problems
|
||||
before our code is even able to run. Additionally, we don’t have to write code
|
||||
that checks for behavior at runtime because we’ve already checked at compile
|
||||
time. Doing so improves performance without having to give up the flexibility
|
||||
of generics.
|
||||
|
||||
Another kind of generic that we’ve already been using is called *lifetimes*.
|
||||
Rather than ensuring that a type has the behavior we want, lifetimes ensure
|
||||
that references are valid as long as we need them to be. Let’s look at how
|
||||
lifetimes do that.
|
||||
768
2018-edition/src/ch10-03-lifetime-syntax.md
Normal file
768
2018-edition/src/ch10-03-lifetime-syntax.md
Normal file
@@ -0,0 +1,768 @@
|
||||
## Validating References with Lifetimes
|
||||
|
||||
One detail we didn’t discuss in the “References and Borrowing” section in
|
||||
Chapter 4 is that every reference in Rust has a *lifetime*, which is the scope
|
||||
for which that reference is valid. Most of the time lifetimes are implicit and
|
||||
inferred, just like most of the time types are inferred. We must annotate types
|
||||
when multiple types are possible. In a similar way, we must annotate lifetimes
|
||||
when the lifetimes of references could be related in a few different ways. Rust
|
||||
requires us to annotate the relationships using generic lifetime parameters to
|
||||
ensure the actual references used at runtime will definitely be valid.
|
||||
|
||||
The concept of lifetimes is somewhat different from tools in other programming
|
||||
languages, arguably making lifetimes Rust’s most distinctive feature. Although
|
||||
we won’t cover lifetimes in their entirety in this chapter, we’ll discuss
|
||||
common ways you might encounter lifetime syntax so you can become familiar with
|
||||
the concepts. See the “Advanced Lifetimes” section in Chapter 19 for more
|
||||
detailed information.
|
||||
|
||||
### Lifetimes Prevent Dangling References
|
||||
|
||||
The main aim of lifetimes is to prevent dangling references, which cause a
|
||||
program to reference data other than the data it’s intended to reference.
|
||||
Consider the program in Listing 10-17, which has an outer scope and an inner
|
||||
scope:
|
||||
|
||||
```rust,ignore
|
||||
{
|
||||
let r;
|
||||
|
||||
{
|
||||
let x = 5;
|
||||
r = &x;
|
||||
}
|
||||
|
||||
println!("r: {}", r);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-17: An attempt to use a reference whose value
|
||||
has gone out of scope</span>
|
||||
|
||||
> Note: The example in Listing 10-17 and the next few examples declare
|
||||
> variables without giving them an initial value, so the variable name exists
|
||||
> in the outer scope. At first glance, this might appear to be in conflict with
|
||||
> Rust having no null values. However, if we try to use a variable before
|
||||
> giving it a value, we’ll get a compile time error, which shows that Rust
|
||||
> indeed does not allow null values.
|
||||
|
||||
The outer scope declares a variable named `r` with no initial value, and the
|
||||
inner scope declares a variable named `x` with the initial value of `5`. Inside
|
||||
the inner scope, we attempt to set the value of `r` as a reference to `x`. Then
|
||||
the inner scope ends, and we attempt to print the value in `r`. This code won’t
|
||||
compile because the value `r` is referring to has gone out of scope before we
|
||||
try to use it. Here is the error message:
|
||||
|
||||
```text
|
||||
error[E0597]: `x` does not live long enough
|
||||
--> src/main.rs:7:5
|
||||
|
|
||||
6 | r = &x;
|
||||
| - borrow occurs here
|
||||
7 | }
|
||||
| ^ `x` dropped here while still borrowed
|
||||
...
|
||||
10 | }
|
||||
| - borrowed value needs to live until here
|
||||
```
|
||||
|
||||
The variable `x` doesn’t “live long enough.” The reason is that `x` will be out
|
||||
of scope when the inner scope ends on line 7. But `r` is still valid for the
|
||||
outer scope; because its scope is larger, we say that it “lives longer.” If
|
||||
Rust allowed this code to work, `r` would be referencing memory that was
|
||||
deallocated when `x` went out of scope, and anything we tried to do with `r`
|
||||
wouldn’t work correctly. So how does Rust determine that this code is invalid?
|
||||
It uses a borrow checker.
|
||||
|
||||
### The Borrow Checker
|
||||
|
||||
The Rust compiler has a *borrow checker* that compares scopes to determine that
|
||||
all borrows are valid. Listing 10-18 shows the same code as Listing 10-17 but
|
||||
with annotations showing the lifetimes of the variables:
|
||||
|
||||
```rust,ignore
|
||||
{
|
||||
let r; // ---------+-- 'a
|
||||
// |
|
||||
{ // |
|
||||
let x = 5; // -+-- 'b |
|
||||
r = &x; // | |
|
||||
} // -+ |
|
||||
// |
|
||||
println!("r: {}", r); // |
|
||||
} // ---------+
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-18: Annotations of the lifetimes of `r` and
|
||||
`x`, named `'a` and `'b`, respectively</span>
|
||||
|
||||
Here, we’ve annotated the lifetime of `r` with `'a` and the lifetime of `x`
|
||||
with `'b`. As you can see, the inner `'b` block is much smaller than the outer
|
||||
`'a` lifetime block. At compile time, Rust compares the size of the two
|
||||
lifetimes and sees that `r` has a lifetime of `'a` but that it refers to memory
|
||||
with a lifetime of `'b`. The program is rejected because `'b` is shorter than
|
||||
`'a`: the subject of the reference doesn’t live as long as the reference.
|
||||
|
||||
Listing 10-19 fixes the code so it doesn’t have a dangling reference and
|
||||
compiles without any errors:
|
||||
|
||||
```rust
|
||||
{
|
||||
let x = 5; // ----------+-- 'b
|
||||
// |
|
||||
let r = &x; // --+-- 'a |
|
||||
// | |
|
||||
println!("r: {}", r); // | |
|
||||
// --+ |
|
||||
} // ----------+
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-19: A valid reference because the data has a
|
||||
longer lifetime than the reference</span>
|
||||
|
||||
Here, `x` has the lifetime `'b`, which in this case is larger than `'a`. This
|
||||
means `r` can reference `x` because Rust knows that the reference in `r` will
|
||||
always be valid while `x` is valid.
|
||||
|
||||
Now that you know where the lifetimes of references are and how Rust analyzes
|
||||
lifetimes to ensure references will always be valid, let’s explore generic
|
||||
lifetimes of parameters and return values in the context of functions.
|
||||
|
||||
### Generic Lifetimes in Functions
|
||||
|
||||
Let’s write a function that returns the longer of two string slices. This
|
||||
function will take two string slices and return a string slice. After we’ve
|
||||
implemented the `longest` function, the code in Listing 10-20 should print `The
|
||||
longest string is abcd`:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let string1 = String::from("abcd");
|
||||
let string2 = "xyz";
|
||||
|
||||
let result = longest(string1.as_str(), string2);
|
||||
println!("The longest string is {}", result);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-20: A `main` function that calls the `longest`
|
||||
function to find the longest of two string slices</span>
|
||||
|
||||
Note that we want the function to take string slices, which are references,
|
||||
because we don’t want the `longest` function to take ownership of its
|
||||
parameters. We want to allow the function to accept slices of a `String` (the
|
||||
type stored in the variable `string1`) as well as string literals (which is
|
||||
what variable `string2` contains).
|
||||
|
||||
Refer to the “String Slices as Parameters” section in Chapter 4 for more
|
||||
discussion about why the parameters we use in Listing 10-20 are the ones we
|
||||
want.
|
||||
|
||||
If we try to implement the `longest` function as shown in Listing 10-21, it
|
||||
won’t compile:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn longest(x: &str, y: &str) -> &str {
|
||||
if x.len() > y.len() {
|
||||
x
|
||||
} else {
|
||||
y
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-21: An implementation of the `longest`
|
||||
function that returns the longer of two string slices but does not yet
|
||||
compile</span>
|
||||
|
||||
Instead, we get the following error that talks about lifetimes:
|
||||
|
||||
```text
|
||||
error[E0106]: missing lifetime specifier
|
||||
--> src/main.rs:1:33
|
||||
|
|
||||
1 | fn longest(x: &str, y: &str) -> &str {
|
||||
| ^ expected lifetime parameter
|
||||
|
|
||||
= help: this function's return type contains a borrowed value, but the
|
||||
signature does not say whether it is borrowed from `x` or `y`
|
||||
```
|
||||
|
||||
The help text reveals that the return type needs a generic lifetime parameter
|
||||
on it because Rust can’t tell whether the reference being returned refers to
|
||||
`x` or `y`. Actually, we don’t know either, because the `if` block in the body
|
||||
of this function returns a reference to `x` and the `else` block returns a
|
||||
reference to `y`!
|
||||
|
||||
When we’re defining this function, we don’t know the concrete values that will
|
||||
be passed into this function, so we don’t know whether the `if` case or the
|
||||
`else` case will execute. We also don’t know the concrete lifetimes of the
|
||||
references that will be passed in, so we can’t look at the scopes like we did
|
||||
in Listings 10-18 and 10-19 to determine that the reference we return will
|
||||
always be valid. The borrow checker can’t determine this either, because it
|
||||
doesn’t know how the lifetimes of `x` and `y` relate to the lifetime of the
|
||||
return value. To fix this error, we’ll add generic lifetime parameters that
|
||||
define the relationship between the references so the borrow checker can
|
||||
perform its analysis.
|
||||
|
||||
### Lifetime Annotation Syntax
|
||||
|
||||
Lifetime annotations don’t change how long any of the references live. Just
|
||||
like functions can accept any type when the signature specifies a generic type
|
||||
parameter, functions can accept references with any lifetime by specifying a
|
||||
generic lifetime parameter. Lifetime annotations describe the relationships of
|
||||
the lifetimes of multiple references to each other without affecting the
|
||||
lifetimes.
|
||||
|
||||
Lifetime annotations have a slightly unusual syntax: the names of lifetime
|
||||
parameters must start with an apostrophe `'` and are usually all lowercase and
|
||||
very short, like generic types. Most people use the name `'a`. We place
|
||||
lifetime parameter annotations after the `&` of a reference, using a space to
|
||||
separate the annotation from the reference’s type.
|
||||
|
||||
Here are some examples: a reference to an `i32` without a lifetime parameter, a
|
||||
reference to an `i32` that has a lifetime parameter named `'a`, and a mutable
|
||||
reference to an `i32` that also has the lifetime `'a`.
|
||||
|
||||
```rust,ignore
|
||||
&i32 // a reference
|
||||
&'a i32 // a reference with an explicit lifetime
|
||||
&'a mut i32 // a mutable reference with an explicit lifetime
|
||||
```
|
||||
|
||||
One lifetime annotation by itself doesn’t have much meaning because the
|
||||
annotations are meant to tell Rust how generic lifetime parameters of multiple
|
||||
references relate to each other. For example, let’s say we have a function with
|
||||
the parameter `first` that is a reference to an `i32` with lifetime `'a`. The
|
||||
function also has another parameter named `second` that is another reference to
|
||||
an `i32` that also has the lifetime `'a`. The lifetime annotations indicate
|
||||
that the references `first` and `second` must both live as long as that generic
|
||||
lifetime.
|
||||
|
||||
### Lifetime Annotations in Function Signatures
|
||||
|
||||
Now let’s examine lifetime annotations in the context of the `longest`
|
||||
function. As with generic type parameters, we need to declare generic lifetime
|
||||
parameters inside angle brackets between the function name and the parameter
|
||||
list. The constraint we want to express in this signature is that all the
|
||||
references in the parameters and the return value must have the same lifetime.
|
||||
We’ll name the lifetime `'a`, and then add it to each reference, as shown in
|
||||
Listing 10-22:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn longest<'a>(x: &'a str, y: &'a str) -> &'a str {
|
||||
if x.len() > y.len() {
|
||||
x
|
||||
} else {
|
||||
y
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-22: The `longest` function definition
|
||||
specifying that all the references in the signature must have the same lifetime
|
||||
`'a`</span>
|
||||
|
||||
This code should compile and produce the result we want when we use it with the
|
||||
`main` function in Listing 10-20.
|
||||
|
||||
The function signature now tells Rust that for some lifetime `'a`, the function
|
||||
takes two parameters, both of which are string slices that live at least as
|
||||
long as lifetime `'a`. The function signature also tells Rust that the string
|
||||
slice returned from the function will live at least as long as lifetime `'a`.
|
||||
These constraints are what we want Rust to enforce. Remember, when we specify
|
||||
the lifetime parameters in this function signature, we’re not changing the
|
||||
lifetimes of any values passed in or returned. Rather, we’re specifying that
|
||||
the borrow checker should reject any values that don’t adhere to these
|
||||
constraints. Note that the `longest` function doesn’t need to know exactly how
|
||||
long `x` and `y` will live, only that some scope can be substituted for `'a`
|
||||
that will satisfy this signature.
|
||||
|
||||
When annotating lifetimes in functions, the annotations go in the function
|
||||
signature, not in the function body. Rust can analyze the code within the
|
||||
function without any help. However, when a function has references to or from
|
||||
code outside that function, it becomes almost impossible for Rust to figure out
|
||||
the lifetimes of the parameters or return values on its own. The lifetimes
|
||||
might be different each time the function is called. This is why we need to
|
||||
annotate the lifetimes manually.
|
||||
|
||||
When we pass concrete references to `longest`, the concrete lifetime that is
|
||||
substituted for `'a` is the part of the scope of `x` that overlaps with the
|
||||
scope of `y`. In other words, the generic lifetime `'a` will get the concrete
|
||||
lifetime that is equal to the smaller of the lifetimes of `x` and `y`. Because
|
||||
we’ve annotated the returned reference with the same lifetime parameter `'a`,
|
||||
the returned reference will also be valid for the length of the smaller of the
|
||||
lifetimes of `x` and `y`.
|
||||
|
||||
Let’s look at how the lifetime annotations restrict the `longest` function by
|
||||
passing in references that have different concrete lifetimes. Listing 10-23 is
|
||||
a straightforward example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# fn longest<'a>(x: &'a str, y: &'a str) -> &'a str {
|
||||
# if x.len() > y.len() {
|
||||
# x
|
||||
# } else {
|
||||
# y
|
||||
# }
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let string1 = String::from("long string is long");
|
||||
|
||||
{
|
||||
let string2 = String::from("xyz");
|
||||
let result = longest(string1.as_str(), string2.as_str());
|
||||
println!("The longest string is {}", result);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-23: Using the `longest` function with
|
||||
references to `String` values that have different concrete lifetimes</span>
|
||||
|
||||
In this example, `string1` is valid until the end of the outer scope, `string2`
|
||||
is valid until the end of the inner scope, and `result` references something
|
||||
that is valid until the end of the inner scope. Run this code, and you’ll see
|
||||
that the borrow checker approves of this code; it will compile and print `The
|
||||
longest string is long string is long`.
|
||||
|
||||
Next, let’s try an example that shows that the lifetime of the reference in
|
||||
`result` must be the smaller lifetime of the two arguments. We’ll move the
|
||||
declaration of the `result` variable outside the inner scope but leave the
|
||||
assignment of the value to the `result` variable inside the scope with
|
||||
`string2`. Then we’ll move the `println!` that uses `result` outside the inner
|
||||
scope, after the inner scope has ended. The code in Listing 10-24 will not
|
||||
compile:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let string1 = String::from("long string is long");
|
||||
let result;
|
||||
{
|
||||
let string2 = String::from("xyz");
|
||||
result = longest(string1.as_str(), string2.as_str());
|
||||
}
|
||||
println!("The longest string is {}", result);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-24: Attempting to use `result` after `string2`
|
||||
has gone out of scope; the code won’t compile</span>
|
||||
|
||||
When we try to compile this code, we’ll get this error:
|
||||
|
||||
```text
|
||||
error[E0597]: `string2` does not live long enough
|
||||
--> src/main.rs:15:5
|
||||
|
|
||||
14 | result = longest(string1.as_str(), string2.as_str());
|
||||
| ------- borrow occurs here
|
||||
15 | }
|
||||
| ^ `string2` dropped here while still borrowed
|
||||
16 | println!("The longest string is {}", result);
|
||||
17 | }
|
||||
| - borrowed value needs to live until here
|
||||
```
|
||||
|
||||
The error shows that for `result` to be valid for the `println!` statement,
|
||||
`string2` would need to be valid until the end of the outer scope. Rust knows
|
||||
this because we annotated the lifetimes of the function parameters and return
|
||||
values using the same lifetime parameter `'a`.
|
||||
|
||||
As humans, we can look at this code and see that `string1` is longer than
|
||||
`string2`, and therefore `result` will contain a reference to `string1`.
|
||||
Because `string1` has not gone out of scope yet, a reference to `string1` will
|
||||
still be valid for the `println!` statement. However, the compiler can’t see
|
||||
that the reference is valid in this case. We’ve told Rust that the lifetime of
|
||||
the reference returned by the `longest` function is the same as the smaller of
|
||||
the lifetimes of the references passed in. Therefore, the borrow checker
|
||||
disallows the code in Listing 10-24 as possibly having an invalid reference.
|
||||
|
||||
Try designing more experiments that vary the values and lifetimes of the
|
||||
references passed in to the `longest` function and how the returned reference
|
||||
is used. Make hypotheses about whether or not your experiments will pass the
|
||||
borrow checker before you compile; then check to see if you’re right!
|
||||
|
||||
### Thinking in Terms of Lifetimes
|
||||
|
||||
The way in which you need to specify lifetime parameters depends on what your
|
||||
function is doing. For example, if we changed the implementation of the
|
||||
`longest` function to always return the first parameter rather than the longest
|
||||
string slice, we wouldn’t need to specify a lifetime on the `y` parameter. The
|
||||
following code will compile:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn longest<'a>(x: &'a str, y: &str) -> &'a str {
|
||||
x
|
||||
}
|
||||
```
|
||||
|
||||
In this example, we’ve specified a lifetime parameter `'a` for the parameter
|
||||
`x` and the return type, but not for the parameter `y`, because the lifetime of
|
||||
`y` does not have any relationship with the lifetime of `x` or the return value.
|
||||
|
||||
When returning a reference from a function, the lifetime parameter for the
|
||||
return type needs to match the lifetime parameter for one of the parameters. If
|
||||
the reference returned does *not* refer to one of the parameters, it must refer
|
||||
to a value created within this function, which would be a dangling reference
|
||||
because the value will go out of scope at the end of the function. Consider
|
||||
this attempted implementation of the `longest` function that won’t compile:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn longest<'a>(x: &str, y: &str) -> &'a str {
|
||||
let result = String::from("really long string");
|
||||
result.as_str()
|
||||
}
|
||||
```
|
||||
|
||||
Here, even though we’ve specified a lifetime parameter `'a` for the return
|
||||
type, this implementation will fail to compile because the return value
|
||||
lifetime is not related to the lifetime of the parameters at all. Here is the
|
||||
error message we get:
|
||||
|
||||
```text
|
||||
error[E0597]: `result` does not live long enough
|
||||
--> src/main.rs:3:5
|
||||
|
|
||||
3 | result.as_str()
|
||||
| ^^^^^^ does not live long enough
|
||||
4 | }
|
||||
| - borrowed value only lives until here
|
||||
|
|
||||
note: borrowed value must be valid for the lifetime 'a as defined on the
|
||||
function body at 1:1...
|
||||
--> src/main.rs:1:1
|
||||
|
|
||||
1 | / fn longest<'a>(x: &str, y: &str) -> &'a str {
|
||||
2 | | let result = String::from("really long string");
|
||||
3 | | result.as_str()
|
||||
4 | | }
|
||||
| |_^
|
||||
```
|
||||
|
||||
The problem is that `result` goes out of scope and gets cleaned up at the end
|
||||
of the `longest` function. We’re also trying to return a reference to `result`
|
||||
from the function. There is no way we can specify lifetime parameters that
|
||||
would change the dangling reference, and Rust won’t let us create a dangling
|
||||
reference. In this case, the best fix would be to return an owned data type
|
||||
rather than a reference so the calling function is then responsible for
|
||||
cleaning up the value.
|
||||
|
||||
Ultimately, lifetime syntax is about connecting the lifetimes of various
|
||||
parameters and return values of functions. Once they’re connected, Rust has
|
||||
enough information to allow memory-safe operations and disallow operations that
|
||||
would create dangling pointers or otherwise violate memory safety.
|
||||
|
||||
### Lifetime Annotations in Struct Definitions
|
||||
|
||||
So far, we’ve only defined structs to hold owned types. It’s possible for
|
||||
structs to hold references, but in that case we would need to add a lifetime
|
||||
annotation on every reference in the struct’s definition. Listing 10-25 has a
|
||||
struct named `ImportantExcerpt` that holds a string slice:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct ImportantExcerpt<'a> {
|
||||
part: &'a str,
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let novel = String::from("Call me Ishmael. Some years ago...");
|
||||
let first_sentence = novel.split('.')
|
||||
.next()
|
||||
.expect("Could not find a '.'");
|
||||
let i = ImportantExcerpt { part: first_sentence };
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-25: A struct that holds a reference, so its
|
||||
definition needs a lifetime annotation</span>
|
||||
|
||||
This struct has one field, `part`, that holds a string slice, which is a
|
||||
reference. As with generic data types, we declare the name of the generic
|
||||
lifetime parameter inside angle brackets after the name of the struct so we can
|
||||
use the lifetime parameter in the body of the struct definition. This
|
||||
annotation means an instance of `ImportantExcerpt` can’t outlive the reference
|
||||
it holds in its `part` field.
|
||||
|
||||
The `main` function here creates an instance of the `ImportantExcerpt` struct
|
||||
that holds a reference to the first sentence of the `String` owned by the
|
||||
variable `novel`. The data in `novel` exists before the `ImportantExcerpt`
|
||||
instance is created. In addition, `novel` doesn’t go out of scope until after
|
||||
the `ImportantExcerpt` goes out of scope, so the reference in the
|
||||
`ImportantExcerpt` instance is valid.
|
||||
|
||||
### Lifetime Elision
|
||||
|
||||
You’ve learned that every reference has a lifetime and that you need to specify
|
||||
lifetime parameters for functions or structs that use references. However, in
|
||||
Chapter 4 we had a function in the “String Slices” section, which is shown again
|
||||
in Listing 10-26, that compiled without lifetime annotations:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
fn first_word(s: &str) -> &str {
|
||||
let bytes = s.as_bytes();
|
||||
|
||||
for (i, &item) in bytes.iter().enumerate() {
|
||||
if item == b' ' {
|
||||
return &s[0..i];
|
||||
}
|
||||
}
|
||||
|
||||
&s[..]
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 10-26: A function we defined in Chapter 4 that
|
||||
compiled without lifetime annotations, even though the parameter and return
|
||||
type are references</span>
|
||||
|
||||
The reason this function compiles without lifetime annotations is historical:
|
||||
in early versions (pre-1.0) of Rust, this code wouldn’t have compiled because
|
||||
every reference needed an explicit lifetime. At that time, the function
|
||||
signature would have been written like this:
|
||||
|
||||
```rust,ignore
|
||||
fn first_word<'a>(s: &'a str) -> &'a str {
|
||||
```
|
||||
|
||||
After writing a lot of Rust code, the Rust team found that Rust programmers
|
||||
were entering the same lifetime annotations over and over in particular
|
||||
situations. These situations were predictable and followed a few deterministic
|
||||
patterns. The developers programmed these patterns into the compiler’s code so
|
||||
the borrow checker could infer the lifetimes in these situations and not need
|
||||
explicit annotations.
|
||||
|
||||
This piece of Rust history is relevant because it’s possible that more
|
||||
deterministic patterns will emerge and be added to the compiler. In the future,
|
||||
even fewer lifetime annotations might be required.
|
||||
|
||||
The patterns programmed into Rust’s analysis of references are called the
|
||||
*lifetime elision rules*. These aren’t rules for programmers to follow; they’re
|
||||
a set of particular cases that the compiler will consider, and if your code
|
||||
fits these cases, you don’t need to write the lifetimes explicitly.
|
||||
|
||||
The elision rules don’t provide full inference. If Rust deterministically
|
||||
applies the rules but there is still ambiguity as to what lifetimes the
|
||||
references have, the compiler won’t guess what the lifetime of the remaining
|
||||
references should be. In this case, instead of guessing, the compiler will give
|
||||
you an error that you can resolve by adding the lifetime annotations that
|
||||
specify how the references relate to each other.
|
||||
|
||||
Lifetimes on function or method parameters are called *input lifetimes*, and
|
||||
lifetimes on return values are called *output lifetimes*.
|
||||
|
||||
The compiler uses three rules to figure out what lifetimes references have when
|
||||
there aren’t explicit annotations. The first rule applies to input lifetimes,
|
||||
and the second and third rules apply to output lifetimes. If the compiler gets
|
||||
to the end of the three rules and there are still references for which it can’t
|
||||
figure out lifetimes, the compiler will stop with an error.
|
||||
|
||||
The first rule is that each parameter that is a reference gets its own lifetime
|
||||
parameter. In other words, a function with one parameter gets one lifetime
|
||||
parameter: `fn foo<'a>(x: &'a i32)`; a function with two parameters gets two
|
||||
separate lifetime parameters: `fn foo<'a, 'b>(x: &'a i32, y: &'b i32)`; and so
|
||||
on.
|
||||
|
||||
The second rule is if there is exactly one input lifetime parameter, that
|
||||
lifetime is assigned to all output lifetime parameters: `fn foo<'a>(x: &'a i32)
|
||||
-> &'a i32`.
|
||||
|
||||
The third rule is if there are multiple input lifetime parameters, but one of
|
||||
them is `&self` or `&mut self` because this is a method, the lifetime of `self`
|
||||
is assigned to all output lifetime parameters. This third rule makes methods
|
||||
much nicer to read and write because fewer symbols are necessary.
|
||||
|
||||
Let’s pretend we’re the compiler. We’ll apply these rules to figure out what
|
||||
the lifetimes of the references in the signature of the `first_word` function
|
||||
in Listing 10-26 are. The signature starts without any lifetimes associated
|
||||
with the references:
|
||||
|
||||
```rust,ignore
|
||||
fn first_word(s: &str) -> &str {
|
||||
```
|
||||
|
||||
Then the compiler applies the first rule, which specifies that each parameter
|
||||
gets its own lifetime. We’ll call it `'a` as usual, so now the signature is:
|
||||
|
||||
```rust,ignore
|
||||
fn first_word<'a>(s: &'a str) -> &str {
|
||||
```
|
||||
|
||||
The second rule applies because there is exactly one input lifetime. The second
|
||||
rule specifies that the lifetime of the one input parameter gets assigned to
|
||||
the output lifetime, so the signature is now this:
|
||||
|
||||
```rust,ignore
|
||||
fn first_word<'a>(s: &'a str) -> &'a str {
|
||||
```
|
||||
|
||||
Now all the references in this function signature have lifetimes, and the
|
||||
compiler can continue its analysis without needing the programmer to annotate
|
||||
the lifetimes in this function signature.
|
||||
|
||||
Let’s look at another example, this time using the `longest` function that had
|
||||
no lifetime parameters when we started working with it in Listing 10-21:
|
||||
|
||||
```rust,ignore
|
||||
fn longest(x: &str, y: &str) -> &str {
|
||||
```
|
||||
|
||||
Let’s apply the first rule: each parameter gets its own lifetime. This time we
|
||||
have two parameters instead of one, so we have two lifetimes:
|
||||
|
||||
```rust,ignore
|
||||
fn longest<'a, 'b>(x: &'a str, y: &'b str) -> &str {
|
||||
```
|
||||
|
||||
You can see that the second rule doesn’t apply because there is more than one
|
||||
input lifetime. The third rule doesn’t apply either, because `longest` is a
|
||||
function rather than a method, so none of the parameters are `self`. After
|
||||
working through all three rules, we still haven’t figured out what the return
|
||||
type’s lifetime is. This is why we got an error trying to compile the code in
|
||||
Listing 10-21: the compiler worked through the lifetime elision rules but still
|
||||
couldn’t figure out all the lifetimes of the references in the signature.
|
||||
|
||||
Because the third rule really only applies in method signatures, we’ll look at
|
||||
lifetimes in that context next to see why the third rule means we don’t have to
|
||||
annotate lifetimes in method signatures very often.
|
||||
|
||||
### Lifetime Annotations in Method Definitions
|
||||
|
||||
When we implement methods on a struct with lifetimes, we use the same syntax as
|
||||
that of generic type parameters shown in Listing 10-11. Where we declare and
|
||||
use the lifetime parameters depends on whether they’re related to the struct
|
||||
fields or the method parameters and return values.
|
||||
|
||||
Lifetime names for struct fields always need to be declared after the `impl`
|
||||
keyword and then used after the struct’s name, because those lifetimes are part
|
||||
of the struct’s type.
|
||||
|
||||
In method signatures inside the `impl` block, references might be tied to the
|
||||
lifetime of references in the struct’s fields, or they might be independent. In
|
||||
addition, the lifetime elision rules often make it so that lifetime annotations
|
||||
aren’t necessary in method signatures. Let’s look at some examples using the
|
||||
struct named `ImportantExcerpt` that we defined in Listing 10-25.
|
||||
|
||||
First, we’ll use a method named `level` whose only parameter is a reference to
|
||||
`self` and whose return value is an `i32`, which is not a reference to anything:
|
||||
|
||||
```rust
|
||||
# struct ImportantExcerpt<'a> {
|
||||
# part: &'a str,
|
||||
# }
|
||||
#
|
||||
impl<'a> ImportantExcerpt<'a> {
|
||||
fn level(&self) -> i32 {
|
||||
3
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
The lifetime parameter declaration after `impl` and use after the type name is
|
||||
required, but we’re not required to annotate the lifetime of the reference to
|
||||
`self` because of the first elision rule.
|
||||
|
||||
Here is an example where the third lifetime elision rule applies:
|
||||
|
||||
```rust
|
||||
# struct ImportantExcerpt<'a> {
|
||||
# part: &'a str,
|
||||
# }
|
||||
#
|
||||
impl<'a> ImportantExcerpt<'a> {
|
||||
fn announce_and_return_part(&self, announcement: &str) -> &str {
|
||||
println!("Attention please: {}", announcement);
|
||||
self.part
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
There are two input lifetimes, so Rust applies the first lifetime elision rule
|
||||
and gives both `&self` and `announcement` their own lifetimes. Then, because
|
||||
one of the parameters is `&self`, the return type gets the lifetime of `&self`,
|
||||
and all lifetimes have been accounted for.
|
||||
|
||||
### The Static Lifetime
|
||||
|
||||
One special lifetime we need to discuss is `'static`, which denotes the entire
|
||||
duration of the program. All string literals have the `'static` lifetime, which
|
||||
we can annotate as follows: `let s: &'static str = "I have a static
|
||||
lifetime.";`.
|
||||
|
||||
The text of this string is stored directly in the binary of your program, which
|
||||
is always available. Therefore, the lifetime of all string literals is
|
||||
`'static`.
|
||||
|
||||
You might see suggestions to use the `'static` lifetime in error messages. But
|
||||
before specifying `'static` as the lifetime for a reference, think about
|
||||
whether the reference you have actually lives the entire lifetime of your
|
||||
program or not. You might consider whether you want it to live that long, even
|
||||
if it could. Most of the time, the problem results from attempting to create a
|
||||
dangling reference or a mismatch of the available lifetimes. In such cases, the
|
||||
solution is fixing those problems, not specifying the `'static` lifetime.
|
||||
|
||||
## Generic Type Parameters, Trait Bounds, and Lifetimes Together
|
||||
|
||||
Let’s briefly look at the syntax of specifying generic type parameters, trait
|
||||
bounds, and lifetimes all in one function!
|
||||
|
||||
```rust
|
||||
use std::fmt::Display;
|
||||
|
||||
fn longest_with_an_announcement<'a, T>(x: &'a str, y: &'a str, ann: T) -> &'a str
|
||||
where T: Display
|
||||
{
|
||||
println!("Announcement! {}", ann);
|
||||
if x.len() > y.len() {
|
||||
x
|
||||
} else {
|
||||
y
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
This is the `longest` function from Listing 10-22 that returns the longer of
|
||||
two string slices. But now it has an extra parameter named `ann` of the generic
|
||||
type `T`, which can be filled in by any type that implements the `Display`
|
||||
trait as specified by the `where` clause. This extra parameter will be printed
|
||||
before the function compares the lengths of the string slices, which is why the
|
||||
`Display` trait bound is necessary. Because lifetimes are a type of generic,
|
||||
the declarations of the lifetime parameter `'a` and the generic type parameter
|
||||
`T` go in the same list inside the angle brackets after the function name.
|
||||
|
||||
## Summary
|
||||
|
||||
We covered a lot in this chapter! Now that you know about generic type
|
||||
parameters, traits and trait bounds, and generic lifetime parameters, you’re
|
||||
ready to write code without repetition that works in many different situations.
|
||||
Generic type parameters let you apply the code to different types. Traits and
|
||||
trait bounds ensure that even though the types are generic, they’ll have the
|
||||
behavior the code needs. You learned how to use lifetime annotations to ensure
|
||||
that this flexible code won’t have any dangling references. And all of this
|
||||
analysis happens at compile time, which doesn’t affect runtime performance!
|
||||
|
||||
Believe it or not, there is much more to learn on the topics we discussed in
|
||||
this chapter: Chapter 17 discusses trait objects, which are another way to use
|
||||
traits. Chapter 19 covers more complex scenarios involving lifetime annotations
|
||||
as well as some advanced type system features. But in the next chapter, you’ll
|
||||
learn how to write tests in Rust so you can make sure your code is working the
|
||||
way it should.
|
||||
34
2018-edition/src/ch11-00-testing.md
Normal file
34
2018-edition/src/ch11-00-testing.md
Normal file
@@ -0,0 +1,34 @@
|
||||
# Writing Automated Tests
|
||||
|
||||
In his 1972 essay “The Humble Programmer,” Edsger W. Dijkstra said that
|
||||
“Program testing can be a very effective way to show the presence of bugs, but
|
||||
it is hopelessly inadequate for showing their absence.” That doesn’t mean we
|
||||
shouldn’t try to test as much as we can!
|
||||
|
||||
Correctness in our programs is the extent to which our code does what we intend
|
||||
it to do. Rust is designed with a high degree of concern about the correctness
|
||||
of programs, but correctness is complex and not easy to prove. Rust’s type
|
||||
system shoulders a huge part of this burden, but the type system cannot catch
|
||||
every kind of incorrectness. As such, Rust includes support for writing
|
||||
automated software tests within the language.
|
||||
|
||||
As an example, say we write a function called `add_two` that adds 2 to whatever
|
||||
number is passed to it. This function’s signature accepts an integer as a
|
||||
parameter and returns an integer as a result. When we implement and compile
|
||||
that function, Rust does all the type checking and borrow checking that you’ve
|
||||
learned so far to ensure that, for instance, we aren’t passing a `String` value
|
||||
or an invalid reference to this function. But Rust *can’t* check that this
|
||||
function will do precisely what we intend, which is return the parameter plus 2
|
||||
rather than, say, the parameter plus 10 or the parameter minus 50! That’s where
|
||||
tests come in.
|
||||
|
||||
We can write tests that assert, for example, that when we pass `3` to the
|
||||
`add_two` function, the returned value is `5`. We can run these tests whenever
|
||||
we make changes to our code to make sure any existing correct behavior has not
|
||||
changed.
|
||||
|
||||
Testing is a complex skill: although we can’t cover every detail about how to
|
||||
write good tests in one chapter, we’ll discuss the mechanics of Rust’s testing
|
||||
facilities. We’ll talk about the annotations and macros available to you when
|
||||
writing your tests, the default behavior and options provided for running your
|
||||
tests, and how to organize tests into unit tests and integration tests.
|
||||
806
2018-edition/src/ch11-01-writing-tests.md
Normal file
806
2018-edition/src/ch11-01-writing-tests.md
Normal file
@@ -0,0 +1,806 @@
|
||||
## How to Write Tests
|
||||
|
||||
Tests are Rust functions that verify that the non-test code is functioning in
|
||||
the expected manner. The bodies of test functions typically perform these three
|
||||
actions:
|
||||
|
||||
1. Set up any needed data or state.
|
||||
2. Run the code you want to test.
|
||||
3. Assert the results are what you expect.
|
||||
|
||||
Let’s look at the features Rust provides specifically for writing tests that
|
||||
take these actions, which include the `test` attribute, a few macros, and the
|
||||
`should_panic` attribute.
|
||||
|
||||
### The Anatomy of a Test Function
|
||||
|
||||
At its simplest, a test in Rust is a function that’s annotated with the `test`
|
||||
attribute. Attributes are metadata about pieces of Rust code; one example is
|
||||
the `derive` attribute we used with structs in Chapter 5. To change a function
|
||||
into a test function, add `#[test]` on the line before `fn`. When you run your
|
||||
tests with the `cargo test` command, Rust builds a test runner binary that runs
|
||||
the functions annotated with the `test` attribute and reports on whether each
|
||||
test function passes or fails.
|
||||
|
||||
In Chapter 7, we saw that when we make a new library project with Cargo, a test
|
||||
module with a test function in it is automatically generated for us. This
|
||||
module helps you start writing your tests so you don’t have to look up the
|
||||
exact structure and syntax of test functions every time you start a new
|
||||
project. You can add as many additional test functions and as many test modules
|
||||
as you want!
|
||||
|
||||
We’ll explore some aspects of how tests work by experimenting with the template
|
||||
test generated for us without actually testing any code. Then we’ll write some
|
||||
real-world tests that call some code that we’ve written and assert that its
|
||||
behavior is correct.
|
||||
|
||||
Let’s create a new library project called `adder`:
|
||||
|
||||
```text
|
||||
$ cargo new adder --lib
|
||||
Created library `adder` project
|
||||
$ cd adder
|
||||
```
|
||||
|
||||
The contents of the *src/lib.rs* file in your `adder` library should look like
|
||||
Listing 11-1:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
#[test]
|
||||
fn it_works() {
|
||||
assert_eq!(2 + 2, 4);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-1: The test module and function generated
|
||||
automatically by `cargo new`</span>
|
||||
|
||||
For now, let’s ignore the top two lines and focus on the function to see how it
|
||||
works. Note the `#[test]` annotation before the `fn` line: this attribute
|
||||
indicates this is a test function, so the test runner knows to treat this
|
||||
function as a test. We could also have non-test functions in the `tests` module
|
||||
to help set up common scenarios or perform common operations, so we need to
|
||||
indicate which functions are tests by using the `#[test]` attribute.
|
||||
|
||||
The function body uses the `assert_eq!` macro to assert that 2 + 2 equals 4.
|
||||
This assertion serves as an example of the format for a typical test. Let’s run
|
||||
it to see that this test passes.
|
||||
|
||||
The `cargo test` command runs all tests in our project, as shown in Listing
|
||||
11-2:
|
||||
|
||||
```text
|
||||
$ cargo test
|
||||
Compiling adder v0.1.0 (file:///projects/adder)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.22 secs
|
||||
Running target/debug/deps/adder-ce99bcc2479f4607
|
||||
|
||||
running 1 test
|
||||
test tests::it_works ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Doc-tests adder
|
||||
|
||||
running 0 tests
|
||||
|
||||
test result: ok. 0 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-2: The output from running the automatically
|
||||
generated test</span>
|
||||
|
||||
Cargo compiled and ran the test. After the `Compiling`, `Finished`, and
|
||||
`Running` lines is the line `running 1 test`. The next line shows the name
|
||||
of the generated test function, called `it_works`, and the result of running
|
||||
that test, `ok`. The overall summary of running the tests appears next. The
|
||||
text `test result: ok.` means that all the tests passed, and the portion that
|
||||
reads `1 passed; 0 failed` totals the number of tests that passed or failed.
|
||||
|
||||
Because we don’t have any tests we’ve marked as ignored, the summary shows `0
|
||||
ignored`. We also haven’t filtered the tests being run, so the end of the
|
||||
summary shows `0 filtered out`. We’ll talk about ignoring and filtering out
|
||||
tests in the next section, “Controlling How Tests Are Run.”
|
||||
|
||||
The `0 measured` statistic is for benchmark tests that measure performance.
|
||||
Benchmark tests are, as of this writing, only available in nightly Rust. See
|
||||
[the documentation about benchmark tests][bench] to learn more.
|
||||
|
||||
[bench]: ../../unstable-book/library-features/test.html
|
||||
|
||||
The next part of the test output, which starts with `Doc-tests adder`, is for
|
||||
the results of any documentation tests. We don’t have any documentation tests
|
||||
yet, but Rust can compile any code examples that appear in our API
|
||||
documentation. This feature helps us keep our docs and our code in sync! We’ll
|
||||
discuss how to write documentation tests in the “Documentation Comments”
|
||||
section of Chapter 14. For now, we’ll ignore the `Doc-tests` output.
|
||||
|
||||
Let’s change the name of our test to see how that changes the test output.
|
||||
Change the `it_works` function to a different name, such as `exploration`, like
|
||||
so:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
#[test]
|
||||
fn exploration() {
|
||||
assert_eq!(2 + 2, 4);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Then run `cargo test` again. The output now shows `exploration` instead of
|
||||
`it_works`:
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::exploration ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Let’s add another test, but this time we’ll make a test that fails! Tests fail
|
||||
when something in the test function panics. Each test is run in a new thread,
|
||||
and when the main thread sees that a test thread has died, the test is marked
|
||||
as failed. We talked about the simplest way to cause a panic in Chapter 9,
|
||||
which is to call the `panic!` macro. Enter the new test, `another`, so your
|
||||
*src/lib.rs* file looks like Listing 11-3:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
#[test]
|
||||
fn exploration() {
|
||||
assert_eq!(2 + 2, 4);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn another() {
|
||||
panic!("Make this test fail");
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-3: Adding a second test that will fail because
|
||||
we call the `panic!` macro</span>
|
||||
|
||||
Run the tests again using `cargo test`. The output should look like Listing
|
||||
11-4, which shows that our `exploration` test passed and `another` failed:
|
||||
|
||||
```text
|
||||
running 2 tests
|
||||
test tests::exploration ... ok
|
||||
test tests::another ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
---- tests::another stdout ----
|
||||
thread 'tests::another' panicked at 'Make this test fail', src/lib.rs:10:8
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
|
||||
failures:
|
||||
tests::another
|
||||
|
||||
test result: FAILED. 1 passed; 1 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
error: test failed
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-4: Test results when one test passes and one
|
||||
test fails</span>
|
||||
|
||||
Instead of `ok`, the line `test tests::another` shows `FAILED`. Two new
|
||||
sections appear between the individual results and the summary: the first
|
||||
section displays the detailed reason for each test failure. In this case,
|
||||
`another` failed because it `panicked at 'Make this test fail'`, which happened
|
||||
on line 10 in the *src/lib.rs* file. The next section lists just the names of
|
||||
all the failing tests, which is useful when there are lots of tests and lots of
|
||||
detailed failing test output. We can use the name of a failing test to run just
|
||||
that test to more easily debug it; we’ll talk more about ways to run tests in
|
||||
the “Controlling How Tests Are Run” section.
|
||||
|
||||
The summary line displays at the end: overall, our test result is `FAILED`.
|
||||
We had one test pass and one test fail.
|
||||
|
||||
Now that you’ve seen what the test results look like in different scenarios,
|
||||
let’s look at some macros other than `panic!` that are useful in tests.
|
||||
|
||||
### Checking Results with the `assert!` Macro
|
||||
|
||||
The `assert!` macro, provided by the standard library, is useful when you want
|
||||
to ensure that some condition in a test evaluates to `true`. We give the
|
||||
`assert!` macro an argument that evaluates to a Boolean. If the value is
|
||||
`true`, `assert!` does nothing and the test passes. If the value is `false`,
|
||||
the `assert!` macro calls the `panic!` macro, which causes the test to fail.
|
||||
Using the `assert!` macro helps us check that our code is functioning in the
|
||||
way we intend.
|
||||
|
||||
In Chapter 5, Listing 5-15, we used a `Rectangle` struct and a `can_hold`
|
||||
method, which are repeated here in Listing 11-5. Let’s put this code in the
|
||||
*src/lib.rs* file and write some tests for it using the `assert!` macro.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
#[derive(Debug)]
|
||||
pub struct Rectangle {
|
||||
length: u32,
|
||||
width: u32,
|
||||
}
|
||||
|
||||
impl Rectangle {
|
||||
pub fn can_hold(&self, other: &Rectangle) -> bool {
|
||||
self.length > other.length && self.width > other.width
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-5: Using the `Rectangle` struct and its
|
||||
`can_hold` method from Chapter 5</span>
|
||||
|
||||
The `can_hold` method returns a Boolean, which means it’s a perfect use case
|
||||
for the `assert!` macro. In Listing 11-6, we write a test that exercises the
|
||||
`can_hold` method by creating a `Rectangle` instance that has a length of 8 and
|
||||
a width of 7 and asserting that it can hold another `Rectangle` instance that
|
||||
has a length of 5 and a width of 1:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn larger_can_hold_smaller() {
|
||||
let larger = Rectangle { length: 8, width: 7 };
|
||||
let smaller = Rectangle { length: 5, width: 1 };
|
||||
|
||||
assert!(larger.can_hold(&smaller));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-6: A test for `can_hold` that checks whether a
|
||||
larger rectangle can indeed hold a smaller rectangle</span>
|
||||
|
||||
Note that we’ve added a new line inside the `tests` module: `use super::*;`.
|
||||
The `tests` module is a regular module that follows the usual visibility rules
|
||||
we covered in Chapter 7 in the “Privacy Rules” section. Because the `tests`
|
||||
module is an inner module, we need to bring the code under test in the outer
|
||||
module into the scope of the inner module. We use a glob here so anything we
|
||||
define in the outer module is available to this `tests` module.
|
||||
|
||||
We’ve named our test `larger_can_hold_smaller`, and we’ve created the two
|
||||
`Rectangle` instances that we need. Then we called the `assert!` macro and
|
||||
passed it the result of calling `larger.can_hold(&smaller)`. This expression
|
||||
is supposed to return `true`, so our test should pass. Let’s find out!
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::larger_can_hold_smaller ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
It does pass! Let’s add another test, this time asserting that a smaller
|
||||
rectangle cannot hold a larger rectangle:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn larger_can_hold_smaller() {
|
||||
// --snip--
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn smaller_cannot_hold_larger() {
|
||||
let larger = Rectangle { length: 8, width: 7 };
|
||||
let smaller = Rectangle { length: 5, width: 1 };
|
||||
|
||||
assert!(!smaller.can_hold(&larger));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Because the correct result of the `can_hold` function in this case is `false`,
|
||||
we need to negate that result before we pass it to the `assert!` macro. As a
|
||||
result, our test will pass if `can_hold` returns `false`:
|
||||
|
||||
```text
|
||||
running 2 tests
|
||||
test tests::smaller_cannot_hold_larger ... ok
|
||||
test tests::larger_can_hold_smaller ... ok
|
||||
|
||||
test result: ok. 2 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Two tests that pass! Now let’s see what happens to our test results when we
|
||||
introduce a bug in our code. Let’s change the implementation of the `can_hold`
|
||||
method by replacing the greater-than sign with a less-than sign when it
|
||||
compares the lengths:
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
# #[derive(Debug)]
|
||||
# pub struct Rectangle {
|
||||
# length: u32,
|
||||
# width: u32,
|
||||
# }
|
||||
// --snip--
|
||||
|
||||
impl Rectangle {
|
||||
pub fn can_hold(&self, other: &Rectangle) -> bool {
|
||||
self.length < other.length && self.width > other.width
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Running the tests now produces the following:
|
||||
|
||||
```text
|
||||
running 2 tests
|
||||
test tests::smaller_cannot_hold_larger ... ok
|
||||
test tests::larger_can_hold_smaller ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
---- tests::larger_can_hold_smaller stdout ----
|
||||
thread 'tests::larger_can_hold_smaller' panicked at 'assertion failed:
|
||||
larger.can_hold(&smaller)', src/lib.rs:22:8
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
|
||||
failures:
|
||||
tests::larger_can_hold_smaller
|
||||
|
||||
test result: FAILED. 1 passed; 1 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Our tests caught the bug! Because `larger.length` is 8 and `smaller.length` is
|
||||
5, the comparison of the lengths in `can_hold` now returns `false`: 8 is not
|
||||
less than 5.
|
||||
|
||||
### Testing Equality with the `assert_eq!` and `assert_ne!` Macros
|
||||
|
||||
A common way to test functionality is to compare the result of the code under
|
||||
test to the value you expect the code to return to make sure they’re equal. You
|
||||
could do this using the `assert!` macro and passing it an expression using the
|
||||
`==` operator. However, this is such a common test that the standard library
|
||||
provides a pair of macros—`assert_eq!` and `assert_ne!`—to perform this test
|
||||
more conveniently. These macros compare two arguments for equality or
|
||||
inequality, respectively. They’ll also print the two values if the assertion
|
||||
fails, which makes it easier to see *why* the test failed; conversely, the
|
||||
`assert!` macro only indicates that it got a `false` value for the `==`
|
||||
expression, not the values that lead to the `false` value.
|
||||
|
||||
In Listing 11-7, we write a function named `add_two` that adds `2` to its
|
||||
parameter and returns the result. Then we test this function using the
|
||||
`assert_eq!` macro.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
pub fn add_two(a: i32) -> i32 {
|
||||
a + 2
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn it_adds_two() {
|
||||
assert_eq!(4, add_two(2));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-7: Testing the function `add_two` using the
|
||||
`assert_eq!` macro</span>
|
||||
|
||||
Let’s check that it passes!
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::it_adds_two ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
The first argument we gave to the `assert_eq!` macro, `4`, is equal to the
|
||||
result of calling `add_two(2)`. The line for this test is `test
|
||||
tests::it_adds_two ... ok`, and the `ok` text indicates that our test passed!
|
||||
|
||||
Let’s introduce a bug into our code to see what it looks like when a test that
|
||||
uses `assert_eq!` fails. Change the implementation of the `add_two` function to
|
||||
instead add `3`:
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
pub fn add_two(a: i32) -> i32 {
|
||||
a + 3
|
||||
}
|
||||
```
|
||||
|
||||
Run the tests again:
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::it_adds_two ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
---- tests::it_adds_two stdout ----
|
||||
thread 'tests::it_adds_two' panicked at 'assertion failed: `(left == right)`
|
||||
left: `4`,
|
||||
right: `5`', src/lib.rs:11:8
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
|
||||
failures:
|
||||
tests::it_adds_two
|
||||
|
||||
test result: FAILED. 0 passed; 1 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Our test caught the bug! The `it_adds_two` test failed, displaying the message
|
||||
`` assertion failed: `(left == right)` `` and showing that `left` was `4` and
|
||||
`right` was `5`. This message is useful and helps us start debugging: it means
|
||||
the `left` argument to `assert_eq!` was `4` but the `right` argument, where we
|
||||
had `add_two(2)`, was `5`.
|
||||
|
||||
Note that in some languages and test frameworks, the parameters to the
|
||||
functions that assert two values are equal are called `expected` and `actual`,
|
||||
and the order in which we specify the arguments matters. However, in Rust,
|
||||
they’re called `left` and `right`, and the order in which we specify the value
|
||||
we expect and the value that the code under test produces doesn’t matter. We
|
||||
could write the assertion in this test as `assert_eq!(add_two(2), 4)`, which
|
||||
would result in a failure message that displays `` assertion failed: `(left ==
|
||||
right)` `` and that `left` was `5` and `right` was `4`.
|
||||
|
||||
The `assert_ne!` macro will pass if the two values we give it are not equal and
|
||||
fail if they’re equal. This macro is most useful for cases when we’re not sure
|
||||
what a value *will* be, but we know what the value definitely *won’t* be if our
|
||||
code is functioning as we intend. For example, if we’re testing a function that
|
||||
is guaranteed to change its input in some way, but the way in which the input
|
||||
is changed depends on the day of the week that we run our tests, the best thing
|
||||
to assert might be that the output of the function is not equal to the input.
|
||||
|
||||
Under the surface, the `assert_eq!` and `assert_ne!` macros use the operators
|
||||
`==` and `!=`, respectively. When the assertions fail, these macros print their
|
||||
arguments using debug formatting, which means the values being compared must
|
||||
implement the `PartialEq` and `Debug` traits. All the primitive types and most
|
||||
of the standard library types implement these traits. For structs and enums
|
||||
that you define, you’ll need to implement `PartialEq` to assert that values of
|
||||
those types are equal or not equal. You’ll need to implement `Debug` to print
|
||||
the values when the assertion fails. Because both traits are derivable traits,
|
||||
as mentioned in Listing 5-12 in Chapter 5, this is usually as straightforward
|
||||
as adding the `#[derive(PartialEq, Debug)]` annotation to your struct or enum
|
||||
definition. See Appendix C, “Derivable Traits,” for more details about these
|
||||
and other derivable traits.
|
||||
|
||||
### Adding Custom Failure Messages
|
||||
|
||||
You can also add a custom message to be printed with the failure message as
|
||||
optional arguments to the `assert!`, `assert_eq!`, and `assert_ne!` macros. Any
|
||||
arguments specified after the one required argument to `assert!` or the two
|
||||
required arguments to `assert_eq!` and `assert_ne!` are passed along to the
|
||||
`format!` macro (discussed in Chapter 8 in the “Concatenation with the `+`
|
||||
Operator or the `format!` Macro” section), so you can pass a format string that
|
||||
contains `{}` placeholders and values to go in those placeholders. Custom
|
||||
messages are useful to document what an assertion means; when a test fails,
|
||||
you’ll have a better idea of what the problem is with the code.
|
||||
|
||||
For example, let’s say we have a function that greets people by name and we
|
||||
want to test that the name we pass into the function appears in the output:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
pub fn greeting(name: &str) -> String {
|
||||
format!("Hello {}!", name)
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn greeting_contains_name() {
|
||||
let result = greeting("Carol");
|
||||
assert!(result.contains("Carol"));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
The requirements for this program haven’t been agreed upon yet, and we’re
|
||||
pretty sure the `Hello` text at the beginning of the greeting will change. We
|
||||
decided we don’t want to have to update the test when the requirements change,
|
||||
so instead of checking for exact equality to the value returned from the
|
||||
`greeting` function, we’ll just assert that the output contains the text of the
|
||||
input parameter.
|
||||
|
||||
Let’s introduce a bug into this code by changing `greeting` to not include
|
||||
`name` to see what this test failure looks like:
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
pub fn greeting(name: &str) -> String {
|
||||
String::from("Hello!")
|
||||
}
|
||||
```
|
||||
|
||||
Running this test produces the following:
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::greeting_contains_name ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
---- tests::greeting_contains_name stdout ----
|
||||
thread 'tests::greeting_contains_name' panicked at 'assertion failed:
|
||||
result.contains("Carol")', src/lib.rs:12:8
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
|
||||
failures:
|
||||
tests::greeting_contains_name
|
||||
```
|
||||
|
||||
This result just indicates that the assertion failed and which line the
|
||||
assertion is on. A more useful failure message in this case would print the
|
||||
value we got from the `greeting` function. Let’s change the test function,
|
||||
giving it a custom failure message made from a format string with a placeholder
|
||||
filled in with the actual value we got from the `greeting` function:
|
||||
|
||||
```rust,ignore
|
||||
#[test]
|
||||
fn greeting_contains_name() {
|
||||
let result = greeting("Carol");
|
||||
assert!(
|
||||
result.contains("Carol"),
|
||||
"Greeting did not contain name, value was `{}`", result
|
||||
);
|
||||
}
|
||||
```
|
||||
|
||||
Now when we run the test, we’ll get a more informative error message:
|
||||
|
||||
```text
|
||||
---- tests::greeting_contains_name stdout ----
|
||||
thread 'tests::greeting_contains_name' panicked at 'Greeting did not
|
||||
contain name, value was `Hello!`', src/lib.rs:12:8
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
```
|
||||
|
||||
We can see the value we actually got in the test output, which would help us
|
||||
debug what happened instead of what we were expecting to happen.
|
||||
|
||||
### Checking for Panics with `should_panic`
|
||||
|
||||
In addition to checking that our code returns the correct values we expect,
|
||||
it’s also important to check that our code handles error conditions as we
|
||||
expect. For example, consider the `Guess` type that we created in Chapter 9,
|
||||
Listing 9-9. Other code that uses `Guess` depends on the guarantee that `Guess`
|
||||
instances will contain only values between 1 and 100. We can write a test that
|
||||
ensures that attempting to create a `Guess` instance with a value outside that
|
||||
range panics.
|
||||
|
||||
We do this by adding another attribute, `should_panic`, to our test function.
|
||||
This attribute makes a test pass if the code inside the function panics; the
|
||||
test will fail if the code inside the function doesn’t panic.
|
||||
|
||||
Listing 11-8 shows a test that checks that the error conditions of `Guess::new`
|
||||
happen when we expect them to:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
pub struct Guess {
|
||||
value: u32,
|
||||
}
|
||||
|
||||
impl Guess {
|
||||
pub fn new(value: u32) -> Guess {
|
||||
if value < 1 || value > 100 {
|
||||
panic!("Guess value must be between 1 and 100, got {}.", value);
|
||||
}
|
||||
|
||||
Guess {
|
||||
value
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
#[should_panic]
|
||||
fn greater_than_100() {
|
||||
Guess::new(200);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-8: Testing that a condition will cause a
|
||||
`panic!`</span>
|
||||
|
||||
We place the `#[should_panic]` attribute after the `#[test]` attribute and
|
||||
before the test function it applies to. Let’s look at the result when this test
|
||||
passes:
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::greater_than_100 ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Looks good! Now let’s introduce a bug in our code by removing the condition
|
||||
that the `new` function will panic if the value is greater than 100:
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
# pub struct Guess {
|
||||
# value: u32,
|
||||
# }
|
||||
#
|
||||
// --snip--
|
||||
|
||||
impl Guess {
|
||||
pub fn new(value: u32) -> Guess {
|
||||
if value < 1 {
|
||||
panic!("Guess value must be between 1 and 100, got {}.", value);
|
||||
}
|
||||
|
||||
Guess {
|
||||
value
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
When we run the test in Listing 11-8, it will fail:
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::greater_than_100 ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
failures:
|
||||
tests::greater_than_100
|
||||
|
||||
test result: FAILED. 0 passed; 1 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
We don’t get a very helpful message in this case, but when we look at the test
|
||||
function, we see that it’s annotated with `#[should_panic]`. The failure we got
|
||||
means that the code in the test function did not cause a panic.
|
||||
|
||||
Tests that use `should_panic` can be imprecise because they only indicate that
|
||||
the code has caused some panic. A `should_panic` test would pass even if the
|
||||
test panics for a different reason than the one we were expecting to happen. To
|
||||
make `should_panic` tests more precise, we can add an optional `expected`
|
||||
parameter to the `should_panic` attribute. The test harness will make sure that
|
||||
the failure message contains the provided text. For example, consider the
|
||||
modified code for `Guess` in Listing 11-9 where the `new` function panics with
|
||||
different messages depending on whether the value is too small or too large:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
# pub struct Guess {
|
||||
# value: u32,
|
||||
# }
|
||||
#
|
||||
// --snip--
|
||||
|
||||
impl Guess {
|
||||
pub fn new(value: u32) -> Guess {
|
||||
if value < 1 {
|
||||
panic!("Guess value must be greater than or equal to 1, got {}.",
|
||||
value);
|
||||
} else if value > 100 {
|
||||
panic!("Guess value must be less than or equal to 100, got {}.",
|
||||
value);
|
||||
}
|
||||
|
||||
Guess {
|
||||
value
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
#[should_panic(expected = "Guess value must be less than or equal to 100")]
|
||||
fn greater_than_100() {
|
||||
Guess::new(200);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-9: Testing that a condition will cause a
|
||||
`panic!` with a particular panic message</span>
|
||||
|
||||
This test will pass because the value we put in the `should_panic` attribute’s
|
||||
`expected` parameter is a substring of the message that the `Guess::new`
|
||||
function panics with. We could have specified the entire panic message that we
|
||||
expect, which in this case would be `Guess value must be less than or equal to
|
||||
100, got 200.` What you choose to specify in the expected parameter for
|
||||
`should_panic` depends on how much of the panic message is unique or dynamic
|
||||
and how precise you want your test to be. In this case, a substring of the
|
||||
panic message is enough to ensure that the code in the test function executes
|
||||
the `else if value > 100` case.
|
||||
|
||||
To see what happens when a `should_panic` test with an `expected` message
|
||||
fails, let’s again introduce a bug into our code by swapping the bodies of the
|
||||
`if value < 1` and the `else if value > 100` blocks:
|
||||
|
||||
```rust,ignore
|
||||
if value < 1 {
|
||||
panic!("Guess value must be less than or equal to 100, got {}.", value);
|
||||
} else if value > 100 {
|
||||
panic!("Guess value must be greater than or equal to 1, got {}.", value);
|
||||
}
|
||||
```
|
||||
|
||||
This time when we run the `should_panic` test, it will fail:
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::greater_than_100 ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
---- tests::greater_than_100 stdout ----
|
||||
thread 'tests::greater_than_100' panicked at 'Guess value must be
|
||||
greater than or equal to 1, got 200.', src/lib.rs:11:12
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
note: Panic did not include expected string 'Guess value must be less than or
|
||||
equal to 100'
|
||||
|
||||
failures:
|
||||
tests::greater_than_100
|
||||
|
||||
test result: FAILED. 0 passed; 1 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
The failure message indicates that this test did indeed panic as we expected,
|
||||
but the panic message did not include the expected string `'Guess value must be
|
||||
less than or equal to 100'`. The panic message that we did get in this case was
|
||||
`Guess value must be greater than or equal to 1, got 200.` Now we can start
|
||||
figuring out where our bug is!
|
||||
|
||||
Now that you know several ways to write tests, let’s look at what is happening
|
||||
when we run our tests and explore the different options we can use with `cargo
|
||||
test`.
|
||||
306
2018-edition/src/ch11-02-running-tests.md
Normal file
306
2018-edition/src/ch11-02-running-tests.md
Normal file
@@ -0,0 +1,306 @@
|
||||
## Controlling How Tests Are Run
|
||||
|
||||
Just as `cargo run` compiles your code and then runs the resulting binary,
|
||||
`cargo test` compiles your code in test mode and runs the resulting test
|
||||
binary. You can specify command line options to change the default behavior of
|
||||
`cargo test`. For example, the default behavior of the binary produced by
|
||||
`cargo test` is to run all the tests in parallel and capture output generated
|
||||
during test runs, preventing the output from being displayed and making it
|
||||
easier to read the output related to the test results.
|
||||
|
||||
Some command line options go to `cargo test`, and some go to the resulting test
|
||||
binary. To separate these two types of arguments, you list the arguments that
|
||||
go to `cargo test` followed by the separator `--` and then the ones that go to
|
||||
the test binary. Running `cargo test --help` displays the options you can use
|
||||
with `cargo test`, and running `cargo test -- --help` displays the options you
|
||||
can use after the separator `--`.
|
||||
|
||||
### Running Tests in Parallel or Consecutively
|
||||
|
||||
When you run multiple tests, by default they run in parallel using threads.
|
||||
This means the tests will finish running faster so you can get feedback quicker
|
||||
on whether or not your code is working. Because the tests are running at the
|
||||
same time, make sure your tests don’t depend on each other or on any shared
|
||||
state, including a shared environment, such as the current working directory or
|
||||
environment variables.
|
||||
|
||||
For example, say each of your tests runs some code that creates a file on disk
|
||||
named *test-output.txt* and writes some data to that file. Then each test reads
|
||||
the data in that file and asserts that the file contains a particular value,
|
||||
which is different in each test. Because the tests run at the same time, one
|
||||
test might overwrite the file between when another test writes and reads the
|
||||
file. The second test will then fail, not because the code is incorrect but
|
||||
because the tests have interfered with each other while running in parallel.
|
||||
One solution is to make sure each test writes to a different file; another
|
||||
solution is to run the tests one at a time.
|
||||
|
||||
If you don’t want to run the tests in parallel or if you want more fine-grained
|
||||
control over the number of threads used, you can send the `--test-threads` flag
|
||||
and the number of threads you want to use to the test binary. Take a look at
|
||||
the following example:
|
||||
|
||||
```text
|
||||
$ cargo test -- --test-threads=1
|
||||
```
|
||||
|
||||
We set the number of test threads to `1`, telling the program not to use any
|
||||
parallelism. Running the tests using one thread will take longer than running
|
||||
them in parallel, but the tests won’t interfere with each other if they share
|
||||
state.
|
||||
|
||||
### Showing Function Output
|
||||
|
||||
By default, if a test passes, Rust’s test library captures anything printed to
|
||||
standard output. For example, if we call `println!` in a test and the test
|
||||
passes, we won’t see the `println!` output in the terminal; we’ll see only the
|
||||
line that indicates the test passed. If a test fails, we’ll see whatever was
|
||||
printed to standard output with the rest of the failure message.
|
||||
|
||||
As an example, Listing 11-10 has a silly function that prints the value of its
|
||||
parameter and returns 10, as well as a test that passes and a test that fails.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
fn prints_and_returns_10(a: i32) -> i32 {
|
||||
println!("I got the value {}", a);
|
||||
10
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn this_test_will_pass() {
|
||||
let value = prints_and_returns_10(4);
|
||||
assert_eq!(10, value);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn this_test_will_fail() {
|
||||
let value = prints_and_returns_10(8);
|
||||
assert_eq!(5, value);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-10: Tests for a function that calls
|
||||
`println!`</span>
|
||||
|
||||
When we run these tests with `cargo test`, we’ll see the following output:
|
||||
|
||||
```text
|
||||
running 2 tests
|
||||
test tests::this_test_will_pass ... ok
|
||||
test tests::this_test_will_fail ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
---- tests::this_test_will_fail stdout ----
|
||||
I got the value 8
|
||||
thread 'tests::this_test_will_fail' panicked at 'assertion failed: `(left == right)`
|
||||
left: `5`,
|
||||
right: `10`', src/lib.rs:19:8
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
|
||||
failures:
|
||||
tests::this_test_will_fail
|
||||
|
||||
test result: FAILED. 1 passed; 1 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Note that nowhere in this output do we see `I got the value 4`, which is what
|
||||
is printed when the test that passes runs. That output has been captured. The
|
||||
output from the test that failed, `I got the value 8`, appears in the section
|
||||
of the test summary output, which also shows the cause of the test failure.
|
||||
|
||||
If we want to see printed values for passing tests as well, we can disable the
|
||||
output capture behavior by using the `--nocapture` flag:
|
||||
|
||||
```text
|
||||
$ cargo test -- --nocapture
|
||||
```
|
||||
|
||||
When we run the tests in Listing 11-10 again with the `--nocapture` flag, we
|
||||
see the following output:
|
||||
|
||||
```text
|
||||
running 2 tests
|
||||
I got the value 4
|
||||
I got the value 8
|
||||
test tests::this_test_will_pass ... ok
|
||||
thread 'tests::this_test_will_fail' panicked at 'assertion failed: `(left == right)`
|
||||
left: `5`,
|
||||
right: `10`', src/lib.rs:19:8
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
test tests::this_test_will_fail ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
failures:
|
||||
tests::this_test_will_fail
|
||||
|
||||
test result: FAILED. 1 passed; 1 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Note that the output for the tests and the test results are interleaved; the
|
||||
reason is that the tests are running in parallel, as we talked about in the
|
||||
previous section. Try using the `--test-threads=1` option and the `--nocapture`
|
||||
flag, and see what the output looks like then!
|
||||
|
||||
### Running a Subset of Tests by Name
|
||||
|
||||
Sometimes, running a full test suite can take a long time. If you’re working on
|
||||
code in a particular area, you might want to run only the tests pertaining to
|
||||
that code. You can choose which tests to run by passing `cargo test` the name
|
||||
or names of the test(s) you want to run as an argument.
|
||||
|
||||
To demonstrate how to run a subset of tests, we’ll create three tests for our
|
||||
`add_two` function, as shown in Listing 11-11, and choose which ones to run:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub fn add_two(a: i32) -> i32 {
|
||||
a + 2
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn add_two_and_two() {
|
||||
assert_eq!(4, add_two(2));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn add_three_and_two() {
|
||||
assert_eq!(5, add_two(3));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn one_hundred() {
|
||||
assert_eq!(102, add_two(100));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-11: Three tests with three different
|
||||
names</span>
|
||||
|
||||
If we run the tests without passing any arguments, as we saw earlier, all the
|
||||
tests will run in parallel:
|
||||
|
||||
```text
|
||||
running 3 tests
|
||||
test tests::add_two_and_two ... ok
|
||||
test tests::add_three_and_two ... ok
|
||||
test tests::one_hundred ... ok
|
||||
|
||||
test result: ok. 3 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
#### Running Single Tests
|
||||
|
||||
We can pass the name of any test function to `cargo test` to run only that test:
|
||||
|
||||
```text
|
||||
$ cargo test one_hundred
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running target/debug/deps/adder-06a75b4a1f2515e9
|
||||
|
||||
running 1 test
|
||||
test tests::one_hundred ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 2 filtered out
|
||||
```
|
||||
|
||||
Only the test with the name `one_hundred` ran; the other two tests didn’t match
|
||||
that name. The test output lets us know we had more tests than what this
|
||||
command ran by displaying `2 filtered out` at the end of the summary line.
|
||||
|
||||
We can’t specify the names of multiple tests in this way; only the first value
|
||||
given to `cargo test` will be used. But there is a way to run multiple tests.
|
||||
|
||||
#### Filtering to Run Multiple Tests
|
||||
|
||||
We can specify part of a test name, and any test whose name matches that value
|
||||
will be run. For example, because two of our tests’ names contain `add`, we can
|
||||
run those two by running `cargo test add`:
|
||||
|
||||
```text
|
||||
$ cargo test add
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running target/debug/deps/adder-06a75b4a1f2515e9
|
||||
|
||||
running 2 tests
|
||||
test tests::add_two_and_two ... ok
|
||||
test tests::add_three_and_two ... ok
|
||||
|
||||
test result: ok. 2 passed; 0 failed; 0 ignored; 0 measured; 1 filtered out
|
||||
```
|
||||
|
||||
This command ran all tests with `add` in the name and filtered out the test
|
||||
named `one_hundred`. Also note that the module in which tests appear becomes
|
||||
part of the test’s name, so we can run all the tests in a module by filtering
|
||||
on the module’s name.
|
||||
|
||||
### Ignoring Some Tests Unless Specifically Requested
|
||||
|
||||
Sometimes a few specific tests can be very time-consuming to execute, so you
|
||||
might want to exclude them during most runs of `cargo test`. Rather than
|
||||
listing as arguments all tests you do want to run, you can instead annotate the
|
||||
time-consuming tests using the `ignore` attribute to exclude them, as shown
|
||||
here:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[test]
|
||||
fn it_works() {
|
||||
assert_eq!(2 + 2, 4);
|
||||
}
|
||||
|
||||
#[test]
|
||||
#[ignore]
|
||||
fn expensive_test() {
|
||||
// code that takes an hour to run
|
||||
}
|
||||
```
|
||||
|
||||
After `#[test]` we add the `#[ignore]` line to the test we want to exclude. Now
|
||||
when we run our tests, `it_works` runs, but `expensive_test` doesn’t:
|
||||
|
||||
```text
|
||||
$ cargo test
|
||||
Compiling adder v0.1.0 (file:///projects/adder)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.24 secs
|
||||
Running target/debug/deps/adder-ce99bcc2479f4607
|
||||
|
||||
running 2 tests
|
||||
test expensive_test ... ignored
|
||||
test it_works ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 1 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
The `expensive_test` function is listed as `ignored`. If we want to run only
|
||||
the ignored tests, we can use `cargo test -- --ignored`:
|
||||
|
||||
```text
|
||||
$ cargo test -- --ignored
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running target/debug/deps/adder-ce99bcc2479f4607
|
||||
|
||||
running 1 test
|
||||
test expensive_test ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 1 filtered out
|
||||
```
|
||||
|
||||
By controlling which tests run, you can make sure your `cargo test` results
|
||||
will be fast. When you’re at a point where it makes sense to check the results
|
||||
of the `ignored` tests and you have time to wait for the results, you can run
|
||||
`cargo test -- --ignored` instead.
|
||||
324
2018-edition/src/ch11-03-test-organization.md
Normal file
324
2018-edition/src/ch11-03-test-organization.md
Normal file
@@ -0,0 +1,324 @@
|
||||
## Test Organization
|
||||
|
||||
As mentioned at the start of the chapter, testing is a complex discipline, and
|
||||
different people use different terminology and organization. The Rust community
|
||||
thinks about tests in terms of two main categories: *unit tests* and
|
||||
*integration tests*. Unit tests are small and more focused, testing one module
|
||||
in isolation at a time, and can test private interfaces. Integration tests are
|
||||
entirely external to your library and use your code in the same way any other
|
||||
external code would, using only the public interface and potentially exercising
|
||||
multiple modules per test.
|
||||
|
||||
Writing both kinds of tests is important to ensure that the pieces of your
|
||||
library are doing what you expect them to separately and together.
|
||||
|
||||
### Unit Tests
|
||||
|
||||
The purpose of unit tests is to test each unit of code in isolation from the
|
||||
rest of the code to quickly pinpoint where code is and isn’t working as
|
||||
expected. You’ll put unit tests in the *src* directory in each file with the
|
||||
code that they’re testing. The convention is to create a module named `tests`
|
||||
in each file to contain the test functions and to annotate the module with
|
||||
`cfg(test)`.
|
||||
|
||||
#### The Tests Module and `#[cfg(test)]`
|
||||
|
||||
The `#[cfg(test)]` annotation on the tests module tells Rust to compile and run
|
||||
the test code only when you run `cargo test`, not when you run `cargo build`.
|
||||
This saves compile time when you only want to build the library and saves space
|
||||
in the resulting compiled artifact because the tests are not included. You’ll
|
||||
see that because integration tests go in a different directory, they don’t need
|
||||
the `#[cfg(test)]` annotation. However, because unit tests go in the same files
|
||||
as the code, you’ll use `#[cfg(test)]` to specify that they shouldn’t be
|
||||
included in the compiled result.
|
||||
|
||||
Recall that when we generated the new `adder` project in the first section of
|
||||
this chapter, Cargo generated this code for us:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
#[test]
|
||||
fn it_works() {
|
||||
assert_eq!(2 + 2, 4);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
This code is the automatically generated test module. The attribute `cfg`
|
||||
stands for *configuration* and tells Rust that the following item should only
|
||||
be included given a certain configuration option. In this case, the
|
||||
configuration option is `test`, which is provided by Rust for compiling and
|
||||
running tests. By using the `cfg` attribute, Cargo compiles our test code only
|
||||
if we actively run the tests with `cargo test`. This includes any helper
|
||||
functions that might be within this module, in addition to the functions
|
||||
annotated with `#[test]`.
|
||||
|
||||
#### Testing Private Functions
|
||||
|
||||
There’s debate within the testing community about whether or not private
|
||||
functions should be tested directly, and other languages make it difficult or
|
||||
impossible to test private functions. Regardless of which testing ideology you
|
||||
adhere to, Rust’s privacy rules do allow you to test private functions.
|
||||
Consider the code in Listing 11-12 with the private function `internal_adder`:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub fn add_two(a: i32) -> i32 {
|
||||
internal_adder(a, 2)
|
||||
}
|
||||
|
||||
fn internal_adder(a: i32, b: i32) -> i32 {
|
||||
a + b
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn internal() {
|
||||
assert_eq!(4, internal_adder(2, 2));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-12: Testing a private function</span>
|
||||
|
||||
Note that the `internal_adder` function is not marked as `pub`, but because
|
||||
tests are just Rust code and the `tests` module is just another module, you can
|
||||
import and call `internal_adder` in a test just fine. If you don’t think
|
||||
private functions should be tested, there’s nothing in Rust that will compel
|
||||
you to do so.
|
||||
|
||||
### Integration Tests
|
||||
|
||||
In Rust, integration tests are entirely external to your library. They use your
|
||||
library in the same way any other code would, which means they can only call
|
||||
functions that are part of your library’s public API. Their purpose is to test
|
||||
whether many parts of your library work together correctly. Units of code that
|
||||
work correctly on their own could have problems when integrated, so test
|
||||
coverage of the integrated code is important as well. To create integration
|
||||
tests, you first need a *tests* directory.
|
||||
|
||||
#### The *tests* Directory
|
||||
|
||||
We create a *tests* directory at the top level of our project directory, next
|
||||
to *src*. Cargo knows to look for integration test files in this directory. We
|
||||
can then make as many test files as we want to in this directory, and Cargo
|
||||
will compile each of the files as an individual crate.
|
||||
|
||||
Let’s create an integration test. With the code in Listing 11-12 still in the
|
||||
*src/lib.rs* file, make a *tests* directory, create a new file named
|
||||
*tests/integration_test.rs*, and enter the code in Listing 11-13:
|
||||
|
||||
<span class="filename">Filename: tests/integration_test.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate adder;
|
||||
|
||||
#[test]
|
||||
fn it_adds_two() {
|
||||
assert_eq!(4, adder::add_two(2));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 11-13: An integration test of a function in the
|
||||
`adder` crate</span>
|
||||
|
||||
We’ve added `extern crate adder` at the top of the code, which we didn’t need
|
||||
in the unit tests. The reason is that each test in the `tests` directory is a
|
||||
separate crate, so we need to import our library into each of them.
|
||||
|
||||
We don’t need to annotate any code in *tests/integration_test.rs* with
|
||||
`#[cfg(test)]`. Cargo treats the `tests` directory specially and compiles files
|
||||
in this directory only when we run `cargo test`. Run `cargo test` now:
|
||||
|
||||
```text
|
||||
$ cargo test
|
||||
Compiling adder v0.1.0 (file:///projects/adder)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.31 secs
|
||||
Running target/debug/deps/adder-abcabcabc
|
||||
|
||||
running 1 test
|
||||
test tests::internal ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Running target/debug/deps/integration_test-ce99bcc2479f4607
|
||||
|
||||
running 1 test
|
||||
test it_adds_two ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Doc-tests adder
|
||||
|
||||
running 0 tests
|
||||
|
||||
test result: ok. 0 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
The three sections of output include the unit tests, the integration test, and
|
||||
the doc tests. The first section for the unit tests is the same as we’ve been
|
||||
seeing: one line for each unit test (one named `internal` that we added in
|
||||
Listing 11-12) and then a summary line for the unit tests.
|
||||
|
||||
The integration tests section starts with the line `Running
|
||||
target/debug/deps/integration-test-ce99bcc2479f4607` (the hash at the end of
|
||||
your output will be different). Next, there is a line for each test function in
|
||||
that integration test and a summary line for the results of the integration
|
||||
test just before the `Doc-tests adder` section starts.
|
||||
|
||||
Similarly to how adding more unit test functions adds more result lines to the
|
||||
unit tests section, adding more test functions to the integration test file
|
||||
adds more result lines to this integration test file’s section. Each
|
||||
integration test file has its own section, so if we add more files in the
|
||||
*tests* directory, there will be more integration test sections.
|
||||
|
||||
We can still run a particular integration test function by specifying the test
|
||||
function’s name as an argument to `cargo test`. To run all the tests in a
|
||||
particular integration test file, use the `--test` argument of `cargo test`
|
||||
followed by the name of the file:
|
||||
|
||||
```text
|
||||
$ cargo test --test integration_test
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running target/debug/integration_test-952a27e0126bb565
|
||||
|
||||
running 1 test
|
||||
test it_adds_two ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
This command runs only the tests in the *tests/integration_test.rs* file.
|
||||
|
||||
#### Submodules in Integration Tests
|
||||
|
||||
As you add more integration tests, you might want to make more than one file in
|
||||
the *tests* directory to help organize them; for example, you can group the
|
||||
test functions by the functionality they’re testing. As mentioned earlier, each
|
||||
file in the *tests* directory is compiled as its own separate crate.
|
||||
|
||||
Treating each integration test file as its own crate is useful to create
|
||||
separate scopes that are more like the way end users will be using your crate.
|
||||
However, this means files in the *tests* directory don’t share the same
|
||||
behavior as files in *src* do, as you learned in Chapter 7 regarding how to
|
||||
separate code into modules and files.
|
||||
|
||||
The different behavior of files in the *tests* directory is most noticeable
|
||||
when you have a set of helper functions that would be useful in multiple
|
||||
integration test files and you try to follow the steps in the “Moving Modules
|
||||
to Other Files” section of Chapter 7 to extract them into a common module. For
|
||||
example, if we create *tests/common.rs* and place a function named `setup` in
|
||||
it, we can add some code to `setup` that we want to call from multiple test
|
||||
functions in multiple test files:
|
||||
|
||||
<span class="filename">Filename: tests/common.rs</span>
|
||||
|
||||
```rust
|
||||
pub fn setup() {
|
||||
// setup code specific to your library's tests would go here
|
||||
}
|
||||
```
|
||||
|
||||
When we run the tests again, we’ll see a new section in the test output for the
|
||||
*common.rs* file, even though this file doesn’t contain any test functions nor
|
||||
did we call the `setup` function from anywhere:
|
||||
|
||||
```text
|
||||
running 1 test
|
||||
test tests::internal ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Running target/debug/deps/common-b8b07b6f1be2db70
|
||||
|
||||
running 0 tests
|
||||
|
||||
test result: ok. 0 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Running target/debug/deps/integration_test-d993c68b431d39df
|
||||
|
||||
running 1 test
|
||||
test it_adds_two ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Doc-tests adder
|
||||
|
||||
running 0 tests
|
||||
|
||||
test result: ok. 0 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Having `common` appear in the test results with `running 0 tests` displayed for
|
||||
it is not what we wanted. We just wanted to share some code with the other
|
||||
integration test files.
|
||||
|
||||
To avoid having `common` appear in the test output, instead of creating
|
||||
*tests/common.rs*, we’ll create *tests/common/mod.rs*. In the “Rules of Module
|
||||
Filesystems” section of Chapter 7, we used the naming convention
|
||||
*module_name/mod.rs* for files of modules that have submodules. We don’t have
|
||||
submodules for `common` here, but naming the file this way tells Rust not to
|
||||
treat the `common` module as an integration test file. When we move the `setup`
|
||||
function code into *tests/common/mod.rs* and delete the *tests/common.rs* file,
|
||||
the section in the test output will no longer appear. Files in subdirectories
|
||||
of the *tests* directory don’t get compiled as separate crates or have sections
|
||||
in the test output.
|
||||
|
||||
After we’ve created *tests/common/mod.rs*, we can use it from any of the
|
||||
integration test files as a module. Here’s an example of calling the `setup`
|
||||
function from the `it_adds_two` test in *tests/integration_test.rs*:
|
||||
|
||||
<span class="filename">Filename: tests/integration_test.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate adder;
|
||||
|
||||
mod common;
|
||||
|
||||
#[test]
|
||||
fn it_adds_two() {
|
||||
common::setup();
|
||||
assert_eq!(4, adder::add_two(2));
|
||||
}
|
||||
```
|
||||
|
||||
Note that the `mod common;` declaration is the same as the module declarations
|
||||
we demonstrated in Listing 7-4. Then in the test function, we can call the
|
||||
`common::setup()` function.
|
||||
|
||||
#### Integration Tests for Binary Crates
|
||||
|
||||
If our project is a binary crate that only contains a *src/main.rs* file and
|
||||
doesn’t have a *src/lib.rs* file, we can’t create integration tests in the
|
||||
*tests* directory and use `extern crate` to import functions defined in the
|
||||
*src/main.rs* file. Only library crates expose functions that other crates can
|
||||
call and use; binary crates are meant to be run on their own.
|
||||
|
||||
This is one of the reasons Rust projects that provide a binary have a
|
||||
straightforward *src/main.rs* file that calls logic that lives in the
|
||||
*src/lib.rs* file. Using that structure, integration tests *can* test the
|
||||
library crate by using `extern crate` to exercise the important functionality.
|
||||
If the important functionality works, the small amount of code in the
|
||||
*src/main.rs* file will work as well, and that small amount of code doesn’t
|
||||
need to be tested.
|
||||
|
||||
## Summary
|
||||
|
||||
Rust’s testing features provide a way to specify how code should function to
|
||||
ensure it continues to work as you expect, even as you make changes. Unit tests
|
||||
exercise different parts of a library separately and can test private
|
||||
implementation details. Integration tests check that many parts of the library
|
||||
work together correctly, and they use the library’s public API to test the code
|
||||
in the same way external code will use it. Even though Rust’s type system and
|
||||
ownership rules help prevent some kinds of bugs, tests are still important to
|
||||
reduce logic bugs having to do with how your code is expected to behave.
|
||||
|
||||
Let’s combine the knowledge you learned in this chapter and in previous
|
||||
chapters to work on a project!
|
||||
38
2018-edition/src/ch12-00-an-io-project.md
Normal file
38
2018-edition/src/ch12-00-an-io-project.md
Normal file
@@ -0,0 +1,38 @@
|
||||
# An I/O Project: Building a Command Line Program
|
||||
|
||||
This chapter is a recap of the many skills you’ve learned so far and an
|
||||
exploration of a few more standard library features. We’ll build a command line
|
||||
tool that interacts with file and command line input/output to practice some of
|
||||
the Rust concepts you now have under your belt.
|
||||
|
||||
Rust’s speed, safety, single binary output, and cross-platform support make it
|
||||
an ideal language for creating command line tools, so for our project, we’ll
|
||||
make our own version of the classic command line tool `grep` (**g**lobally
|
||||
search a **r**egular **e**xpression and **p**rint). In the simplest use case,
|
||||
`grep` searches a specified file for a specified string. To do so, `grep` takes
|
||||
as its arguments a filename and a string. Then it reads the file, finds lines
|
||||
in that file that contain the string argument, and prints those lines.
|
||||
|
||||
Along the way, we’ll show how to make our command line tool use features of the
|
||||
terminal that many command line tools use. We’ll read the value of an
|
||||
environment variable to allow the user to configure the behavior of our tool.
|
||||
We’ll also print to the standard error console stream (`stderr`) instead of
|
||||
standard output (`stdout`), so, for example, the user can redirect successful
|
||||
output to a file while still seeing error messages onscreen.
|
||||
|
||||
One Rust community member, Andrew Gallant, has already created a fully
|
||||
featured, very fast version of `grep`, called `ripgrep`. By comparison, our
|
||||
version of `grep` will be fairly simple, but this chapter will give you some of
|
||||
the background knowledge you need to understand a real-world project such as
|
||||
`ripgrep`.
|
||||
|
||||
Our `grep` project will combine a number of concepts you’ve learned so far:
|
||||
|
||||
* Organizing code (using what you learned in modules, Chapter 7)
|
||||
* Using vectors and strings (collections, Chapter 8)
|
||||
* Handling errors (Chapter 9)
|
||||
* Using traits and lifetimes where appropriate (Chapter 10)
|
||||
* Writing tests (Chapter 11)
|
||||
|
||||
We’ll also briefly introduce closures, iterators, and trait objects, which
|
||||
Chapters 13 and 17 will cover in detail.
|
||||
153
2018-edition/src/ch12-01-accepting-command-line-arguments.md
Normal file
153
2018-edition/src/ch12-01-accepting-command-line-arguments.md
Normal file
@@ -0,0 +1,153 @@
|
||||
## Accepting Command Line Arguments
|
||||
|
||||
Let’s create a new project with, as always, `cargo new`. We’ll call our project
|
||||
`minigrep` to distinguish it from the `grep` tool that you might already have
|
||||
on your system.
|
||||
|
||||
```text
|
||||
$ cargo new --bin minigrep
|
||||
Created binary (application) `minigrep` project
|
||||
$ cd minigrep
|
||||
```
|
||||
|
||||
The first task is to make `minigrep` accept its two command line arguments: the
|
||||
filename and a string to search for. That is, we want to be able to run our
|
||||
program with `cargo run`, a string to search for, and a path to a file to
|
||||
search in, like so:
|
||||
|
||||
```text
|
||||
$ cargo run searchstring example-filename.txt
|
||||
```
|
||||
|
||||
Right now, the program generated by `cargo new` cannot process arguments we
|
||||
give it. Some existing libraries on [Crates.io](https://crates.io/) can help
|
||||
with writing a program that accepts command line arguments, but because you’re
|
||||
just learning this concept, let’s implement this capability ourselves.
|
||||
|
||||
### Reading the Argument Values
|
||||
|
||||
To enable `minigrep` to read the values of command line arguments we pass to
|
||||
it, we’ll need a function provided in Rust’s standard library, which is
|
||||
`std::env::args`. This function returns an *iterator* of the command line
|
||||
arguments that were given to `minigrep`. We haven’t discussed iterators yet
|
||||
(we’ll cover them fully in Chapter 13), but for now, you only need to know two
|
||||
details about iterators: iterators produce a series of values, and we can call
|
||||
the `collect` method on an iterator to turn it into a collection, such as a
|
||||
vector, containing all the elements the iterator produces.
|
||||
|
||||
Use the code in Listing 12-1 to allow your `minigrep` program to read any
|
||||
command line arguments passed to it and then collect the values into a vector:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::env;
|
||||
|
||||
fn main() {
|
||||
let args: Vec<String> = env::args().collect();
|
||||
println!("{:?}", args);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-1: Collecting the command line arguments into
|
||||
a vector and printing them</span>
|
||||
|
||||
First, we bring the `std::env` module into scope with a `use` statement so we
|
||||
can use its `args` function. Notice that the `std::env::args` function is
|
||||
nested in two levels of modules. As we discussed in Chapter 7, in cases where
|
||||
the desired function is nested in more than one module, it’s conventional to
|
||||
bring the parent module into scope rather than the function. By doing so, we
|
||||
can easily use other functions from `std::env`. It’s also less ambiguous than
|
||||
adding `use std::env::args` and then calling the function with just `args`,
|
||||
because `args` might easily be mistaken for a function that’s defined in the
|
||||
current module.
|
||||
|
||||
> ### The `args` Function and Invalid Unicode
|
||||
>
|
||||
> Note that `std::env::args` will panic if any argument contains invalid
|
||||
> Unicode. If your program needs to accept arguments containing invalid
|
||||
> Unicode, use `std::env::args_os` instead. That function returns an iterator
|
||||
> that produces `OsString` values instead of `String` values. We’ve chosen to
|
||||
> use `std::env::args` here for simplicity, because `OsString` values differ
|
||||
> per platform and are more complex to work with than `String` values.
|
||||
|
||||
On the first line of `main`, we call `env::args`, and we immediately use
|
||||
`collect` to turn the iterator into a vector containing all the values produced
|
||||
by the iterator. We can use the `collect` function to create many kinds of
|
||||
collections, so we explicitly annotate the type of `args` to specify that we
|
||||
want a vector of strings. Although we very rarely need to annotate types in
|
||||
Rust, `collect` is one function you do often need to annotate because Rust
|
||||
isn’t able to infer the kind of collection you want.
|
||||
|
||||
Finally, we print the vector using the debug formatter, `:?`. Let’s try running
|
||||
the code first with no arguments and then with two arguments:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
--snip--
|
||||
["target/debug/minigrep"]
|
||||
|
||||
$ cargo run needle haystack
|
||||
--snip--
|
||||
["target/debug/minigrep", "needle", "haystack"]
|
||||
```
|
||||
|
||||
Notice that the first value in the vector is `"target/debug/minigrep"`, which
|
||||
is the name of our binary. This matches the behavior of the arguments list in
|
||||
C, letting programs use the name by which they were invoked in their execution.
|
||||
It’s often convenient to have access to the program name in case you want to
|
||||
print it in messages or change behavior of the program based on what command
|
||||
line alias was used to invoke the program. But for the purposes of this
|
||||
chapter, we’ll ignore it and save only the two arguments we need.
|
||||
|
||||
### Saving the Argument Values in Variables
|
||||
|
||||
Printing the value of the vector of arguments illustrated that the program is
|
||||
able to access the values specified as command line arguments. Now we need to
|
||||
save the values of the two arguments in variables so we can use the values
|
||||
throughout the rest of the program. We do that in Listing 12-2:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
use std::env;
|
||||
|
||||
fn main() {
|
||||
let args: Vec<String> = env::args().collect();
|
||||
|
||||
let query = &args[1];
|
||||
let filename = &args[2];
|
||||
|
||||
println!("Searching for {}", query);
|
||||
println!("In file {}", filename);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-2: Creating variables to hold the query
|
||||
argument and filename argument</span>
|
||||
|
||||
As we saw when we printed the vector, the program’s name takes up the first
|
||||
value in the vector at `args[0]`, so we’re starting at index `1`. The first
|
||||
argument `minigrep` takes is the string we’re searching for, so we put a
|
||||
reference to the first argument in the variable `query`. The second argument
|
||||
will be the filename, so we put a reference to the second argument in the
|
||||
variable `filename`.
|
||||
|
||||
We temporarily print the values of these variables to prove that the code is
|
||||
working as we intend. Let’s run this program again with the arguments `test`
|
||||
and `sample.txt`:
|
||||
|
||||
```text
|
||||
$ cargo run test sample.txt
|
||||
Compiling minigrep v0.1.0 (file:///projects/minigrep)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/minigrep test sample.txt`
|
||||
Searching for test
|
||||
In file sample.txt
|
||||
```
|
||||
|
||||
Great, the program is working! The values of the arguments we need are being
|
||||
saved into the right variables. Later we’ll add some error handling to deal
|
||||
with certain potential erroneous situations, such as when the user provides no
|
||||
arguments; for now, we’ll ignore that situation and work on adding file-reading
|
||||
capabilities instead.
|
||||
111
2018-edition/src/ch12-02-reading-a-file.md
Normal file
111
2018-edition/src/ch12-02-reading-a-file.md
Normal file
@@ -0,0 +1,111 @@
|
||||
## Reading a File
|
||||
|
||||
Now we’ll add functionality to read the file that is specified in the
|
||||
`filename` command line argument. First, we need a sample file to test it with:
|
||||
the best kind of file to use to make sure `minigrep` is working is one with a
|
||||
small amount of text over multiple lines with some repeated words. Listing 12-3
|
||||
has an Emily Dickinson poem that will work well! Create a file called
|
||||
*poem.txt* at the root level of your project, and enter the poem “I’m Nobody!
|
||||
Who are you?”
|
||||
|
||||
<span class="filename">Filename: poem.txt</span>
|
||||
|
||||
```text
|
||||
I’m nobody! Who are you?
|
||||
Are you nobody, too?
|
||||
Then there’s a pair of us — don’t tell!
|
||||
They’d banish us, you know.
|
||||
|
||||
How dreary to be somebody!
|
||||
How public, like a frog
|
||||
To tell your name the livelong day
|
||||
To an admiring bog!
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-3: A poem by Emily Dickinson makes a good test
|
||||
case</span>
|
||||
|
||||
With the text in place, edit *src/main.rs* and add code to open the file, as
|
||||
shown in Listing 12-4:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
use std::env;
|
||||
use std::fs::File;
|
||||
use std::io::prelude::*;
|
||||
|
||||
fn main() {
|
||||
# let args: Vec<String> = env::args().collect();
|
||||
#
|
||||
# let query = &args[1];
|
||||
# let filename = &args[2];
|
||||
#
|
||||
# println!("Searching for {}", query);
|
||||
// --snip--
|
||||
println!("In file {}", filename);
|
||||
|
||||
let mut f = File::open(filename).expect("file not found");
|
||||
|
||||
let mut contents = String::new();
|
||||
f.read_to_string(&mut contents)
|
||||
.expect("something went wrong reading the file");
|
||||
|
||||
println!("With text:\n{}", contents);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-4: Reading the contents of the file specified
|
||||
by the second argument</span>
|
||||
|
||||
First, we add some more `use` statements to bring in relevant parts of the
|
||||
standard library: we need `std::fs::File` to handle files, and
|
||||
`std::io::prelude::*` contains various useful traits for doing I/O, including
|
||||
file I/O. In the same way that Rust has a general prelude that brings certain
|
||||
types and functions into scope automatically, the `std::io` module has its own
|
||||
prelude of common types and functions you’ll need when working with I/O. Unlike
|
||||
with the default prelude, we must explicitly add a `use` statement for the
|
||||
prelude from `std::io`.
|
||||
|
||||
In `main`, we’ve added three statements: first, we get a mutable handle to the
|
||||
file by calling the `File::open` function and passing it the value of the
|
||||
`filename` variable. Second, we create a variable called `contents` and set it
|
||||
to a mutable, empty `String`. This will hold the content of the file after we
|
||||
read it in. Third, we call `read_to_string` on our file handle and pass a
|
||||
mutable reference to `contents` as an argument.
|
||||
|
||||
After those lines, we’ve again added a temporary `println!` statement that
|
||||
prints the value of `contents` after the file is read, so we can check that the
|
||||
program is working so far.
|
||||
|
||||
Let’s run this code with any string as the first command line argument (because
|
||||
we haven’t implemented the searching part yet) and the *poem.txt* file as the
|
||||
second argument:
|
||||
|
||||
```text
|
||||
$ cargo run the poem.txt
|
||||
Compiling minigrep v0.1.0 (file:///projects/minigrep)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/minigrep the poem.txt`
|
||||
Searching for the
|
||||
In file poem.txt
|
||||
With text:
|
||||
I’m nobody! Who are you?
|
||||
Are you nobody, too?
|
||||
Then there’s a pair of us — don’t tell!
|
||||
They’d banish us, you know.
|
||||
|
||||
How dreary to be somebody!
|
||||
How public, like a frog
|
||||
To tell your name the livelong day
|
||||
To an admiring bog!
|
||||
```
|
||||
|
||||
Great! The code read and then printed the contents of the file. But the code
|
||||
has a few flaws. The `main` function has multiple responsibilities: generally,
|
||||
functions are clearer and easier to maintain if each function is responsible
|
||||
for only one idea. The other problem is that we’re not handling errors as well
|
||||
as we could. The program is still small, so these flaws aren’t a big problem,
|
||||
but as the program grows, it will be harder to fix them cleanly. It’s good
|
||||
practice to begin refactoring early on when developing a program, because it’s
|
||||
much easier to refactor smaller amounts of code. We’ll do that next.
|
||||
@@ -0,0 +1,676 @@
|
||||
## Refactoring to Improve Modularity and Error Handling
|
||||
|
||||
To improve our program, we’ll fix four problems that have to do with the
|
||||
program’s structure and how it’s handling potential errors.
|
||||
|
||||
First, our `main` function now performs two tasks: it parses arguments and
|
||||
opens files. For such a small function, this isn’t a major problem. However, if
|
||||
we continue to grow our program inside `main`, the number of separate tasks the
|
||||
`main` function handles will increase. As a function gains responsibilities, it
|
||||
becomes more difficult to reason about, harder to test, and harder to change
|
||||
without breaking one of its parts. It’s best to separate functionality so each
|
||||
function is responsible for one task.
|
||||
|
||||
This issue also ties into the second problem: although `query` and `filename`
|
||||
are configuration variables to our program, variables like `f` and `contents`
|
||||
are used to perform the program’s logic. The longer `main` becomes, the more
|
||||
variables we’ll need to bring into scope; the more variables we have in scope,
|
||||
the harder it will be to keep track of the purpose of each. It’s best to group
|
||||
the configuration variables into one structure to make their purpose clear.
|
||||
|
||||
The third problem is that we’ve used `expect` to print an error message when
|
||||
opening the file fails, but the error message just prints `file not found`.
|
||||
Opening a file can fail in a number of ways besides the file being missing: for
|
||||
example, the file might exist, but we might not have permission to open it.
|
||||
Right now, if we’re in that situation, we’d print the `file not found` error
|
||||
message, which would give the user the wrong information!
|
||||
|
||||
Fourth, we use `expect` repeatedly to handle different errors, and if the user
|
||||
runs our program without specifying enough arguments, they’ll get an `index out
|
||||
of bounds` error from Rust that doesn’t clearly explain the problem. It would
|
||||
be best if all the error-handling code were in one place so future maintainers
|
||||
had only one place to consult in the code if the error-handling logic needed to
|
||||
change. Having all the error-handling code in one place will also ensure that
|
||||
we’re printing messages that will be meaningful to our end users.
|
||||
|
||||
Let’s address these four problems by refactoring our project.
|
||||
|
||||
### Separation of Concerns for Binary Projects
|
||||
|
||||
The organizational problem of allocating responsibility for multiple tasks to
|
||||
the `main` function is common to many binary projects. As a result, the Rust
|
||||
community has developed a process to use as a guideline for splitting the
|
||||
separate concerns of a binary program when `main` starts getting large. The
|
||||
process has the following steps:
|
||||
|
||||
* Split your program into a *main.rs* and a *lib.rs* and move your program’s
|
||||
logic to *lib.rs*.
|
||||
* As long as your command line parsing logic is small, it can remain in
|
||||
*main.rs*.
|
||||
* When the command line parsing logic starts getting complicated, extract it
|
||||
from *main.rs* and move it to *lib.rs*.
|
||||
* The responsibilities that remain in the `main` function after this process
|
||||
should be limited to the following:
|
||||
|
||||
* Calling the command line parsing logic with the argument values
|
||||
* Setting up any other configuration
|
||||
* Calling a `run` function in *lib.rs*
|
||||
* Handling the error if `run` returns an error
|
||||
|
||||
This pattern is about separating concerns: *main.rs* handles running the
|
||||
program, and *lib.rs* handles all the logic of the task at hand. Because you
|
||||
can’t test the `main` function directly, this structure lets you test all of
|
||||
your program’s logic by moving it into functions in *lib.rs*. The only code
|
||||
that remains in *main.rs* will be small enough to verify its correctness by
|
||||
reading it. Let’s rework our program by following this process.
|
||||
|
||||
#### Extracting the Argument Parser
|
||||
|
||||
We’ll extract the functionality for parsing arguments into a function that
|
||||
`main` will call to prepare for moving the command line parsing logic to
|
||||
*src/lib.rs*. Listing 12-5 shows the new start of `main` that calls a new
|
||||
function `parse_config`, which we’ll define in *src/main.rs* for the moment.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let args: Vec<String> = env::args().collect();
|
||||
|
||||
let (query, filename) = parse_config(&args);
|
||||
|
||||
// --snip--
|
||||
}
|
||||
|
||||
fn parse_config(args: &[String]) -> (&str, &str) {
|
||||
let query = &args[1];
|
||||
let filename = &args[2];
|
||||
|
||||
(query, filename)
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-5: Extracting a `parse_config` function from
|
||||
`main`</span>
|
||||
|
||||
We’re still collecting the command line arguments into a vector, but instead of
|
||||
assigning the argument value at index `1` to the variable `query` and the
|
||||
argument value at index `2` to the variable `filename` within the `main`
|
||||
function, we pass the whole vector to the `parse_config` function. The
|
||||
`parse_config` function then holds the logic that determines which argument
|
||||
goes in which variable and passes the values back to `main`. We still create
|
||||
the `query` and `filename` variables in `main`, but `main` no longer has the
|
||||
responsibility of determining how the command line arguments and variables
|
||||
correspond.
|
||||
|
||||
This rework may seem like overkill for our small program, but we’re refactoring
|
||||
in small, incremental steps. After making this change, run the program again to
|
||||
verify that the argument parsing still works. It’s good to check your progress
|
||||
often, to help identify the cause of problems when they occur.
|
||||
|
||||
#### Grouping Configuration Values
|
||||
|
||||
We can take another small step to improve the `parse_config` function further.
|
||||
At the moment, we’re returning a tuple, but then we immediately break that
|
||||
tuple into individual parts again. This is a sign that perhaps we don’t have
|
||||
the right abstraction yet.
|
||||
|
||||
Another indicator that shows there’s room for improvement is the `config` part
|
||||
of `parse_config`, which implies that the two values we return are related and
|
||||
are both part of one configuration value. We’re not currently conveying this
|
||||
meaning in the structure of the data other than by grouping the two values into
|
||||
a tuple; we could put the two values into one struct and give each of the
|
||||
struct fields a meaningful name. Doing so will make it easier for future
|
||||
maintainers of this code to understand how the different values relate to each
|
||||
other and what their purpose is.
|
||||
|
||||
> Note: Some people call this anti-pattern of using primitive values when a
|
||||
> complex type would be more appropriate *primitive obsession*.
|
||||
|
||||
Listing 12-6 shows the addition of a struct named `Config` defined to have
|
||||
fields named `query` and `filename`. We’ve also changed the `parse_config`
|
||||
function to return an instance of the `Config` struct and updated `main` to use
|
||||
the struct fields rather than having separate variables:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
# use std::env;
|
||||
# use std::fs::File;
|
||||
#
|
||||
fn main() {
|
||||
let args: Vec<String> = env::args().collect();
|
||||
|
||||
let config = parse_config(&args);
|
||||
|
||||
println!("Searching for {}", config.query);
|
||||
println!("In file {}", config.filename);
|
||||
|
||||
let mut f = File::open(config.filename).expect("file not found");
|
||||
|
||||
// --snip--
|
||||
}
|
||||
|
||||
struct Config {
|
||||
query: String,
|
||||
filename: String,
|
||||
}
|
||||
|
||||
fn parse_config(args: &[String]) -> Config {
|
||||
let query = args[1].clone();
|
||||
let filename = args[2].clone();
|
||||
|
||||
Config { query, filename }
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-6: Refactoring `parse_config` to return an
|
||||
instance of a `Config` struct</span>
|
||||
|
||||
The signature of `parse_config` now indicates that it returns a `Config` value.
|
||||
In the body of `parse_config`, where we used to return string slices that
|
||||
reference `String` values in `args`, we now define `Config` to contain owned
|
||||
`String` values. The `args` variable in `main` is the owner of the argument
|
||||
values and is only letting the `parse_config` function borrow them, which means
|
||||
we’d violate Rust’s borrowing rules if `Config` tried to take ownership of the
|
||||
values in `args`.
|
||||
|
||||
We could manage the `String` data in a number of different ways, but the
|
||||
easiest, though somewhat inefficient, route is to call the `clone` method on
|
||||
the values. This will make a full copy of the data for the `Config` instance to
|
||||
own, which takes more time and memory than storing a reference to the string
|
||||
data. However, cloning the data also makes our code very straightforward
|
||||
because we don’t have to manage the lifetimes of the references; in this
|
||||
circumstance, giving up a little performance to gain simplicity is a worthwhile
|
||||
trade-off.
|
||||
|
||||
> ### The Trade-Offs of Using `clone`
|
||||
>
|
||||
> There’s a tendency among many Rustaceans to avoid using `clone` to fix
|
||||
> ownership problems because of its runtime cost. In Chapter 13, you’ll learn
|
||||
> how to use more efficient methods in this type of situation. But for now,
|
||||
> it’s okay to copy a few strings to continue making progress because you’ll
|
||||
> make these copies only once and your filename and query string are very
|
||||
> small. It’s better to have a working program that’s a bit inefficient than to
|
||||
> try to hyperoptimize code on your first pass. As you become more experienced
|
||||
> with Rust, it’ll be easier to start with the most efficient solution, but for
|
||||
> now, it’s perfectly acceptable to call `clone`.
|
||||
|
||||
We’ve updated `main` so it places the instance of `Config` returned by
|
||||
`parse_config` into a variable named `config`, and we updated the code that
|
||||
previously used the separate `query` and `filename` variables so it now uses
|
||||
the fields on the `Config` struct instead.
|
||||
|
||||
Now our code more clearly conveys that `query` and `filename` are related and
|
||||
that their purpose is to configure how the program will work. Any code that
|
||||
uses these values knows to find them in the `config` instance in the fields
|
||||
named for their purpose.
|
||||
|
||||
#### Creating a Constructor for `Config`
|
||||
|
||||
So far, we’ve extracted the logic responsible for parsing the command line
|
||||
arguments from `main` and placed it in the `parse_config` function. Doing so
|
||||
helped us to see that the `query` and `filename` values were related and that
|
||||
relationship should be conveyed in our code. We then added a `Config` struct to
|
||||
name the related purpose of `query` and `filename` and to be able to return the
|
||||
values’ names as struct field names from the `parse_config` function.
|
||||
|
||||
So now that the purpose of the `parse_config` function is to create a `Config`
|
||||
instance, we can change `parse_config` from a plain function to a function
|
||||
named `new` that is associated with the `Config` struct. Making this change
|
||||
will make the code more idiomatic. We can create instances of types in the
|
||||
standard library, such as `String`, by calling `String::new`. Similarly, by
|
||||
changing `parse_config` into a `new` function associated with `Config`, we’ll
|
||||
be able to create instances of `Config` by calling `Config::new`. Listing 12-7
|
||||
shows the changes we need to make:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,should_panic
|
||||
# use std::env;
|
||||
#
|
||||
fn main() {
|
||||
let args: Vec<String> = env::args().collect();
|
||||
|
||||
let config = Config::new(&args);
|
||||
|
||||
// --snip--
|
||||
}
|
||||
|
||||
# struct Config {
|
||||
# query: String,
|
||||
# filename: String,
|
||||
# }
|
||||
#
|
||||
// --snip--
|
||||
|
||||
impl Config {
|
||||
fn new(args: &[String]) -> Config {
|
||||
let query = args[1].clone();
|
||||
let filename = args[2].clone();
|
||||
|
||||
Config { query, filename }
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-7: Changing `parse_config` into
|
||||
`Config::new`</span>
|
||||
|
||||
We’ve updated `main` where we were calling `parse_config` to instead call
|
||||
`Config::new`. We’ve changed the name of `parse_config` to `new` and moved it
|
||||
within an `impl` block, which associates the `new` function with `Config`. Try
|
||||
compiling this code again to make sure it works.
|
||||
|
||||
### Fixing the Error Handling
|
||||
|
||||
Now we’ll work on fixing our error handling. Recall that attempting to access
|
||||
the values in the `args` vector at index `1` or index `2` will cause the
|
||||
program to panic if the vector contains fewer than three items. Try running the
|
||||
program without any arguments; it will look like this:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling minigrep v0.1.0 (file:///projects/minigrep)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/minigrep`
|
||||
thread 'main' panicked at 'index out of bounds: the len is 1
|
||||
but the index is 1', src/main.rs:29:21
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
```
|
||||
|
||||
The line `index out of bounds: the len is 1 but the index is 1` is an error
|
||||
message intended for programmers. It won’t help our end users understand what
|
||||
happened and what they should do instead. Let’s fix that now.
|
||||
|
||||
#### Improving the Error Message
|
||||
|
||||
In Listing 12-8, we add a check in the `new` function that will verify that the
|
||||
slice is long enough before accessing index `1` and `2`. If the slice isn’t
|
||||
long enough, the program panics and displays a better error message than the
|
||||
`index out of bounds` message.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
// --snip--
|
||||
fn new(args: &[String]) -> Config {
|
||||
if args.len() < 3 {
|
||||
panic!("not enough arguments");
|
||||
}
|
||||
// --snip--
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-8: Adding a check for the number of
|
||||
arguments</span>
|
||||
|
||||
This code is similar to the `Guess::new` function we wrote in Listing 9-9, where
|
||||
we called `panic!` when the `value` argument was out of the range of valid
|
||||
values. Instead of checking for a range of values here, we’re checking that the
|
||||
length of `args` is at least `3` and the rest of the function can operate under
|
||||
the assumption that this condition has been met. If `args` has fewer than three
|
||||
items, this condition will be true, and we call the `panic!` macro to end the
|
||||
program immediately.
|
||||
|
||||
With these extra few lines of code in `new`, let’s run the program without any
|
||||
arguments again to see what the error looks like now:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling minigrep v0.1.0 (file:///projects/minigrep)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/minigrep`
|
||||
thread 'main' panicked at 'not enough arguments', src/main.rs:30:12
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
```
|
||||
|
||||
This output is better: we now have a reasonable error message. However, we also
|
||||
have extraneous information we don’t want to give to our users. Perhaps using
|
||||
the technique we used in Listing 9-9 isn’t the best to use here: a call to
|
||||
`panic!` is more appropriate for a programming problem rather than a usage
|
||||
problem, as discussed in Chapter 9. Instead, we can use the other technique you
|
||||
learned about in Chapter 9—returning a `Result` that indicates either success
|
||||
or an error.
|
||||
|
||||
#### Returning a `Result` from `new` Instead of Calling `panic!`
|
||||
|
||||
We can instead return a `Result` value that will contain a `Config` instance in
|
||||
the successful case and will describe the problem in the error case. When
|
||||
`Config::new` is communicating to `main`, we can use the `Result` type to
|
||||
signal there was a problem. Then we can change `main` to convert an `Err`
|
||||
variant into a more practical error for our users without the surrounding text
|
||||
about `thread 'main'` and `RUST_BACKTRACE` that a call to `panic!` causes.
|
||||
|
||||
Listing 12-9 shows the changes we need to make to the return value of
|
||||
`Config::new` and the body of the function needed to return a `Result`. Note
|
||||
that this won’t compile until we update `main` as well, which we’ll do in the
|
||||
next listing.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
impl Config {
|
||||
fn new(args: &[String]) -> Result<Config, &'static str> {
|
||||
if args.len() < 3 {
|
||||
return Err("not enough arguments");
|
||||
}
|
||||
|
||||
let query = args[1].clone();
|
||||
let filename = args[2].clone();
|
||||
|
||||
Ok(Config { query, filename })
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-9: Returning a `Result` from
|
||||
`Config::new`</span>
|
||||
|
||||
Our `new` function now returns a `Result` with a `Config` instance in the
|
||||
success case and a `&'static str` in the error case. Recall from “The Static
|
||||
Lifetime” section in Chapter 10 that `&'static str` is the type of string
|
||||
literals, which is our error message type for now.
|
||||
|
||||
We’ve made two changes in the body of the `new` function: instead of calling
|
||||
`panic!` when the user doesn’t pass enough arguments, we now return an `Err`
|
||||
value, and we’ve wrapped the `Config` return value in an `Ok`. These changes
|
||||
make the function conform to its new type signature.
|
||||
|
||||
Returning an `Err` value from `Config::new` allows the `main` function to
|
||||
handle the `Result` value returned from the `new` function and exit the process
|
||||
more cleanly in the error case.
|
||||
|
||||
#### Calling `Config::new` and Handling Errors
|
||||
|
||||
To handle the error case and print a user-friendly message, we need to update
|
||||
`main` to handle the `Result` being returned by `Config::new`, as shown in
|
||||
Listing 12-10. We’ll also take the responsibility of exiting the command line
|
||||
tool with a nonzero error code from `panic!` and implement it by hand. A
|
||||
nonzero exit status is a convention to signal to the process that called our
|
||||
program that the program exited with an error state.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use std::process;
|
||||
|
||||
fn main() {
|
||||
let args: Vec<String> = env::args().collect();
|
||||
|
||||
let config = Config::new(&args).unwrap_or_else(|err| {
|
||||
println!("Problem parsing arguments: {}", err);
|
||||
process::exit(1);
|
||||
});
|
||||
|
||||
// --snip--
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-10: Exiting with an error code if creating a
|
||||
new `Config` fails</span>
|
||||
|
||||
In this listing, we’ve used a method we haven’t covered before:
|
||||
`unwrap_or_else`, which is defined on `Result<T, E>` by the standard library.
|
||||
Using `unwrap_or_else` allows us to define some custom, non-`panic!` error
|
||||
handling. If the `Result` is an `Ok` value, this method’s behavior is similar
|
||||
to `unwrap`: it returns the inner value `Ok` is wrapping. However, if the value
|
||||
is an `Err` value, this method calls the code in the *closure*, which is an
|
||||
anonymous function we define and pass as an argument to `unwrap_or_else`. We’ll
|
||||
cover closures in more detail in Chapter 13. For now, you just need to know
|
||||
that `unwrap_or_else` will pass the inner value of the `Err`, which in this
|
||||
case is the static string `not enough arguments` that we added in Listing 12-9,
|
||||
to our closure in the argument `err` that appears between the vertical pipes.
|
||||
The code in the closure can then use the `err` value when it runs.
|
||||
|
||||
We’ve added a new `use` line to import `process` from the standard library. The
|
||||
code in the closure that will be run in the error case is only two lines: we
|
||||
print the `err` value and then call `process::exit`. The `process::exit`
|
||||
function will stop the program immediately and return the number that was
|
||||
passed as the exit status code. This is similar to the `panic!`-based handling
|
||||
we used in Listing 12-8, but we no longer get all the extra output. Let’s try
|
||||
it:
|
||||
|
||||
```text
|
||||
$ cargo run
|
||||
Compiling minigrep v0.1.0 (file:///projects/minigrep)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.48 secs
|
||||
Running `target/debug/minigrep`
|
||||
Problem parsing arguments: not enough arguments
|
||||
```
|
||||
|
||||
Great! This output is much friendlier for our users.
|
||||
|
||||
### Extracting Logic from `main`
|
||||
|
||||
Now that we’ve finished refactoring the configuration parsing, let’s turn to
|
||||
the program’s logic. As we stated in “Separation of Concerns for Binary
|
||||
Projects”, we’ll extract a function named `run` that will hold all the logic
|
||||
currently in the `main` function that isn’t involved with setting up
|
||||
configuration or handling errors. When we’re done, `main` will be concise and
|
||||
easy to verify by inspection, and we’ll be able to write tests for all the
|
||||
other logic.
|
||||
|
||||
Listing 12-11 shows the extracted `run` function. For now, we’re just making
|
||||
the small, incremental improvement of extracting the function. We’re still
|
||||
defining the function in *src/main.rs*.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
// --snip--
|
||||
|
||||
println!("Searching for {}", config.query);
|
||||
println!("In file {}", config.filename);
|
||||
|
||||
run(config);
|
||||
}
|
||||
|
||||
fn run(config: Config) {
|
||||
let mut f = File::open(config.filename).expect("file not found");
|
||||
|
||||
let mut contents = String::new();
|
||||
f.read_to_string(&mut contents)
|
||||
.expect("something went wrong reading the file");
|
||||
|
||||
println!("With text:\n{}", contents);
|
||||
}
|
||||
|
||||
// --snip--
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-11: Extracting a `run` function containing the
|
||||
rest of the program logic</span>
|
||||
|
||||
The `run` function now contains all the remaining logic from `main`, starting
|
||||
from reading the file. The `run` function takes the `Config` instance as an
|
||||
argument.
|
||||
|
||||
#### Returning Errors from the `run` Function
|
||||
|
||||
With the remaining program logic separated into the `run` function, we can
|
||||
improve the error handling, as we did with `Config::new` in Listing 12-9.
|
||||
Instead of allowing the program to panic by calling `expect`, the `run`
|
||||
function will return a `Result<T, E>` when something goes wrong. This will let
|
||||
us further consolidate into `main` the logic around handling errors in a
|
||||
user-friendly way. Listing 12-12 shows the changes we need to make to the
|
||||
signature and body of `run`:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use std::error::Error;
|
||||
|
||||
// --snip--
|
||||
|
||||
fn run(config: Config) -> Result<(), Box<Error>> {
|
||||
let mut f = File::open(config.filename)?;
|
||||
|
||||
let mut contents = String::new();
|
||||
f.read_to_string(&mut contents)?;
|
||||
|
||||
println!("With text:\n{}", contents);
|
||||
|
||||
Ok(())
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-12: Changing the `run` function to return
|
||||
`Result`</span>
|
||||
|
||||
We’ve made three significant changes here. First, we changed the return type of
|
||||
the `run` function to `Result<(), Box<Error>>`. This function previously
|
||||
returned the unit type, `()`, and we keep that as the value returned in the
|
||||
`Ok` case.
|
||||
|
||||
For the error type, we used the *trait object* `Box<Error>` (and we’ve brought
|
||||
`std::error::Error` into scope with a `use` statement at the top). We’ll cover
|
||||
trait objects in Chapter 17. For now, just know that `Box<Error>` means the
|
||||
function will return a type that implements the `Error` trait, but we don’t
|
||||
have to specify what particular type the return value will be. This gives us
|
||||
flexibility to return error values that may be of different types in different
|
||||
error cases.
|
||||
|
||||
Second, we’ve removed the calls to `expect` in favor of `?`, as we talked about
|
||||
in Chapter 9. Rather than `panic!` on an error, `?` will return the error value
|
||||
from the current function for the caller to handle.
|
||||
|
||||
Third, the `run` function now returns an `Ok` value in the success case. We’ve
|
||||
declared the `run` function’s success type as `()` in the signature, which
|
||||
means we need to wrap the unit type value in the `Ok` value. This `Ok(())`
|
||||
syntax might look a bit strange at first, but using `()` like this is the
|
||||
idiomatic way to indicate that we’re calling `run` for its side effects only;
|
||||
it doesn’t return a value we need.
|
||||
|
||||
When you run this code, it will compile but will display a warning:
|
||||
|
||||
```text
|
||||
warning: unused `std::result::Result` which must be used
|
||||
--> src/main.rs:18:5
|
||||
|
|
||||
18 | run(config);
|
||||
| ^^^^^^^^^^^^
|
||||
= note: #[warn(unused_must_use)] on by default
|
||||
```
|
||||
|
||||
Rust tells us that our code ignored the `Result` value and the `Result` value
|
||||
might indicate that an error occurred. But we’re not checking to see whether or
|
||||
not there was an error, and the compiler reminds us that we probably meant to
|
||||
have some error handling code here! Let’s rectify that problem now.
|
||||
|
||||
#### Handling Errors Returned from `run` in `main`
|
||||
|
||||
We’ll check for errors and handle them using a technique similar to one we used
|
||||
with `Config::new` in Listing 12-10, but with a slight difference:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
// --snip--
|
||||
|
||||
println!("Searching for {}", config.query);
|
||||
println!("In file {}", config.filename);
|
||||
|
||||
if let Err(e) = run(config) {
|
||||
println!("Application error: {}", e);
|
||||
|
||||
process::exit(1);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
We use `if let` rather than `unwrap_or_else` to check whether `run` returns an
|
||||
`Err` value and call `process::exit(1)` if it does. The `run` function doesn’t
|
||||
return a value that we want to `unwrap` in the same way that `Config::new`
|
||||
returns the `Config` instance. Because `run` returns `()` in the success case,
|
||||
we only care about detecting an error, so we don’t need `unwrap_or_else` to
|
||||
return the unwrapped value because it would only be `()`.
|
||||
|
||||
The bodies of the `if let` and the `unwrap_or_else` functions are the same in
|
||||
both cases: we print the error and exit.
|
||||
|
||||
### Splitting Code into a Library Crate
|
||||
|
||||
Our `minigrep` project is looking good so far! Now we’ll split the
|
||||
*src/main.rs* file and put some code into the *src/lib.rs* file so we can test
|
||||
it and have a *src/main.rs* file with fewer responsibilities.
|
||||
|
||||
Let’s move all the code that isn’t the `main` function from *src/main.rs* to
|
||||
*src/lib.rs*:
|
||||
|
||||
* The `run` function definition
|
||||
* The relevant `use` statements
|
||||
* The definition of `Config`
|
||||
* The `Config::new` function definition
|
||||
|
||||
The contents of *src/lib.rs* should have the signatures shown in Listing 12-13
|
||||
(we’ve omitted the bodies of the functions for brevity). Note that this won’t
|
||||
compile until we modify *src/main.rs* in the listing after this one.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use std::error::Error;
|
||||
use std::fs::File;
|
||||
use std::io::prelude::*;
|
||||
|
||||
pub struct Config {
|
||||
pub query: String,
|
||||
pub filename: String,
|
||||
}
|
||||
|
||||
impl Config {
|
||||
pub fn new(args: &[String]) -> Result<Config, &'static str> {
|
||||
// --snip--
|
||||
}
|
||||
}
|
||||
|
||||
pub fn run(config: Config) -> Result<(), Box<Error>> {
|
||||
// --snip--
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-13: Moving `Config` and `run` into
|
||||
*src/lib.rs*</span>
|
||||
|
||||
We’ve made liberal use of the `pub` keyword: on `Config`, on its fields and its
|
||||
`new` method, and on the `run` function. We now have a library crate that has a
|
||||
public API that we can test!
|
||||
|
||||
Now we need to bring the code we moved to *src/lib.rs* into the scope of the
|
||||
binary crate in *src/main.rs*, as shown in Listing 12-14:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate minigrep;
|
||||
|
||||
use std::env;
|
||||
use std::process;
|
||||
|
||||
use minigrep::Config;
|
||||
|
||||
fn main() {
|
||||
// --snip--
|
||||
if let Err(e) = minigrep::run(config) {
|
||||
// --snip--
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-14: Bringing the `minigrep` crate into the
|
||||
scope of *src/main.rs*</span>
|
||||
|
||||
To bring the library crate into the binary crate, we use `extern crate
|
||||
minigrep`. Then we add a `use minigrep::Config` line to bring the `Config` type
|
||||
into scope, and we prefix the `run` function with our crate name. Now all the
|
||||
functionality should be connected and should work. Run the program with `cargo
|
||||
run` and make sure everything works correctly.
|
||||
|
||||
Whew! That was a lot of work, but we’ve set ourselves up for success in the
|
||||
future. Now it’s much easier to handle errors, and we’ve made the code more
|
||||
modular. Almost all of our work will be done in *src/lib.rs* from here on out.
|
||||
|
||||
Let’s take advantage of this newfound modularity by doing something that would
|
||||
have been difficult with the old code but is easy with the new code: we’ll
|
||||
write some tests!
|
||||
332
2018-edition/src/ch12-04-testing-the-librarys-functionality.md
Normal file
332
2018-edition/src/ch12-04-testing-the-librarys-functionality.md
Normal file
@@ -0,0 +1,332 @@
|
||||
## Developing the Library’s Functionality with Test-Driven Development
|
||||
|
||||
Now that we’ve extracted the logic into *src/lib.rs* and left the argument
|
||||
collecting and error handling in *src/main.rs*, it’s much easier to write tests
|
||||
for the core functionality of our code. We can call functions directly with
|
||||
various arguments and check return values without having to call our binary
|
||||
from the command line. Feel free to write some tests for the functionality in
|
||||
the `Config::new` and `run` functions on your own.
|
||||
|
||||
In this section, we’ll add the searching logic to the `minigrep` program by
|
||||
using the Test-driven development (TDD) process. This software development
|
||||
technique follows these steps:
|
||||
|
||||
1. Write a test that fails and run it to make sure it fails for the reason you
|
||||
expect.
|
||||
2. Write or modify just enough code to make the new test pass.
|
||||
3. Refactor the code you just added or changed and make sure the tests
|
||||
continue to pass.
|
||||
4. Repeat from step 1!
|
||||
|
||||
This process is just one of many ways to write software, but TDD can help drive
|
||||
code design as well. Writing the test before you write the code that makes the
|
||||
test pass helps to maintain high test coverage throughout the process.
|
||||
|
||||
We’ll test drive the implementation of the functionality that will actually do
|
||||
the searching for the query string in the file contents and produce a list of
|
||||
lines that match the query. We’ll add this functionality in a function called
|
||||
`search`.
|
||||
|
||||
### Writing a Failing Test
|
||||
|
||||
Because we don’t need them anymore, let’s remove the `println!` statements from
|
||||
*src/lib.rs* and *src/main.rs* that we used to check the program’s behavior.
|
||||
Then, in *src/lib.rs*, we’ll add a `test` module with a test function, as we
|
||||
did in Chapter 11. The test function specifies the behavior we want the
|
||||
`search` function to have: it will take a query and the text to search for the
|
||||
query in, and it will return only the lines from the text that contain the
|
||||
query. Listing 12-15 shows this test, which won’t compile yet:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn search<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
# vec![]
|
||||
# }
|
||||
#
|
||||
#[cfg(test)]
|
||||
mod test {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn one_result() {
|
||||
let query = "duct";
|
||||
let contents = "\
|
||||
Rust:
|
||||
safe, fast, productive.
|
||||
Pick three.";
|
||||
|
||||
assert_eq!(
|
||||
vec!["safe, fast, productive."],
|
||||
search(query, contents)
|
||||
);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-15: Creating a failing test for the `search`
|
||||
function we wish we had</span>
|
||||
|
||||
This test searches for the string `"duct"`. The text we’re searching is three
|
||||
lines, only one of which contains `"duct"`. We assert that the value returned
|
||||
from the `search` function contains only the line we expect.
|
||||
|
||||
We aren’t able to run this test and watch it fail because the test doesn’t even
|
||||
compile: the `search` function doesn’t exist yet! So now we’ll add just enough
|
||||
code to get the test to compile and run by adding a definition of the `search`
|
||||
function that always returns an empty vector, as shown in Listing 12-16. Then
|
||||
the test should compile and fail because an empty vector doesn’t match a vector
|
||||
containing the line `"safe, fast, productive."`
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub fn search<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
vec![]
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-16: Defining just enough of the `search`
|
||||
function so our test will compile</span>
|
||||
|
||||
Notice that we need an explicit lifetime `'a` defined in the signature of
|
||||
`search` and used with the `contents` argument and the return value. Recall in
|
||||
Chapter 10 that the lifetime parameters specify which argument lifetime is
|
||||
connected to the lifetime of the return value. In this case, we indicate that
|
||||
the returned vector should contain string slices that reference slices of the
|
||||
argument `contents` (rather than the argument `query`).
|
||||
|
||||
In other words, we tell Rust that the data returned by the `search` function
|
||||
will live as long as the data passed into the `search` function in the
|
||||
`contents` argument. This is important! The data referenced *by* a slice needs
|
||||
to be valid for the reference to be valid; if the compiler assumes we’re making
|
||||
string slices of `query` rather than `contents`, it will do its safety checking
|
||||
incorrectly.
|
||||
|
||||
If we forget the lifetime annotations and try to compile this function, we’ll
|
||||
get this error:
|
||||
|
||||
```text
|
||||
error[E0106]: missing lifetime specifier
|
||||
--> src/lib.rs:5:51
|
||||
|
|
||||
5 | pub fn search(query: &str, contents: &str) -> Vec<&str> {
|
||||
| ^ expected lifetime
|
||||
parameter
|
||||
|
|
||||
= help: this function's return type contains a borrowed value, but the
|
||||
signature does not say whether it is borrowed from `query` or `contents`
|
||||
```
|
||||
|
||||
Rust can’t possibly know which of the two arguments we need, so we need to tell
|
||||
it. Because `contents` is the argument that contains all of our text and we
|
||||
want to return the parts of that text that match, we know `contents` is the
|
||||
argument that should be connected to the return value using the lifetime syntax.
|
||||
|
||||
Other programming languages don’t require you to connect arguments to return
|
||||
values in the signature. So although this might seem strange, it will get
|
||||
easier over time. You might want to compare this example with the “Validating
|
||||
References with Lifetimes” section in Chapter 10.
|
||||
|
||||
Now let’s run the test:
|
||||
|
||||
```text
|
||||
$ cargo test
|
||||
Compiling minigrep v0.1.0 (file:///projects/minigrep)
|
||||
--warnings--
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.43 secs
|
||||
Running target/debug/deps/minigrep-abcabcabc
|
||||
|
||||
running 1 test
|
||||
test test::one_result ... FAILED
|
||||
|
||||
failures:
|
||||
|
||||
---- test::one_result stdout ----
|
||||
thread 'test::one_result' panicked at 'assertion failed: `(left ==
|
||||
right)`
|
||||
left: `["safe, fast, productive."]`,
|
||||
right: `[]`)', src/lib.rs:48:8
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
|
||||
|
||||
failures:
|
||||
test::one_result
|
||||
|
||||
test result: FAILED. 0 passed; 1 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
error: test failed, to rerun pass '--lib'
|
||||
```
|
||||
|
||||
Great, the test fails, exactly as we expected. Let’s get the test to pass!
|
||||
|
||||
### Writing Code to Pass the Test
|
||||
|
||||
Currently, our test is failing because we always return an empty vector. To fix
|
||||
that and implement `search`, our program needs to follow these steps:
|
||||
|
||||
* Iterate through each line of the contents.
|
||||
* Check whether the line contains our query string.
|
||||
* If it does, add it to the list of values we’re returning.
|
||||
* If it doesn’t, do nothing.
|
||||
* Return the list of results that match.
|
||||
|
||||
Let’s work through each step, starting with iterating through lines.
|
||||
|
||||
#### Iterating Through Lines with the `lines` Method
|
||||
|
||||
Rust has a helpful method to handle line-by-line iteration of strings,
|
||||
conveniently named `lines`, that works as shown in Listing 12-17. Note this
|
||||
won’t compile yet:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub fn search<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
for line in contents.lines() {
|
||||
// do something with line
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-17: Iterating through each line in `contents`
|
||||
</span>
|
||||
|
||||
The `lines` method returns an iterator. We’ll talk about iterators in depth in
|
||||
Chapter 13, but recall that you saw this way of using an iterator in Listing
|
||||
3-5, where we used a `for` loop with an iterator to run some code on each item
|
||||
in a collection.
|
||||
|
||||
#### Searching Each Line for the Query
|
||||
|
||||
Next, we’ll check whether the current line contains our query string.
|
||||
Fortunately, strings have a helpful method named `contains` that does this for
|
||||
us! Add a call to the `contains` method in the `search` function, as shown in
|
||||
Listing 12-18. Note this still won’t compile yet:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub fn search<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
for line in contents.lines() {
|
||||
if line.contains(query) {
|
||||
// do something with line
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-18: Adding functionality to see whether the
|
||||
line contains the string in `query`</span>
|
||||
|
||||
#### Storing Matching Lines
|
||||
|
||||
We also need a way to store the lines that contain our query string. For that,
|
||||
we can make a mutable vector before the `for` loop and call the `push` method
|
||||
to store a `line` in the vector. After the `for` loop, we return the vector, as
|
||||
shown in Listing 12-19:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub fn search<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
let mut results = Vec::new();
|
||||
|
||||
for line in contents.lines() {
|
||||
if line.contains(query) {
|
||||
results.push(line);
|
||||
}
|
||||
}
|
||||
|
||||
results
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-19: Storing the lines that match so we can
|
||||
return them</span>
|
||||
|
||||
Now the `search` function should return only the lines that contain `query`,
|
||||
and our test should pass. Let’s run the test:
|
||||
|
||||
```text
|
||||
$ cargo test
|
||||
--snip--
|
||||
running 1 test
|
||||
test test::one_result ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Our test passed, so we know it works!
|
||||
|
||||
At this point, we could consider opportunities for refactoring the
|
||||
implementation of the search function while keeping the tests passing to
|
||||
maintain the same functionality. The code in the search function isn’t too bad,
|
||||
but it doesn’t take advantage of some useful features of iterators. We’ll
|
||||
return to this example in Chapter 13, where we’ll explore iterators in detail,
|
||||
and look at how to improve it.
|
||||
|
||||
#### Using the `search` Function in the `run` Function
|
||||
|
||||
Now that the `search` function is working and tested, we need to call `search`
|
||||
from our `run` function. We need to pass the `config.query` value and the
|
||||
`contents` that `run` reads from the file to the `search` function. Then `run`
|
||||
will print each line returned from `search`:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub fn run(config: Config) -> Result<(), Box<Error>> {
|
||||
let mut f = File::open(config.filename)?;
|
||||
|
||||
let mut contents = String::new();
|
||||
f.read_to_string(&mut contents)?;
|
||||
|
||||
for line in search(&config.query, &contents) {
|
||||
println!("{}", line);
|
||||
}
|
||||
|
||||
Ok(())
|
||||
}
|
||||
```
|
||||
|
||||
We’re still using a `for` loop to return each line from `search` and print it.
|
||||
|
||||
Now the entire program should work! Let’s try it out, first with a word that
|
||||
should return exactly one line from the Emily Dickinson poem, “frog”:
|
||||
|
||||
```text
|
||||
$ cargo run frog poem.txt
|
||||
Compiling minigrep v0.1.0 (file:///projects/minigrep)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.38 secs
|
||||
Running `target/debug/minigrep frog poem.txt`
|
||||
How public, like a frog
|
||||
```
|
||||
|
||||
Cool! Now let’s try a word that will match multiple lines, like “body”:
|
||||
|
||||
```text
|
||||
$ cargo run body poem.txt
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/minigrep body poem.txt`
|
||||
I’m nobody! Who are you?
|
||||
Are you nobody, too?
|
||||
How dreary to be somebody!
|
||||
```
|
||||
|
||||
And finally, let’s make sure that we don’t get any lines when we search for a
|
||||
word that isn’t anywhere in the poem, such as “monomorphization”:
|
||||
|
||||
```text
|
||||
$ cargo run monomorphization poem.txt
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/minigrep monomorphization poem.txt`
|
||||
```
|
||||
|
||||
Excellent! We’ve built our own mini version of a classic tool and learned a lot
|
||||
about how to structure applications. We’ve also learned a bit about file input
|
||||
and output, lifetimes, testing, and command line parsing.
|
||||
|
||||
To round out this project, we’ll briefly demonstrate how to work with
|
||||
environment variables and how to print to standard error, both of which are
|
||||
useful when you’re writing command line programs.
|
||||
305
2018-edition/src/ch12-05-working-with-environment-variables.md
Normal file
305
2018-edition/src/ch12-05-working-with-environment-variables.md
Normal file
@@ -0,0 +1,305 @@
|
||||
## Working with Environment Variables
|
||||
|
||||
We’ll improve `minigrep` by adding an extra feature: an option for
|
||||
case-insensitive searching that the user can turn on via an environment
|
||||
variable. We could make this feature a command line option and require that
|
||||
users enter it each time they want it to apply, but instead we’ll use an
|
||||
environment variable. Doing so allows our users to set the environment variable
|
||||
once and have all their searches be case insensitive in that terminal session.
|
||||
|
||||
### Writing a Failing Test for the Case-Insensitive `search` Function
|
||||
|
||||
We want to add a new `search_case_insensitive` function that we’ll call when
|
||||
the environment variable is on. We’ll continue to follow the TDD process, so
|
||||
the first step is again to write a failing test. We’ll add a new test for the
|
||||
new `search_case_insensitive` function and rename our old test from
|
||||
`one_result` to `case_sensitive` to clarify the differences between the two
|
||||
tests, as shown in Listing 12-20:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[cfg(test)]
|
||||
mod test {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn case_sensitive() {
|
||||
let query = "duct";
|
||||
let contents = "\
|
||||
Rust:
|
||||
safe, fast, productive.
|
||||
Pick three.
|
||||
Duct tape.";
|
||||
|
||||
assert_eq!(
|
||||
vec!["safe, fast, productive."],
|
||||
search(query, contents)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn case_insensitive() {
|
||||
let query = "rUsT";
|
||||
let contents = "\
|
||||
Rust:
|
||||
safe, fast, productive.
|
||||
Pick three.
|
||||
Trust me.";
|
||||
|
||||
assert_eq!(
|
||||
vec!["Rust:", "Trust me."],
|
||||
search_case_insensitive(query, contents)
|
||||
);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-20: Adding a new failing test for the
|
||||
case-insensitive function we’re about to add</span>
|
||||
|
||||
Note that we’ve edited the old test’s `contents` too. We’ve added a new line
|
||||
with the text `"Duct tape."` using a capital D that shouldn’t match the query
|
||||
“duct” when we’re searching in a case-sensitive manner. Changing the old test
|
||||
in this way helps ensure that we don’t accidentally break the case-sensitive
|
||||
search functionality that we’ve already implemented. This test should pass now
|
||||
and should continue to pass as we work on the case-insensitive search.
|
||||
|
||||
The new test for the case-*insensitive* search uses `"rUsT"` as its query. In
|
||||
the `search_case_insensitive` function we’re about to add, the query `"rUsT"`
|
||||
should match the line containing `"Rust:"` with a capital R and match the line
|
||||
`"Trust me."` even though both have different casing than the query. This is
|
||||
our failing test, and it will fail to compile because we haven’t yet defined
|
||||
the `search_case_insensitive` function. Feel free to add a skeleton
|
||||
implementation that always returns an empty vector, similar to the way we did
|
||||
for the `search` function in Listing 12-16 to see the test compile and fail.
|
||||
|
||||
### Implementing the `search_case_insensitive` Function
|
||||
|
||||
The `search_case_insensitive` function, shown in Listing 12-21, will be almost
|
||||
the same as the `search` function. The only difference is that we’ll lowercase
|
||||
the `query` and each `line` so whatever the case of the input arguments,
|
||||
they’ll be the same case when we check whether the line contains the query.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
fn search_case_insensitive<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
let query = query.to_lowercase();
|
||||
let mut results = Vec::new();
|
||||
|
||||
for line in contents.lines() {
|
||||
if line.to_lowercase().contains(&query) {
|
||||
results.push(line);
|
||||
}
|
||||
}
|
||||
|
||||
results
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-21: Defining the `search_case_insensitive`
|
||||
function to lowercase the query and the line before comparing them</span>
|
||||
|
||||
First, we lowercase the `query` string and store it in a shadowed variable with
|
||||
the same name. Calling `to_lowercase` on the query is necessary so no matter
|
||||
whether the user’s query is `"rust"`, `"RUST"`, `"Rust:"`, or `"rUsT"`, we’ll
|
||||
treat the query as if it were `"rust"` and be insensitive to the case.
|
||||
|
||||
Note that `query` is now a `String` rather than a string slice, because calling
|
||||
`to_lowercase` creates new data rather than referencing existing data. Say the
|
||||
query is `"rUsT"`, as an example: that string slice doesn’t contain a lowercase
|
||||
`u` or `t` for us to use, so we have to allocate a new `String` containing
|
||||
`"rust"`. When we pass `query` as an argument to the `contains` method now, we
|
||||
need to add an ampersand because the signature of `contains` is defined to take
|
||||
a string slice.
|
||||
|
||||
Next, we add a call to `to_lowercase` on each `line` before we check whether it
|
||||
contains `query` to lowercase all characters. Now that we’ve converted `line`
|
||||
and `query` to lowercase, we’ll find matches no matter what the case of the
|
||||
query is.
|
||||
|
||||
Let’s see if this implementation passes the tests:
|
||||
|
||||
```text
|
||||
running 2 tests
|
||||
test test::case_insensitive ... ok
|
||||
test test::case_sensitive ... ok
|
||||
|
||||
test result: ok. 2 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Great! They passed. Now, let’s call the new `search_case_insensitive` function
|
||||
from the `run` function. First, we’ll add a configuration option to the
|
||||
`Config` struct to switch between case-sensitive and case-insensitive search.
|
||||
Adding this field will cause compiler errors since we aren’t initializing this
|
||||
field anywhere yet:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub struct Config {
|
||||
pub query: String,
|
||||
pub filename: String,
|
||||
pub case_sensitive: bool,
|
||||
}
|
||||
```
|
||||
|
||||
Note that we added the `case_sensitive` field that holds a Boolean. Next, we
|
||||
need the `run` function to check the `case_sensitive` field’s value and use
|
||||
that to decide whether to call the `search` function or the
|
||||
`search_case_insensitive` function, as shown in Listing 12-22. Note this still
|
||||
won’t compile yet:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::error::Error;
|
||||
# use std::fs::File;
|
||||
# use std::io::prelude::*;
|
||||
#
|
||||
# fn search<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
# vec![]
|
||||
# }
|
||||
#
|
||||
# fn search_case_insensitive<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
# vec![]
|
||||
# }
|
||||
#
|
||||
# struct Config {
|
||||
# query: String,
|
||||
# filename: String,
|
||||
# case_sensitive: bool,
|
||||
# }
|
||||
#
|
||||
pub fn run(config: Config) -> Result<(), Box<Error>> {
|
||||
let mut f = File::open(config.filename)?;
|
||||
|
||||
let mut contents = String::new();
|
||||
f.read_to_string(&mut contents)?;
|
||||
|
||||
let results = if config.case_sensitive {
|
||||
search(&config.query, &contents)
|
||||
} else {
|
||||
search_case_insensitive(&config.query, &contents)
|
||||
};
|
||||
|
||||
for line in results {
|
||||
println!("{}", line);
|
||||
}
|
||||
|
||||
Ok(())
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-22: Calling either `search` or
|
||||
`search_case_insensitive` based on the value in `config.case_sensitive`</span>
|
||||
|
||||
Finally, we need to check for the environment variable. The functions for
|
||||
working with environment variables are in the `env` module in the standard
|
||||
library, so we want to bring that module into scope with a `use std::env;` line
|
||||
at the top of *src/lib.rs*. Then we’ll use the `var` method from the `env`
|
||||
module to check for an environment variable named `CASE_INSENSITIVE`, as shown
|
||||
in Listing 12-23:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
use std::env;
|
||||
# struct Config {
|
||||
# query: String,
|
||||
# filename: String,
|
||||
# case_sensitive: bool,
|
||||
# }
|
||||
|
||||
// --snip--
|
||||
|
||||
impl Config {
|
||||
pub fn new(args: &[String]) -> Result<Config, &'static str> {
|
||||
if args.len() < 3 {
|
||||
return Err("not enough arguments");
|
||||
}
|
||||
|
||||
let query = args[1].clone();
|
||||
let filename = args[2].clone();
|
||||
|
||||
let case_sensitive = env::var("CASE_INSENSITIVE").is_err();
|
||||
|
||||
Ok(Config { query, filename, case_sensitive })
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-23: Checking for an environment variable named
|
||||
`CASE_INSENSITIVE`</span>
|
||||
|
||||
Here, we create a new variable `case_sensitive`. To set its value, we call the
|
||||
`env::var` function and pass it the name of the `CASE_INSENSITIVE` environment
|
||||
variable. The `env::var` method returns a `Result` that will be the successful
|
||||
`Ok` variant that contains the value of the environment variable if the
|
||||
environment variable is set. It will return the `Err` variant if the
|
||||
environment variable is not set.
|
||||
|
||||
We’re using the `is_err` method on the `Result` to check whether it’s an error
|
||||
and therefore unset, which means it *should* do a case-sensitive search. If the
|
||||
`CASE_INSENSITIVE` environment variable is set to anything, `is_err` will
|
||||
return false and the program will perform a case-insensitive search. We don’t
|
||||
care about the *value* of the environment variable, just whether it’s set or
|
||||
unset, so we’re checking `is_err` rather than using `unwrap`, `expect`, or any
|
||||
of the other methods we’ve seen on `Result`.
|
||||
|
||||
We pass the value in the `case_sensitive` variable to the `Config` instance so
|
||||
the `run` function can read that value and decide whether to call `search` or
|
||||
`search_case_insensitive`, as we implemented in Listing 12-22.
|
||||
|
||||
Let’s give it a try! First, we’ll run our program without the environment
|
||||
variable set and with the query `to`, which should match any line that contains
|
||||
the word “to” in all lowercase:
|
||||
|
||||
```text
|
||||
$ cargo run to poem.txt
|
||||
Compiling minigrep v0.1.0 (file:///projects/minigrep)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/minigrep to poem.txt`
|
||||
Are you nobody, too?
|
||||
How dreary to be somebody!
|
||||
```
|
||||
|
||||
Looks like that still works! Now, let’s run the program with `CASE_INSENSITIVE`
|
||||
set to `1` but with the same query `to`.
|
||||
|
||||
If you’re using PowerShell, you will need to set the environment variable and
|
||||
run the program in two commands rather than one:
|
||||
|
||||
```text
|
||||
$ $env:CASE_INSENSITIVE=1
|
||||
$ cargo run to poem.txt
|
||||
```
|
||||
|
||||
We should get lines that contain “to” that might have uppercase letters:
|
||||
|
||||
```text
|
||||
$ CASE_INSENSITIVE=1 cargo run to poem.txt
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/minigrep to poem.txt`
|
||||
Are you nobody, too?
|
||||
How dreary to be somebody!
|
||||
To tell your name the livelong day
|
||||
To an admiring bog!
|
||||
```
|
||||
|
||||
Excellent, we also got lines containing “To”! Our `minigrep` program can now do
|
||||
case-insensitive searching controlled by an environment variable. Now you know
|
||||
how to manage options set using either command line arguments or environment
|
||||
variables.
|
||||
|
||||
Some programs allow arguments *and* environment variables for the same
|
||||
configuration. In those cases, the programs decide that one or the other takes
|
||||
precedence. For another exercise on your own, try controlling case
|
||||
insensitivity through either a command line argument or an environment
|
||||
variable. Decide whether the command line argument or the environment variable
|
||||
should take precedence if the program is run with one set to case sensitive and
|
||||
one set to case insensitive.
|
||||
|
||||
The `std::env` module contains many more useful features for dealing with
|
||||
environment variables: check out its documentation to see what is available.
|
||||
121
2018-edition/src/ch12-06-writing-to-stderr-instead-of-stdout.md
Normal file
121
2018-edition/src/ch12-06-writing-to-stderr-instead-of-stdout.md
Normal file
@@ -0,0 +1,121 @@
|
||||
## Writing Error Messages to Standard Error Instead of Standard Output
|
||||
|
||||
At the moment, we’re writing all of our output to the terminal using the
|
||||
`println!` function. Most terminals provide two kinds of output: *standard
|
||||
output* (`stdout`) for general information and *standard error* (`stderr`)
|
||||
for error messages. This distinction enables users to choose to direct the
|
||||
successful output of a program to a file but still print error messages to the
|
||||
screen.
|
||||
|
||||
The `println!` function is only capable of printing to standard output, so we
|
||||
have to use something else to print to standard error.
|
||||
|
||||
### Checking Where Errors Are Written
|
||||
|
||||
First, let’s observe how the content printed by `minigrep` is currently being
|
||||
written to standard output, including any error messages we want to write to
|
||||
standard error instead. We’ll do that by redirecting the standard output stream
|
||||
to a file while also intentionally causing an error. We won’t redirect the
|
||||
standard error stream, so any content sent to standard error will continue to
|
||||
display on the screen.
|
||||
|
||||
Command line programs are expected to send error messages to the standard error
|
||||
stream so we can still see error messages on the screen even if we redirect the
|
||||
standard output stream to a file. Our program is not currently well-behaved:
|
||||
we’re about to see that it saves the error message output to a file instead!
|
||||
|
||||
The way to demonstrate this behavior is by running the program with `>` and the
|
||||
filename, *output.txt*, that we want to redirect the standard output stream to.
|
||||
We won’t pass any arguments, which should cause an error:
|
||||
|
||||
```text
|
||||
$ cargo run > output.txt
|
||||
```
|
||||
|
||||
The `>` syntax tells the shell to write the contents of standard output to
|
||||
*output.txt* instead of the screen. We didn’t see the error message we were
|
||||
expecting printed to the screen, so that means it must have ended up in the
|
||||
file. This is what *output.txt* contains:
|
||||
|
||||
```text
|
||||
Problem parsing arguments: not enough arguments
|
||||
```
|
||||
|
||||
Yup, our error message is being printed to standard output. It’s much more
|
||||
useful for error messages like this to be printed to standard error so only
|
||||
data from a successful run ends up in the file. We’ll change that.
|
||||
|
||||
### Printing Errors to Standard Error
|
||||
|
||||
We’ll use the code in Listing 12-24 to change how error messages are printed.
|
||||
Because of the refactoring we did earlier in this chapter, all the code that
|
||||
prints error messages is in one function, `main`. The standard library provides
|
||||
the `eprintln!` macro that prints to the standard error stream, so let’s change
|
||||
the two places we were calling `println!` to print errors to use `eprintln!`
|
||||
instead.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let args: Vec<String> = env::args().collect();
|
||||
|
||||
let config = Config::new(&args).unwrap_or_else(|err| {
|
||||
eprintln!("Problem parsing arguments: {}", err);
|
||||
process::exit(1);
|
||||
});
|
||||
|
||||
if let Err(e) = minigrep::run(config) {
|
||||
eprintln!("Application error: {}", e);
|
||||
|
||||
process::exit(1);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 12-24: Writing error messages to standard error
|
||||
instead of standard output using `eprintln!`</span>
|
||||
|
||||
After changing `println!` to `eprintln!`, let’s run the program again in the
|
||||
same way, without any arguments and redirecting standard output with `>`:
|
||||
|
||||
```text
|
||||
$ cargo run > output.txt
|
||||
Problem parsing arguments: not enough arguments
|
||||
```
|
||||
|
||||
Now we see the error onscreen and *output.txt* contains nothing, which is the
|
||||
behavior we expect of command line programs.
|
||||
|
||||
Let’s run the program again with arguments that don’t cause an error but still
|
||||
redirect standard output to a file, like so:
|
||||
|
||||
```text
|
||||
$ cargo run to poem.txt > output.txt
|
||||
```
|
||||
|
||||
We won’t see any output to the terminal, and *output.txt* will contain our
|
||||
results:
|
||||
|
||||
<span class="filename">Filename: output.txt</span>
|
||||
|
||||
```text
|
||||
Are you nobody, too?
|
||||
How dreary to be somebody!
|
||||
```
|
||||
|
||||
This demonstrates that we’re now using standard output for successful output
|
||||
and standard error for error output as appropriate.
|
||||
|
||||
## Summary
|
||||
|
||||
This chapter recapped some of the major concepts you’ve learned so far and
|
||||
covered how to perform common I/O operations in Rust. By using command line
|
||||
arguments, files, environment variables, and the `eprintln!` macro for printing
|
||||
errors, you’re now prepared to write command line applications. By using the
|
||||
concepts in previous chapters, your code will be well organized, store data
|
||||
effectively in the appropriate data structures, handle errors nicely, and be
|
||||
well tested.
|
||||
|
||||
Next, we’ll explore some Rust features that were influenced by functional
|
||||
languages: closures and iterators.
|
||||
24
2018-edition/src/ch13-00-functional-features.md
Normal file
24
2018-edition/src/ch13-00-functional-features.md
Normal file
@@ -0,0 +1,24 @@
|
||||
# Functional Language Features: Iterators and Closures
|
||||
|
||||
Rust’s design has taken inspiration from many existing languages and
|
||||
techniques, and one significant influence is *functional programming*.
|
||||
Programming in a functional style often includes using functions as values by
|
||||
passing them in arguments, returning them from other functions, assigning them
|
||||
to variables for later execution, and so forth.
|
||||
|
||||
In this chapter, we won’t debate the issue of what functional programming is or
|
||||
isn’t but will instead discuss some features of Rust that are similar to
|
||||
features in many languages often referred to as functional.
|
||||
|
||||
More specifically, we’ll cover:
|
||||
|
||||
* *Closures*, a function-like construct you can store in a variable
|
||||
* *Iterators*, a way of processing a series of elements
|
||||
* How to use these two features to improve the I/O project in Chapter 12
|
||||
* The performance of these two features (Spoiler alert: they’re faster than you
|
||||
might think!)
|
||||
|
||||
Other Rust features, such as pattern matching and enums, which we’ve covered in
|
||||
other chapters, are influenced by the functional style as well. Mastering
|
||||
closures and iterators is an important part of writing idiomatic, fast Rust
|
||||
code, so we’ll devote this entire chapter to them.
|
||||
823
2018-edition/src/ch13-01-closures.md
Normal file
823
2018-edition/src/ch13-01-closures.md
Normal file
@@ -0,0 +1,823 @@
|
||||
## Closures: Anonymous Functions that Can Capture Their Environment
|
||||
|
||||
Rust’s closures are anonymous functions you can save in a variable or pass as
|
||||
arguments to other functions. You can create the closure in one place and then
|
||||
call the closure to evaluate it in a different context. Unlike functions,
|
||||
closures can capture values from the scope in which they’re called. We’ll
|
||||
demonstrate how these closure features allow for code reuse and behavior
|
||||
customization.
|
||||
|
||||
### Creating an Abstraction of Behavior with Closures
|
||||
|
||||
Let’s work on an example of a situation in which it’s useful to store a closure
|
||||
to be executed later. Along the way, we’ll talk about the syntax of closures,
|
||||
type inference, and traits.
|
||||
|
||||
Consider this hypothetical situation: we work at a startup that’s making an app
|
||||
to generate custom exercise workout plans. The backend is written in Rust, and
|
||||
the algorithm that generates the workout plan takes into account many factors,
|
||||
such as the app user’s age, body mass index, exercise preferences, recent
|
||||
workouts, and an intensity number they specify. The actual algorithm used isn’t
|
||||
important in this example; what’s important is that this calculation takes a
|
||||
few seconds. We want to call this algorithm only when we need to and only call
|
||||
it once so we don’t make the user wait more than necessary.
|
||||
|
||||
We’ll simulate calling this hypothetical algorithm with the function
|
||||
`simulated_expensive_calculation` shown in Listing 13-1, which will print
|
||||
`calculating slowly...`, wait for two seconds, and then return whatever number
|
||||
we passed in:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::thread;
|
||||
use std::time::Duration;
|
||||
|
||||
fn simulated_expensive_calculation(intensity: u32) -> u32 {
|
||||
println!("calculating slowly...");
|
||||
thread::sleep(Duration::from_secs(2));
|
||||
intensity
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-1: A function to stand in for a hypothetical
|
||||
calculation that takes about 2 seconds to run</span>
|
||||
|
||||
Next is the `main` function, which contains the parts of the workout app
|
||||
important for this example. This function represents the code that the app will
|
||||
call when a user asks for a workout plan. Because the interaction with the
|
||||
app’s frontend isn’t relevant to the use of closures, we’ll hardcode values
|
||||
representing inputs to our program and print the outputs.
|
||||
|
||||
The required inputs are these:
|
||||
|
||||
* An intensity number from the user, which is specified when they request
|
||||
a workout to indicate whether they want a low-intensity workout or a
|
||||
high-intensity workout
|
||||
* A random number that will generate some variety in the workout plans
|
||||
|
||||
The output will be the recommended workout plan. Listing 13-2 shows the `main`
|
||||
function we’ll use:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let simulated_user_specified_value = 10;
|
||||
let simulated_random_number = 7;
|
||||
|
||||
generate_workout(
|
||||
simulated_user_specified_value,
|
||||
simulated_random_number
|
||||
);
|
||||
}
|
||||
# fn generate_workout(intensity: u32, random_number: u32) {}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-2: A `main` function with hardcoded values to
|
||||
simulate user input and random number generation</span>
|
||||
|
||||
We’ve hardcoded the variable `simulated_user_specified_value` as 10 and the
|
||||
variable `simulated_random_number` as 7 for simplicity’s sake; in an actual
|
||||
program, we’d get the intensity number from the app frontend, and we’d use the
|
||||
`rand` crate to generate a random number, as we did in the Guessing Game
|
||||
example in Chapter 2. The `main` function calls a `generate_workout` function
|
||||
with the simulated input values.
|
||||
|
||||
Now that we have the context, let’s get to the algorithm. The function
|
||||
`generate_workout` in Listing 13-3 contains the business logic of the
|
||||
app that we’re most concerned with in this example. The rest of the code
|
||||
changes in this example will be made to this function.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::thread;
|
||||
# use std::time::Duration;
|
||||
#
|
||||
# fn simulated_expensive_calculation(num: u32) -> u32 {
|
||||
# println!("calculating slowly...");
|
||||
# thread::sleep(Duration::from_secs(2));
|
||||
# num
|
||||
# }
|
||||
#
|
||||
fn generate_workout(intensity: u32, random_number: u32) {
|
||||
if intensity < 25 {
|
||||
println!(
|
||||
"Today, do {} pushups!",
|
||||
simulated_expensive_calculation(intensity)
|
||||
);
|
||||
println!(
|
||||
"Next, do {} situps!",
|
||||
simulated_expensive_calculation(intensity)
|
||||
);
|
||||
} else {
|
||||
if random_number == 3 {
|
||||
println!("Take a break today! Remember to stay hydrated!");
|
||||
} else {
|
||||
println!(
|
||||
"Today, run for {} minutes!",
|
||||
simulated_expensive_calculation(intensity)
|
||||
);
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-3: The business logic that prints the workout
|
||||
plans based on the inputs and calls to the `simulated_expensive_calculation`
|
||||
function</span>
|
||||
|
||||
The code in Listing 13-3 has multiple calls to the slow calculation function.
|
||||
The first `if` block calls `simulated_expensive_calculation` twice, the `if`
|
||||
inside the outer `else` doesn’t call it at all, and the code inside the
|
||||
second `else` case calls it once.
|
||||
|
||||
<!-- NEXT PARAGRAPH WRAPPED WEIRD INTENTIONALLY SEE #199 -->
|
||||
|
||||
The desired behavior of the `generate_workout` function is to first check
|
||||
whether the user wants a low-intensity workout (indicated by a number less
|
||||
than 25) or a high-intensity workout (a number of 25 or greater).
|
||||
|
||||
Low-intensity workout plans will recommend a number of push-ups and sit-ups
|
||||
based on the complex algorithm we’re simulating.
|
||||
|
||||
If the user wants a high-intensity workout, there’s some additional logic: if
|
||||
the value of the random number generated by the app happens to be 3, the app
|
||||
will recommend a break and hydration. If not, the user will get a number of
|
||||
minutes of running based on the complex algorithm.
|
||||
|
||||
This code works the way the business wants it to now, but let’s say the data
|
||||
science team decides that we need to make some changes to the way we call the
|
||||
`simulated_expensive_calculation` function in the future. To simplify the
|
||||
update when those changes happen, we want to refactor this code so it calls the
|
||||
`simulated_expensive_calculation` function only once. We also want to cut the
|
||||
place where we’re currently unnecessarily calling the function twice without
|
||||
adding any other calls to that function in the process. That is, we don’t want
|
||||
to call it if the result isn’t needed, and we still want to call it only once.
|
||||
|
||||
#### Refactoring Using Functions
|
||||
|
||||
We could restructure the workout program in many ways. First, we’ll try
|
||||
extracting the duplicated call to the `simulated_expensive_calculation`
|
||||
function into a variable, as shown in Listing 13-4:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::thread;
|
||||
# use std::time::Duration;
|
||||
#
|
||||
# fn simulated_expensive_calculation(num: u32) -> u32 {
|
||||
# println!("calculating slowly...");
|
||||
# thread::sleep(Duration::from_secs(2));
|
||||
# num
|
||||
# }
|
||||
#
|
||||
fn generate_workout(intensity: u32, random_number: u32) {
|
||||
let expensive_result =
|
||||
simulated_expensive_calculation(intensity);
|
||||
|
||||
if intensity < 25 {
|
||||
println!(
|
||||
"Today, do {} pushups!",
|
||||
expensive_result
|
||||
);
|
||||
println!(
|
||||
"Next, do {} situps!",
|
||||
expensive_result
|
||||
);
|
||||
} else {
|
||||
if random_number == 3 {
|
||||
println!("Take a break today! Remember to stay hydrated!");
|
||||
} else {
|
||||
println!(
|
||||
"Today, run for {} minutes!",
|
||||
expensive_result
|
||||
);
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-4: Extracting the calls to
|
||||
`simulated_expensive_calculation` to one place and storing the result in the
|
||||
`expensive_result` variable</span>
|
||||
|
||||
This change unifies all the calls to `simulated_expensive_calculation` and
|
||||
solves the problem of the first `if` block unnecessarily calling the function
|
||||
twice. Unfortunately, we’re now calling this function and waiting for the
|
||||
result in all cases, which includes the inner `if` block that doesn’t use the
|
||||
result value at all.
|
||||
|
||||
We want to define code in one place in our program, but only *execute* that
|
||||
code where we actually need the result. This is a use case for closures!
|
||||
|
||||
#### Refactoring with Closures to Store Code
|
||||
|
||||
Instead of always calling the `simulated_expensive_calculation` function before
|
||||
the `if` blocks, we can define a closure and store the *closure* in a variable
|
||||
rather than storing the result of the function call, as shown in Listing 13-5.
|
||||
We can actually move the whole body of `simulated_expensive_calculation` within
|
||||
the closure we’re introducing here:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::thread;
|
||||
# use std::time::Duration;
|
||||
#
|
||||
let expensive_closure = |num| {
|
||||
println!("calculating slowly...");
|
||||
thread::sleep(Duration::from_secs(2));
|
||||
num
|
||||
};
|
||||
# expensive_closure(5);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-5: Defining a closure and storing it in the
|
||||
`expensive_closure` variable</span>
|
||||
|
||||
The closure definition comes after the `=` to assign it to the variable
|
||||
`expensive_closure`. To define a closure, we start with a pair of vertical
|
||||
pipes (`|`), inside which we specify the parameters to the closure; this syntax
|
||||
was chosen because of its similarity to closure definitions in Smalltalk and
|
||||
Ruby. This closure has one parameter named `num`: if we had more than one
|
||||
parameter, we would separate them with commas, like `|param1, param2|`.
|
||||
|
||||
After the parameters, we place curly brackets that hold the body of the
|
||||
closure—these are optional if the closure body is a single expression. The end
|
||||
of the closure, after the curly brackets, needs a semicolon to complete the
|
||||
`let` statement. The value returned from the last line in the closure body
|
||||
(`num`) will be the value returned from the closure when it’s called, because
|
||||
that line doesn’t end in a semicolon; just like in function bodies.
|
||||
|
||||
Note that this `let` statement means `expensive_closure` contains the
|
||||
*definition* of an anonymous function, not the *resulting value* of calling the
|
||||
anonymous function. Recall that we’re using a closure because we want to define
|
||||
the code to call at one point, store that code, and call it at a later point;
|
||||
the code we want to call is now stored in `expensive_closure`.
|
||||
|
||||
With the closure defined, we can change the code in the `if` blocks to call the
|
||||
closure to execute the code and get the resulting value. We call a closure like
|
||||
we do a function: we specify the variable name that holds the closure
|
||||
definition and follow it with parentheses containing the argument values we
|
||||
want to use, as shown in Listing 13-6:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::thread;
|
||||
# use std::time::Duration;
|
||||
#
|
||||
fn generate_workout(intensity: u32, random_number: u32) {
|
||||
let expensive_closure = |num| {
|
||||
println!("calculating slowly...");
|
||||
thread::sleep(Duration::from_secs(2));
|
||||
num
|
||||
};
|
||||
|
||||
if intensity < 25 {
|
||||
println!(
|
||||
"Today, do {} pushups!",
|
||||
expensive_closure(intensity)
|
||||
);
|
||||
println!(
|
||||
"Next, do {} situps!",
|
||||
expensive_closure(intensity)
|
||||
);
|
||||
} else {
|
||||
if random_number == 3 {
|
||||
println!("Take a break today! Remember to stay hydrated!");
|
||||
} else {
|
||||
println!(
|
||||
"Today, run for {} minutes!",
|
||||
expensive_closure(intensity)
|
||||
);
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-6: Calling the `expensive_closure` we’ve
|
||||
defined</span>
|
||||
|
||||
Now the expensive calculation is called in only one place, and we’re only
|
||||
executing that code where we need the results.
|
||||
|
||||
However, we’ve reintroduced one of the problems from Listing 13-3: we’re still
|
||||
calling the closure twice in the first `if` block, which will call the
|
||||
expensive code twice and make the user wait twice as long as they need to. We
|
||||
could fix this problem by creating a variable local to that `if` block to hold
|
||||
the result of calling the closure, but closures provide us with another
|
||||
solution. We’ll talk about that solution in a bit. But first let’s talk about
|
||||
why there aren’t type annotations in the closure definition and the traits
|
||||
involved with closures.
|
||||
|
||||
### Closure Type Inference and Annotation
|
||||
|
||||
Closures don’t require you to annotate the types of the parameters or the
|
||||
return value like `fn` functions do. Type annotations are required on functions
|
||||
because they’re part of an explicit interface exposed to your users. Defining
|
||||
this interface rigidly is important for ensuring that everyone agrees on what
|
||||
types of values a function uses and returns. But closures aren’t used in an
|
||||
exposed interface like this: they’re stored in variables and used without
|
||||
naming them and exposing them to users of our library.
|
||||
|
||||
Closures are usually short and relevant only within a narrow context rather
|
||||
than in any arbitrary scenario. Within these limited contexts, the compiler is
|
||||
reliably able to infer the types of the parameters and the return type, similar
|
||||
to how it’s able to infer the types of most variables.
|
||||
|
||||
Making programmers annotate the types in these small, anonymous functions would
|
||||
be annoying and largely redundant with the information the compiler already has
|
||||
available.
|
||||
|
||||
As with variables, we can add type annotations if we want to increase
|
||||
explicitness and clarity at the cost of being more verbose than is strictly
|
||||
necessary. Annotating the types for the closure we defined in Listing 13-5
|
||||
would look like the definition shown in Listing 13-7:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::thread;
|
||||
# use std::time::Duration;
|
||||
#
|
||||
let expensive_closure = |num: u32| -> u32 {
|
||||
println!("calculating slowly...");
|
||||
thread::sleep(Duration::from_secs(2));
|
||||
num
|
||||
};
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-7: Adding optional type annotations of the
|
||||
parameter and return value types in the closure</span>
|
||||
|
||||
With type annotations added, the syntax of closures looks more similar to the
|
||||
syntax of functions. The following is a vertical comparison of the syntax for
|
||||
the definition of a function that adds 1 to its parameter and a closure that
|
||||
has the same behavior. We’ve added some spaces to line up the relevant parts.
|
||||
This illustrates how closure syntax is similar to function syntax except for
|
||||
the use of pipes and the amount of syntax that is optional:
|
||||
|
||||
```rust,ignore
|
||||
fn add_one_v1 (x: u32) -> u32 { x + 1 }
|
||||
let add_one_v2 = |x: u32| -> u32 { x + 1 };
|
||||
let add_one_v3 = |x| { x + 1 };
|
||||
let add_one_v4 = |x| x + 1 ;
|
||||
```
|
||||
|
||||
The first line shows a function definition, and the second line shows a fully
|
||||
annotated closure definition. The third line removes the type annotations from
|
||||
the closure definition, and the fourth line removes the brackets, which are
|
||||
optional because the closure body has only one expression. These are all valid
|
||||
definitions that will produce the same behavior when they’re called.
|
||||
|
||||
Closure definitions will have one concrete type inferred for each of their
|
||||
parameters and for their return value. For instance, Listing 13-8 shows the
|
||||
definition of a short closure that just returns the value it receives as a
|
||||
parameter. This closure isn’t very useful except for the purposes of this
|
||||
example. Note that we haven’t added any type annotations to the definition: if
|
||||
we then try to call the closure twice, using a `String` as an argument the
|
||||
first time and a `u32` the second time, we’ll get an error.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
let example_closure = |x| x;
|
||||
|
||||
let s = example_closure(String::from("hello"));
|
||||
let n = example_closure(5);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-8: Attempting to call a closure whose types
|
||||
are inferred with two different types</span>
|
||||
|
||||
The compiler gives us this error:
|
||||
|
||||
```text
|
||||
error[E0308]: mismatched types
|
||||
--> src/main.rs
|
||||
|
|
||||
| let n = example_closure(5);
|
||||
| ^ expected struct `std::string::String`, found
|
||||
integral variable
|
||||
|
|
||||
= note: expected type `std::string::String`
|
||||
found type `{integer}`
|
||||
```
|
||||
|
||||
The first time we call `example_closure` with the `String` value, the compiler
|
||||
infers the type of `x` and the return type of the closure to be `String`. Those
|
||||
types are then locked in to the closure in `example_closure`, and we get a type
|
||||
error if we try to use a different type with the same closure.
|
||||
|
||||
### Storing Closures Using Generic Parameters and the `Fn` Traits
|
||||
|
||||
Let’s return to our workout generation app. In Listing 13-6, our code was still
|
||||
calling the expensive calculation closure more times than it needed to. One
|
||||
option to solve this issue is to save the result of the expensive closure in a
|
||||
variable for reuse and use the variable in each place we need the result,
|
||||
instead of calling the closure again. However, this method could result in a
|
||||
lot of repeated code.
|
||||
|
||||
Fortunately, another solution is available to us. We can create a struct that
|
||||
will hold the closure and the resulting value of calling the closure. The
|
||||
struct will execute the closure only if we need the resulting value, and it
|
||||
will cache the resulting value so the rest of our code doesn’t have to be
|
||||
responsible for saving and reusing the result. You may know this pattern as
|
||||
*memoization* or *lazy evaluation*.
|
||||
|
||||
To make a struct that holds a closure, we need to specify the type of the
|
||||
closure, because a struct definition needs to know the types of each of its
|
||||
fields. Each closure instance has its own unique anonymous type: that is, even
|
||||
if two closures have the same signature, their types are still considered
|
||||
different. To define structs, enums, or function parameters that use closures,
|
||||
we use generics and trait bounds, as we discussed in Chapter 10.
|
||||
|
||||
The `Fn` traits are provided by the standard library. All closures implement at
|
||||
least one of the traits: `Fn`, `FnMut`, or `FnOnce`. We’ll discuss the
|
||||
difference between these traits in the “Capturing the Environment with
|
||||
Closures” section; in this example, we can use the `Fn` trait.
|
||||
|
||||
We add types to the `Fn` trait bound to represent the types of the parameters
|
||||
and return values the closures must have to match this trait bound. In this
|
||||
case, our closure has a parameter of type `u32` and returns a `u32`, so the
|
||||
trait bound we specify is `Fn(u32) -> u32`.
|
||||
|
||||
Listing 13-9 shows the definition of the `Cacher` struct that holds a closure
|
||||
and an optional result value:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct Cacher<T>
|
||||
where T: Fn(u32) -> u32
|
||||
{
|
||||
calculation: T,
|
||||
value: Option<u32>,
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-9: Defining a `Cacher` struct that holds a
|
||||
closure in `calculation` and an optional result in `value`</span>
|
||||
|
||||
The `Cacher` struct has a `calculation` field of the generic type `T`. The
|
||||
trait bounds on `T` specify that it’s a closure by using the `Fn` trait. Any
|
||||
closure we want to store in the `calculation` field must have one `u32`
|
||||
parameter (specified within the parentheses after `Fn`) and must return a
|
||||
`u32` (specified after the `->`).
|
||||
|
||||
> Note: Functions implement all three of the `Fn` traits too. If what we want
|
||||
> to do doesn’t require capturing a value from the environment, we can use a
|
||||
> function rather than a closure where we need something that implements an `Fn`
|
||||
> trait.
|
||||
|
||||
The `value` field is of type `Option<u32>`. Before we execute the closure,
|
||||
`value` will be `None`. When code using a `Cacher` asks for the *result* of the
|
||||
closure, the `Cacher` will execute the closure at that time and store the
|
||||
result within a `Some` variant in the `value` field. Then if the code asks for
|
||||
the result of the closure again, instead of executing the closure again, the
|
||||
`Cacher` will return the result held in the `Some` variant.
|
||||
|
||||
The logic around the `value` field we’ve just described is defined in Listing
|
||||
13-10:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# struct Cacher<T>
|
||||
# where T: Fn(u32) -> u32
|
||||
# {
|
||||
# calculation: T,
|
||||
# value: Option<u32>,
|
||||
# }
|
||||
#
|
||||
impl<T> Cacher<T>
|
||||
where T: Fn(u32) -> u32
|
||||
{
|
||||
fn new(calculation: T) -> Cacher<T> {
|
||||
Cacher {
|
||||
calculation,
|
||||
value: None,
|
||||
}
|
||||
}
|
||||
|
||||
fn value(&mut self, arg: u32) -> u32 {
|
||||
match self.value {
|
||||
Some(v) => v,
|
||||
None => {
|
||||
let v = (self.calculation)(arg);
|
||||
self.value = Some(v);
|
||||
v
|
||||
},
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-10: The caching logic of `Cacher`</span>
|
||||
|
||||
We want `Cacher` to manage the struct fields’ values rather than letting the
|
||||
calling code potentially change the values in these fields directly, so these
|
||||
fields are private.
|
||||
|
||||
The `Cacher::new` function takes a generic parameter `T`, which we’ve defined
|
||||
as having the same trait bound as the `Cacher` struct. Then `Cacher::new`
|
||||
returns a `Cacher` instance that holds the closure specified in the
|
||||
`calculation` field and a `None` value in the `value` field, because we haven’t
|
||||
executed the closure yet.
|
||||
|
||||
When the calling code needs the result of evaluating the closure, instead of
|
||||
calling the closure directly, it will call the `value` method. This method
|
||||
checks whether we already have a resulting value in `self.value` in a `Some`;
|
||||
if we do, it returns the value within the `Some` without executing the closure
|
||||
again.
|
||||
|
||||
If `self.value` is `None`, the code calls the closure stored in
|
||||
`self.calculation`, saves the result in `self.value` for future use, and
|
||||
returns the value as well.
|
||||
|
||||
Listing 13-11 shows how we can use this `Cacher` struct in the function
|
||||
`generate_workout` from Listing 13-6:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::thread;
|
||||
# use std::time::Duration;
|
||||
#
|
||||
# struct Cacher<T>
|
||||
# where T: Fn(u32) -> u32
|
||||
# {
|
||||
# calculation: T,
|
||||
# value: Option<u32>,
|
||||
# }
|
||||
#
|
||||
# impl<T> Cacher<T>
|
||||
# where T: Fn(u32) -> u32
|
||||
# {
|
||||
# fn new(calculation: T) -> Cacher<T> {
|
||||
# Cacher {
|
||||
# calculation,
|
||||
# value: None,
|
||||
# }
|
||||
# }
|
||||
#
|
||||
# fn value(&mut self, arg: u32) -> u32 {
|
||||
# match self.value {
|
||||
# Some(v) => v,
|
||||
# None => {
|
||||
# let v = (self.calculation)(arg);
|
||||
# self.value = Some(v);
|
||||
# v
|
||||
# },
|
||||
# }
|
||||
# }
|
||||
# }
|
||||
#
|
||||
fn generate_workout(intensity: u32, random_number: u32) {
|
||||
let mut expensive_result = Cacher::new(|num| {
|
||||
println!("calculating slowly...");
|
||||
thread::sleep(Duration::from_secs(2));
|
||||
num
|
||||
});
|
||||
|
||||
if intensity < 25 {
|
||||
println!(
|
||||
"Today, do {} pushups!",
|
||||
expensive_result.value(intensity)
|
||||
);
|
||||
println!(
|
||||
"Next, do {} situps!",
|
||||
expensive_result.value(intensity)
|
||||
);
|
||||
} else {
|
||||
if random_number == 3 {
|
||||
println!("Take a break today! Remember to stay hydrated!");
|
||||
} else {
|
||||
println!(
|
||||
"Today, run for {} minutes!",
|
||||
expensive_result.value(intensity)
|
||||
);
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-11: Using `Cacher` in the `generate_workout`
|
||||
function to abstract away the caching logic</span>
|
||||
|
||||
Instead of saving the closure in a variable directly, we save a new instance of
|
||||
`Cacher` that holds the closure. Then, in each place we want the result, we
|
||||
call the `value` method on the `Cacher` instance. We can call the `value`
|
||||
method as many times as we want, or not call it at all, and the expensive
|
||||
calculation will be run a maximum of once.
|
||||
|
||||
Try running this program with the `main` function from Listing 13-2. Change the
|
||||
values in the `simulated_user_specified_value` and `simulated_random_number`
|
||||
variables to verify that in all the cases in the various `if` and `else`
|
||||
blocks, `calculating slowly...` appears only once and only when needed. The
|
||||
`Cacher` takes care of the logic necessary to ensure we aren’t calling the
|
||||
expensive calculation more than we need to so `generate_workout` can focus on
|
||||
the business logic.
|
||||
|
||||
### Limitations of the `Cacher` Implementation
|
||||
|
||||
Caching values is a generally useful behavior that we might want to use in
|
||||
other parts of our code with different closures. However, there are two
|
||||
problems with the current implementation of `Cacher` that would make reusing it
|
||||
in different contexts difficult.
|
||||
|
||||
The first problem is that a `Cacher` instance assumes it will always get the
|
||||
same value for the parameter `arg` to the `value` method. That is, this test of
|
||||
`Cacher` will fail:
|
||||
|
||||
```rust,ignore
|
||||
#[test]
|
||||
fn call_with_different_values() {
|
||||
let mut c = Cacher::new(|a| a);
|
||||
|
||||
let v1 = c.value(1);
|
||||
let v2 = c.value(2);
|
||||
|
||||
assert_eq!(v2, 2);
|
||||
}
|
||||
```
|
||||
|
||||
This test creates a new `Cacher` instance with a closure that returns the value
|
||||
passed into it. We call the `value` method on this `Cacher` instance with an
|
||||
`arg` value of 1 and then an `arg` value of 2, and we expect the call to
|
||||
`value` with the `arg` value of 2 should return 2.
|
||||
|
||||
Run this test with the `Cacher` implementation in Listing 13-9 and Listing
|
||||
13-10, and the test will fail on the `assert_eq!` with this message:
|
||||
|
||||
```text
|
||||
thread 'call_with_different_values' panicked at 'assertion failed: `(left == right)`
|
||||
left: `1`,
|
||||
right: `2`', src/main.rs
|
||||
```
|
||||
|
||||
The problem is that the first time we called `c.value` with 1, the `Cacher`
|
||||
instance saved `Some(1)` in `self.value`. Thereafter, no matter what we pass in
|
||||
to the `value` method, it will always return 1.
|
||||
|
||||
Try modifying `Cacher` to hold a hash map rather than a single value. The keys
|
||||
of the hash map will be the `arg` values that are passed in, and the values of
|
||||
the hash map will be the result of calling the closure on that key. Instead of
|
||||
looking at whether `self.value` directly has a `Some` or a `None` value, the
|
||||
`value` function will look up the `arg` in the hash map and return the value if
|
||||
it’s present. If it’s not present, the `Cacher` will call the closure and save
|
||||
the resulting value in the hash map associated with its `arg` value.
|
||||
|
||||
The second problem with the current `Cacher` implementation is that it only
|
||||
accepts closures that take one parameter of type `u32` and return a `u32`. We
|
||||
might want to cache the results of closures that take a string slice and return
|
||||
`usize` values, for example. To fix this issue, try introducing more generic
|
||||
parameters to increase the flexibility of the `Cacher` functionality.
|
||||
|
||||
### Capturing the Environment with Closures
|
||||
|
||||
In the workout generator example, we only used closures as inline anonymous
|
||||
functions. However, closures have an additional capability that functions don’t
|
||||
have: they can capture their environment and access variables from the scope in
|
||||
which they’re defined.
|
||||
|
||||
Listing 13-12 has an example of a closure stored in the `equal_to_x` variable
|
||||
that uses the `x` variable from the closure’s surrounding environment:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let x = 4;
|
||||
|
||||
let equal_to_x = |z| z == x;
|
||||
|
||||
let y = 4;
|
||||
|
||||
assert!(equal_to_x(y));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-12: Example of a closure that refers to a
|
||||
variable in its enclosing scope</span>
|
||||
|
||||
Here, even though `x` is not one of the parameters of `equal_to_x`, the
|
||||
`equal_to_x` closure is allowed to use the `x` variable that’s defined in the
|
||||
same scope that `equal_to_x` is defined in.
|
||||
|
||||
We can’t do the same with functions; if we try with the following example, our
|
||||
code won’t compile:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let x = 4;
|
||||
|
||||
fn equal_to_x(z: i32) -> bool { z == x }
|
||||
|
||||
let y = 4;
|
||||
|
||||
assert!(equal_to_x(y));
|
||||
}
|
||||
```
|
||||
|
||||
We get an error:
|
||||
|
||||
```text
|
||||
error[E0434]: can't capture dynamic environment in a fn item; use the || { ...
|
||||
} closure form instead
|
||||
--> src/main.rs
|
||||
|
|
||||
4 | fn equal_to_x(z: i32) -> bool { z == x }
|
||||
| ^
|
||||
```
|
||||
|
||||
The compiler even reminds us that this only works with closures!
|
||||
|
||||
When a closure captures a value from its environment, it uses memory to store
|
||||
the values for use in the closure body. This use of memory is overhead that we
|
||||
don’t want to pay in more common cases where we want to execute code that
|
||||
doesn’t capture its environment. Because functions are never allowed to capture
|
||||
their environment, defining and using functions will never incur this overhead.
|
||||
|
||||
Closures can capture values from their environment in three ways, which
|
||||
directly map to the three ways a function can take a parameter: taking
|
||||
ownership, borrowing mutably, and borrowing immutably. These are encoded in the
|
||||
three `Fn` traits as follows:
|
||||
|
||||
* `FnOnce` consumes the variables it captures from its enclosing scope, known
|
||||
as the closure’s *environment*. To consume the captured variables, the
|
||||
closure must take ownership of these variables and move them into the closure
|
||||
when it is defined. The `Once` part of the name represents the fact that the
|
||||
closure can’t take ownership of the same variables more than once, so it can
|
||||
be called only once.
|
||||
* `FnMut` can change the environment because it mutably borrows values.
|
||||
* `Fn` borrows values from the environment immutably.
|
||||
|
||||
When you create a closure, Rust infers which trait to use based on how the
|
||||
closure uses the values from the environment. All closures implement `FnOnce`
|
||||
because they can all be called at least once. Closures that don’t move the
|
||||
captured variables also implement `FnMut`, and closures that don’t need mutable
|
||||
access to the captured variables also implement `Fn`. In Listing 13-12, the
|
||||
`equal_to_x` closure borrows `x` immutably (so `equal_to_x` has the `Fn` trait)
|
||||
because the body of the closure only needs to read the value in `x`.
|
||||
|
||||
If you want to force the closure to take ownership of the values it uses in the
|
||||
environment, you can use the `move` keyword before the parameter list. This
|
||||
technique is mostly useful when passing a closure to a new thread to move the
|
||||
data so it’s owned by the new thread.
|
||||
|
||||
We’ll have more examples of `move` closures in Chapter 16 when we talk about
|
||||
concurrency. For now, here’s the code from Listing 13-12 with the `move`
|
||||
keyword added to the closure definition and using vectors instead of integers,
|
||||
because integers can be copied rather than moved; note that this code will not
|
||||
yet compile.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let x = vec![1, 2, 3];
|
||||
|
||||
let equal_to_x = move |z| z == x;
|
||||
|
||||
println!("can't use x here: {:?}", x);
|
||||
|
||||
let y = vec![1, 2, 3];
|
||||
|
||||
assert!(equal_to_x(y));
|
||||
}
|
||||
```
|
||||
|
||||
We receive the following error:
|
||||
|
||||
```text
|
||||
error[E0382]: use of moved value: `x`
|
||||
--> src/main.rs:6:40
|
||||
|
|
||||
4 | let equal_to_x = move |z| z == x;
|
||||
| -------- value moved (into closure) here
|
||||
5 |
|
||||
6 | println!("can't use x here: {:?}", x);
|
||||
| ^ value used here after move
|
||||
|
|
||||
= note: move occurs because `x` has type `std::vec::Vec<i32>`, which does not
|
||||
implement the `Copy` trait
|
||||
```
|
||||
|
||||
The `x` value is moved into the closure when the closure is defined, because we
|
||||
added the `move` keyword. The closure then has ownership of `x`, and `main`
|
||||
isn’t allowed to use `x` anymore in the `println!` statement. Removing
|
||||
`println!` will fix this example.
|
||||
|
||||
Most of the time when specifying one of the `Fn` trait bounds, you can start
|
||||
with `Fn` and the compiler will tell you if you need `FnMut` or `FnOnce` based
|
||||
on what happens in the closure body.
|
||||
|
||||
To illustrate situations where closures that can capture their environment are
|
||||
useful as function parameters, let’s move on to our next topic: iterators.
|
||||
482
2018-edition/src/ch13-02-iterators.md
Normal file
482
2018-edition/src/ch13-02-iterators.md
Normal file
@@ -0,0 +1,482 @@
|
||||
## Processing a Series of Items with Iterators
|
||||
|
||||
The iterator pattern allows you to perform some task on a sequence of items in
|
||||
turn. An iterator is responsible for the logic of iterating over each item and
|
||||
determining when the sequence has finished. When you use iterators, you don’t
|
||||
have to reimplement that logic yourself.
|
||||
|
||||
In Rust, iterators are *lazy*, meaning they have no effect until you call
|
||||
methods that consume the iterator to use it up. For example, the code in
|
||||
Listing 13-13 creates an iterator over the items in the vector `v1` by calling
|
||||
the `iter` method defined on `Vec`. This code by itself doesn’t do anything
|
||||
useful.
|
||||
|
||||
```rust
|
||||
let v1 = vec![1, 2, 3];
|
||||
|
||||
let v1_iter = v1.iter();
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-13: Creating an iterator</span>
|
||||
|
||||
Once we’ve created an iterator, we can use it in a variety of ways. In Listing
|
||||
3-5 in Chapter 3, we used iterators with `for` loops to execute some code on
|
||||
each item, although we glossed over what the call to `iter` did until now.
|
||||
|
||||
The example in Listing 13-14 separates the creation of the iterator from the
|
||||
use of the iterator in the `for` loop. The iterator is stored in the `v1_iter`
|
||||
variable, and no iteration takes place at that time. When the `for` loop is
|
||||
called using the iterator in `v1_iter`, each element in the iterator is used in
|
||||
one iteration of the loop, which prints out each value.
|
||||
|
||||
```rust
|
||||
let v1 = vec![1, 2, 3];
|
||||
|
||||
let v1_iter = v1.iter();
|
||||
|
||||
for val in v1_iter {
|
||||
println!("Got: {}", val);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-14: Using an iterator in a `for` loop</span>
|
||||
|
||||
In languages that don’t have iterators provided by their standard libraries,
|
||||
you would likely write this same functionality by starting a variable at index
|
||||
0, using that variable to index into the vector to get a value, and
|
||||
incrementing the variable value in a loop until it reached the total number of
|
||||
items in the vector.
|
||||
|
||||
Iterators handle all that logic for you, cutting down on repetitive code you
|
||||
could potentially mess up. Iterators give you more flexibility to use the same
|
||||
logic with many different kinds of sequences, not just data structures you can
|
||||
index into, like vectors. Let’s examine how iterators do that.
|
||||
|
||||
### The `Iterator` Trait and the `next` Method
|
||||
|
||||
All iterators implement a trait named `Iterator` that is defined in the
|
||||
standard library. The definition of the trait looks like this:
|
||||
|
||||
```rust
|
||||
trait Iterator {
|
||||
type Item;
|
||||
|
||||
fn next(&mut self) -> Option<Self::Item>;
|
||||
|
||||
// methods with default implementations elided
|
||||
}
|
||||
```
|
||||
|
||||
Notice this definition uses some new syntax: `type Item` and `Self::Item`,
|
||||
which are defining an *associated type* with this trait. We’ll talk about
|
||||
associated types in depth in Chapter 19. For now, all you need to know is that
|
||||
this code says implementing the `Iterator` trait requires that you also define
|
||||
an `Item` type, and this `Item` type is used in the return type of the `next`
|
||||
method. In other words, the `Item` type will be the type returned from the
|
||||
iterator.
|
||||
|
||||
The `Iterator` trait only requires implementors to define one method: the
|
||||
`next` method, which returns one item of the iterator at a time wrapped in
|
||||
`Some` and, when iteration is over, returns `None`.
|
||||
|
||||
We can call the `next` method on iterators directly; Listing 13-15 demonstrates
|
||||
what values are returned from repeated calls to `next` on the iterator created
|
||||
from the vector:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[test]
|
||||
fn iterator_demonstration() {
|
||||
let v1 = vec![1, 2, 3];
|
||||
|
||||
let mut v1_iter = v1.iter();
|
||||
|
||||
assert_eq!(v1_iter.next(), Some(&1));
|
||||
assert_eq!(v1_iter.next(), Some(&2));
|
||||
assert_eq!(v1_iter.next(), Some(&3));
|
||||
assert_eq!(v1_iter.next(), None);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-15: Calling the `next` method on an
|
||||
iterator</span>
|
||||
|
||||
Note that we needed to make `v1_iter` mutable: calling the `next` method on an
|
||||
iterator changes internal state that the iterator uses to keep track of where
|
||||
it is in the sequence. In other words, this code *consumes*, or uses up, the
|
||||
iterator. Each call to `next` eats up an item from the iterator. We didn’t need
|
||||
to make `v1_iter` mutable when we used a `for` loop because the loop took
|
||||
ownership of `v1_iter` and made it mutable behind the scenes.
|
||||
|
||||
Also note that the values we get from the calls to `next` are immutable
|
||||
references to the values in the vector. The `iter` method produces an iterator
|
||||
over immutable references. If we want to create an iterator that takes
|
||||
ownership of `v1` and returns owned values, we can call `into_iter` instead of
|
||||
`iter`. Similarly, if we want to iterate over mutable references, we can call
|
||||
`iter_mut` instead of `iter`.
|
||||
|
||||
### Methods that Consume the Iterator
|
||||
|
||||
The `Iterator` trait has a number of different methods with default
|
||||
implementations provided by the standard library; you can find out about these
|
||||
methods by looking in the standard library API documentation for the `Iterator`
|
||||
trait. Some of these methods call the `next` method in their definition, which
|
||||
is why you’re required to implement the `next` method when implementing the
|
||||
`Iterator` trait.
|
||||
|
||||
Methods that call `next` are called *consuming adaptors*, because calling them
|
||||
uses up the iterator. One example is the `sum` method, which takes ownership of
|
||||
the iterator and iterates through the items by repeatedly calling `next`, thus
|
||||
consuming the iterator. As it iterates through, it adds each item to a running
|
||||
total and returns the total when iteration is complete. Listing 13-16 has a
|
||||
test illustrating a use of the `sum` method:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[test]
|
||||
fn iterator_sum() {
|
||||
let v1 = vec![1, 2, 3];
|
||||
|
||||
let v1_iter = v1.iter();
|
||||
|
||||
let total: i32 = v1_iter.sum();
|
||||
|
||||
assert_eq!(total, 6);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-16: Calling the `sum` method to get the total
|
||||
of all items in the iterator</span>
|
||||
|
||||
We aren’t allowed to use `v1_iter` after the call to `sum` because `sum` takes
|
||||
ownership of the iterator we call it on.
|
||||
|
||||
### Methods that Produce Other Iterators
|
||||
|
||||
Other methods defined on the `Iterator` trait, known as *iterator adaptors*,
|
||||
allow you to change iterators into different kinds of iterators. You can chain
|
||||
multiple calls to iterator adaptors to perform complex actions in a readable
|
||||
way. But because all iterators are lazy, you have to call one of the consuming
|
||||
adaptor methods to get results from calls to iterator adaptors.
|
||||
|
||||
Listing 13-17 shows an example of calling the iterator adaptor method `map`,
|
||||
which takes a closure to call on each item to produce a new iterator. The
|
||||
closure here creates a new iterator in which each item from the vector has been
|
||||
incremented by 1. However, this code produces a warning:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
let v1: Vec<i32> = vec![1, 2, 3];
|
||||
|
||||
v1.iter().map(|x| x + 1);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-17: Calling the iterator adaptor `map` to
|
||||
create a new iterator</span>
|
||||
|
||||
The warning we get is this:
|
||||
|
||||
```text
|
||||
warning: unused `std::iter::Map` which must be used: iterator adaptors are lazy
|
||||
and do nothing unless consumed
|
||||
--> src/main.rs:4:5
|
||||
|
|
||||
4 | v1.iter().map(|x| x + 1);
|
||||
| ^^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
|
||||
= note: #[warn(unused_must_use)] on by default
|
||||
```
|
||||
|
||||
The code in Listing 13-17 doesn’t do anything; the closure we’ve specified
|
||||
never gets called. The warning reminds us why: iterator adaptors are lazy, and
|
||||
we need to consume the iterator here.
|
||||
|
||||
To fix this and consume the iterator, we’ll use the `collect` method, which we
|
||||
used in Chapter 12 with `env::args` in Listing 12-1. This method consumes the
|
||||
iterator and collects the resulting values into a collection data type.
|
||||
|
||||
In Listing 13-18, we collect the results of iterating over the iterator that’s
|
||||
returned from the call to `map` into a vector. This vector will end up
|
||||
containing each item from the original vector incremented by 1.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
let v1: Vec<i32> = vec![1, 2, 3];
|
||||
|
||||
let v2: Vec<_> = v1.iter().map(|x| x + 1).collect();
|
||||
|
||||
assert_eq!(v2, vec![2, 3, 4]);
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-18: Calling the `map` method to create a new
|
||||
iterator and then calling the `collect` method to consume the new iterator and
|
||||
create a vector</span>
|
||||
|
||||
Because `map` takes a closure, we can specify any operation we want to perform
|
||||
on each item. This is a great example of how closures let you customize some
|
||||
behavior while reusing the iteration behavior that the `Iterator` trait
|
||||
provides.
|
||||
|
||||
### Using Closures that Capture Their Environment
|
||||
|
||||
Now that we’ve introduced iterators, we can demonstrate a common use of
|
||||
closures that capture their environment by using the `filter` iterator adaptor.
|
||||
The `filter` method on an iterator takes a closure that takes each item from
|
||||
the iterator and returns a Boolean. If the closure returns `true`, the value
|
||||
will be included in the iterator produced by `filter`. If the closure returns
|
||||
`false`, the value won’t be included in the resulting iterator.
|
||||
|
||||
In Listing 13-19, we use `filter` with a closure that captures the `shoe_size`
|
||||
variable from its environment to iterate over a collection of `Shoe` struct
|
||||
instances. It will return only shoes that are the specified size.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[derive(PartialEq, Debug)]
|
||||
struct Shoe {
|
||||
size: u32,
|
||||
style: String,
|
||||
}
|
||||
|
||||
fn shoes_in_my_size(shoes: Vec<Shoe>, shoe_size: u32) -> Vec<Shoe> {
|
||||
shoes.into_iter()
|
||||
.filter(|s| s.size == shoe_size)
|
||||
.collect()
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn filters_by_size() {
|
||||
let shoes = vec![
|
||||
Shoe { size: 10, style: String::from("sneaker") },
|
||||
Shoe { size: 13, style: String::from("sandal") },
|
||||
Shoe { size: 10, style: String::from("boot") },
|
||||
];
|
||||
|
||||
let in_my_size = shoes_in_my_size(shoes, 10);
|
||||
|
||||
assert_eq!(
|
||||
in_my_size,
|
||||
vec![
|
||||
Shoe { size: 10, style: String::from("sneaker") },
|
||||
Shoe { size: 10, style: String::from("boot") },
|
||||
]
|
||||
);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-19: Using the `filter` method with a closure
|
||||
that captures `shoe_size`</span>
|
||||
|
||||
The `shoes_in_my_size` function takes ownership of a vector of shoes and a shoe
|
||||
size as parameters. It returns a vector containing only shoes of the specified
|
||||
size.
|
||||
|
||||
In the body of `shoes_in_my_size`, we call `into_iter` to create an iterator
|
||||
that takes ownership of the vector. Then we call `filter` to adapt that
|
||||
iterator into a new iterator that only contains elements for which the closure
|
||||
returns `true`.
|
||||
|
||||
The closure captures the `shoe_size` parameter from the environment and
|
||||
compares the value with each shoe’s size, keeping only shoes of the size
|
||||
specified. Finally, calling `collect` gathers the values returned by the
|
||||
adapted iterator into a vector that’s returned by the function.
|
||||
|
||||
The test shows that when we call `shoes_in_my_size`, we get back only shoes
|
||||
that have the same size as the value we specified.
|
||||
|
||||
### Creating Our Own Iterators with the `Iterator` Trait
|
||||
|
||||
We’ve shown that you can create an iterator by calling `iter`, `into_iter`, or
|
||||
`iter_mut` on a vector. You can create iterators from the other collection
|
||||
types in the standard library, such as hash map. You can also create iterators
|
||||
that do anything you want by implementing the `Iterator` trait on your own
|
||||
types. As previously mentioned, the only method you’re required to provide a
|
||||
definition for is the `next` method. Once you’ve done that, you can use all
|
||||
other methods that have default implementations provided by the `Iterator`
|
||||
trait!
|
||||
|
||||
To demonstrate, let’s create an iterator that will only ever count from 1 to 5.
|
||||
First, we’ll create a struct to hold some values. Then we’ll make this struct
|
||||
into an iterator by implementing the `Iterator` trait and using the values in
|
||||
that implementation.
|
||||
|
||||
Listing 13-20 has the definition of the `Counter` struct and an associated
|
||||
`new` function to create instances of `Counter`:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
struct Counter {
|
||||
count: u32,
|
||||
}
|
||||
|
||||
impl Counter {
|
||||
fn new() -> Counter {
|
||||
Counter { count: 0 }
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-20: Defining the `Counter` struct and a `new`
|
||||
function that creates instances of `Counter` with an initial value of 0 for
|
||||
`count`</span>
|
||||
|
||||
The `Counter` struct has one field named `count`. This field holds a `u32`
|
||||
value that will keep track of where we are in the process of iterating from 1
|
||||
to 5. The `count` field is private because we want the implementation of
|
||||
`Counter` to manage its value. The `new` function enforces the behavior of
|
||||
always starting new instances with a value of 0 in the `count` field.
|
||||
|
||||
Next, we’ll implement the `Iterator` trait for our `Counter` type by defining
|
||||
the body of the `next` method to specify what we want to happen when this
|
||||
iterator is used, as shown in Listing 13-21:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# struct Counter {
|
||||
# count: u32,
|
||||
# }
|
||||
#
|
||||
impl Iterator for Counter {
|
||||
type Item = u32;
|
||||
|
||||
fn next(&mut self) -> Option<Self::Item> {
|
||||
self.count += 1;
|
||||
|
||||
if self.count < 6 {
|
||||
Some(self.count)
|
||||
} else {
|
||||
None
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-21: Implementing the `Iterator` trait on our
|
||||
`Counter` struct</span>
|
||||
|
||||
We set the associated `Item` type for our iterator to `u32`, meaning the
|
||||
iterator will return `u32` values. Again, don’t worry about associated types
|
||||
yet, we’ll cover them in Chapter 19.
|
||||
|
||||
We want our iterator to add 1 to the current state, so we initialized `count`
|
||||
to 0 so it would return 1 first. If the value of `count` is less than 6, `next`
|
||||
will return the current value wrapped in `Some`, but if `count` is 6 or higher,
|
||||
our iterator will return `None`.
|
||||
|
||||
#### Using Our `Counter` Iterator’s `next` Method
|
||||
|
||||
Once we’ve implemented the `Iterator` trait, we have an iterator! Listing 13-22
|
||||
shows a test demonstrating that we can use the iterator functionality of our
|
||||
`Counter` struct by calling the `next` method on it directly, just as we did
|
||||
with the iterator created from a vector in Listing 13-15.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# struct Counter {
|
||||
# count: u32,
|
||||
# }
|
||||
#
|
||||
# impl Iterator for Counter {
|
||||
# type Item = u32;
|
||||
#
|
||||
# fn next(&mut self) -> Option<Self::Item> {
|
||||
# self.count += 1;
|
||||
#
|
||||
# if self.count < 6 {
|
||||
# Some(self.count)
|
||||
# } else {
|
||||
# None
|
||||
# }
|
||||
# }
|
||||
# }
|
||||
#
|
||||
#[test]
|
||||
fn calling_next_directly() {
|
||||
let mut counter = Counter::new();
|
||||
|
||||
assert_eq!(counter.next(), Some(1));
|
||||
assert_eq!(counter.next(), Some(2));
|
||||
assert_eq!(counter.next(), Some(3));
|
||||
assert_eq!(counter.next(), Some(4));
|
||||
assert_eq!(counter.next(), Some(5));
|
||||
assert_eq!(counter.next(), None);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-22: Testing the functionality of the `next`
|
||||
method implementation</span>
|
||||
|
||||
This test creates a new `Counter` instance in the `counter` variable and then
|
||||
calls `next` repeatedly, verifying that we have implemented the behavior we
|
||||
want this iterator to have: returning the values from 1 to 5.
|
||||
|
||||
#### Using Other `Iterator` Trait Methods
|
||||
|
||||
We implemented the `Iterator` trait by defining the `next` method, so we
|
||||
can now use any `Iterator` trait method’s default implementations as defined in
|
||||
the standard library, because they all use the `next` method’s functionality.
|
||||
|
||||
For example, if for some reason we wanted to take the values produced by an
|
||||
instance of `Counter`, pair them with values produced by another `Counter`
|
||||
instance after skipping the first value, multiply each pair together, keep only
|
||||
those results that are divisible by 3, and add all the resulting values
|
||||
together, we could do so, as shown in the test in Listing 13-23:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# struct Counter {
|
||||
# count: u32,
|
||||
# }
|
||||
#
|
||||
# impl Counter {
|
||||
# fn new() -> Counter {
|
||||
# Counter { count: 0 }
|
||||
# }
|
||||
# }
|
||||
#
|
||||
# impl Iterator for Counter {
|
||||
# // Our iterator will produce u32s
|
||||
# type Item = u32;
|
||||
#
|
||||
# fn next(&mut self) -> Option<Self::Item> {
|
||||
# // increment our count. This is why we started at zero.
|
||||
# self.count += 1;
|
||||
#
|
||||
# // check to see if we've finished counting or not.
|
||||
# if self.count < 6 {
|
||||
# Some(self.count)
|
||||
# } else {
|
||||
# None
|
||||
# }
|
||||
# }
|
||||
# }
|
||||
#
|
||||
#[test]
|
||||
fn using_other_iterator_trait_methods() {
|
||||
let sum: u32 = Counter::new().zip(Counter::new().skip(1))
|
||||
.map(|(a, b)| a * b)
|
||||
.filter(|x| x % 3 == 0)
|
||||
.sum();
|
||||
assert_eq!(18, sum);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-23: Using a variety of `Iterator` trait
|
||||
methods on our `Counter` iterator</span>
|
||||
|
||||
Note that `zip` produces only four pairs; the theoretical fifth pair `(5,
|
||||
None)` is never produced because `zip` returns `None` when either of its input
|
||||
iterators return `None`.
|
||||
|
||||
All of these method calls are possible because we specified how the `next`
|
||||
method works, and the standard library provides default implementations for
|
||||
other methods that call `next`.
|
||||
240
2018-edition/src/ch13-03-improving-our-io-project.md
Normal file
240
2018-edition/src/ch13-03-improving-our-io-project.md
Normal file
@@ -0,0 +1,240 @@
|
||||
## Improving Our I/O Project
|
||||
|
||||
With this new knowledge about iterators, we can improve the I/O project in
|
||||
Chapter 12 by using iterators to make places in the code clearer and more
|
||||
concise. Let’s look at how iterators can improve our implementation of the
|
||||
`Config::new` function and the `search` function.
|
||||
|
||||
|
||||
### Removing a `clone` Using an Iterator
|
||||
|
||||
In Listing 12-6, we added code that took a slice of `String` values and created
|
||||
an instance of the `Config` struct by indexing into the slice and cloning the
|
||||
values, allowing the `Config` struct to own those values. In Listing 13-24,
|
||||
we’ve reproduced the implementation of the `Config::new` function as it was in
|
||||
Listing 12-23:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
impl Config {
|
||||
pub fn new(args: &[String]) -> Result<Config, &'static str> {
|
||||
if args.len() < 3 {
|
||||
return Err("not enough arguments");
|
||||
}
|
||||
|
||||
let query = args[1].clone();
|
||||
let filename = args[2].clone();
|
||||
|
||||
let case_sensitive = env::var("CASE_INSENSITIVE").is_err();
|
||||
|
||||
Ok(Config { query, filename, case_sensitive })
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-24: Reproduction of the `Config::new` function
|
||||
from Listing 12-23</span>
|
||||
|
||||
At the time, we said not to worry about the inefficient `clone` calls because
|
||||
we would remove them in the future. Well, that time is now!
|
||||
|
||||
We needed `clone` here because we have a slice with `String` elements in the
|
||||
parameter `args`, but the `new` function doesn’t own `args`. To return
|
||||
ownership of a `Config` instance, we had to clone the values from the `query`
|
||||
and `filename` fields of `Config` so the `Config` instance can own its values.
|
||||
|
||||
With our new knowledge about iterators, we can change the `new` function to
|
||||
take ownership of an iterator as its argument instead of borrowing a slice.
|
||||
We’ll use the iterator functionality instead of the code that checks the length
|
||||
of the slice and indexes into specific locations. This will clarify what the
|
||||
`Config::new` function is doing because the iterator will access the values.
|
||||
|
||||
Once `Config::new` takes ownership of the iterator and stops using indexing
|
||||
operations that borrow, we can move the `String` values from the iterator into
|
||||
`Config` rather than calling `clone` and making a new allocation.
|
||||
|
||||
#### Using the Returned Iterator Directly
|
||||
|
||||
Open your I/O project’s *src/main.rs* file, which should look like this:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let args: Vec<String> = env::args().collect();
|
||||
|
||||
let config = Config::new(&args).unwrap_or_else(|err| {
|
||||
eprintln!("Problem parsing arguments: {}", err);
|
||||
process::exit(1);
|
||||
});
|
||||
|
||||
// --snip--
|
||||
}
|
||||
```
|
||||
|
||||
We’ll change the start of the `main` function that we had in Listing 12-24 at
|
||||
to the code in Listing 13-25. This won’t compile until we update `Config::new`
|
||||
as well.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let config = Config::new(env::args()).unwrap_or_else(|err| {
|
||||
eprintln!("Problem parsing arguments: {}", err);
|
||||
process::exit(1);
|
||||
});
|
||||
|
||||
// --snip--
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-25: Passing the return value of `env::args` to
|
||||
`Config::new`</span>
|
||||
|
||||
The `env::args` function returns an iterator! Rather than collecting the
|
||||
iterator values into a vector and then passing a slice to `Config::new`, now
|
||||
we’re passing ownership of the iterator returned from `env::args` to
|
||||
`Config::new` directly.
|
||||
|
||||
Next, we need to update the definition of `Config::new`. In your I/O project’s
|
||||
*src/lib.rs* file, let’s change the signature of `Config::new` to look like
|
||||
Listing 13-26. This still won’t compile because we need to update the function
|
||||
body.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
impl Config {
|
||||
pub fn new(mut args: std::env::Args) -> Result<Config, &'static str> {
|
||||
// --snip--
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-26: Updating the signature of `Config::new` to
|
||||
expect an iterator</span>
|
||||
|
||||
The standard library documentation for the `env::args` function shows that the
|
||||
type of the iterator it returns is `std::env::Args`. We’ve updated the
|
||||
signature of the `Config::new` function so the parameter `args` has the type
|
||||
`std::env::Args` instead of `&[String]`. Because we’re taking ownership of
|
||||
`args` and we’ll be mutating `args` by iterating over it, we can add the `mut`
|
||||
keyword into the specification of the `args` parameter to make it mutable.
|
||||
|
||||
#### Using `Iterator` Trait Methods Instead of Indexing
|
||||
|
||||
Next, we’ll fix the body of `Config::new`. The standard library documentation
|
||||
also mentions that `std::env::Args` implements the `Iterator` trait, so we know
|
||||
we can call the `next` method on it! Listing 13-27 updates the code from
|
||||
Listing 12-23 to use the `next` method:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
# use std::env;
|
||||
#
|
||||
# struct Config {
|
||||
# query: String,
|
||||
# filename: String,
|
||||
# case_sensitive: bool,
|
||||
# }
|
||||
#
|
||||
impl Config {
|
||||
pub fn new(mut args: std::env::Args) -> Result<Config, &'static str> {
|
||||
args.next();
|
||||
|
||||
let query = match args.next() {
|
||||
Some(arg) => arg,
|
||||
None => return Err("Didn't get a query string"),
|
||||
};
|
||||
|
||||
let filename = match args.next() {
|
||||
Some(arg) => arg,
|
||||
None => return Err("Didn't get a file name"),
|
||||
};
|
||||
|
||||
let case_sensitive = env::var("CASE_INSENSITIVE").is_err();
|
||||
|
||||
Ok(Config { query, filename, case_sensitive })
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-27: Changing the body of `Config::new` to use
|
||||
iterator methods</span>
|
||||
|
||||
Remember that the first value in the return value of `env::args` is the name of
|
||||
the program. We want to ignore that and get to the next value, so first we call
|
||||
`next` and do nothing with the return value. Second, we call `next` to get the
|
||||
value we want to put in the `query` field of `Config`. If `next` returns a
|
||||
`Some`, we use a `match` to extract the value. If it returns `None`, it means
|
||||
not enough arguments were given and we return early with an `Err` value. We do
|
||||
the same thing for the `filename` value.
|
||||
|
||||
### Making Code Clearer with Iterator Adaptors
|
||||
|
||||
We can also take advantage of iterators in the `search` function in our I/O
|
||||
project, which is reproduced here in Listing 13-28 as it was in Listing 12-19:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub fn search<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
let mut results = Vec::new();
|
||||
|
||||
for line in contents.lines() {
|
||||
if line.contains(query) {
|
||||
results.push(line);
|
||||
}
|
||||
}
|
||||
|
||||
results
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-28: The implementation of the `search`
|
||||
function from Listing 12-19</span>
|
||||
|
||||
We can write this code in a more concise way using iterator adaptor methods.
|
||||
Doing so also lets us avoid having a mutable intermediate `results` vector. The
|
||||
functional programming style prefers to minimize the amount of mutable state to
|
||||
make code clearer. Removing the mutable state might enable a future enhancement
|
||||
to make searching happen in parallel, because we wouldn’t have to manage
|
||||
concurrent access to the `results` vector. Listing 13-29 shows this change:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
pub fn search<'a>(query: &str, contents: &'a str) -> Vec<&'a str> {
|
||||
contents.lines()
|
||||
.filter(|line| line.contains(query))
|
||||
.collect()
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 13-29: Using iterator adaptor methods in the
|
||||
implementation of the `search` function</span>
|
||||
|
||||
Recall that the purpose of the `search` function is to return all lines in
|
||||
`contents` that contain the `query`. Similar to the `filter` example in Listing
|
||||
13-19, this code uses the `filter` adaptor to keep only the lines that
|
||||
`line.contains(query)` returns `true` for. We then collect the matching lines
|
||||
into another vector with `collect`. Much simpler! Feel free to make the same
|
||||
change to use iterator methods in the `search_case_insensitive` function as
|
||||
well.
|
||||
|
||||
The next logical question is which style you should choose in your own code and
|
||||
why: the original implementation in Listing 13-28 or the version using
|
||||
iterators in Listing 13-29. Most Rust programmers prefer to use the iterator
|
||||
style. It’s a bit tougher to get the hang of at first, but once you get a feel
|
||||
for the various iterator adaptors and what they do, iterators can be easier to
|
||||
understand. Instead of fiddling with the various bits of looping and building
|
||||
new vectors, the code focuses on the high-level objective of the loop. This
|
||||
abstracts away some of the commonplace code so it’s easier to see the concepts
|
||||
that are unique to this code, such as the filtering condition each element in
|
||||
the iterator must pass.
|
||||
|
||||
But are the two implementations truly equivalent? The intuitive assumption
|
||||
might be that the more low-level loop will be faster. Let’s talk about
|
||||
performance.
|
||||
94
2018-edition/src/ch13-04-performance.md
Normal file
94
2018-edition/src/ch13-04-performance.md
Normal file
@@ -0,0 +1,94 @@
|
||||
## Comparing Performance: Loops vs. Iterators
|
||||
|
||||
To determine whether to use loops or iterators, you need to know which version
|
||||
of our `search` functions is faster: the version with an explicit `for` loop or
|
||||
the version with iterators.
|
||||
|
||||
We ran a benchmark by loading the entire contents of *The Adventures of
|
||||
Sherlock Holmes* by Sir Arthur Conan Doyle into a `String` and looking for the
|
||||
word *the* in the contents. Here are the results of the benchmark on the
|
||||
version of `search` using the `for` loop and the version using iterators:
|
||||
|
||||
```text
|
||||
test bench_search_for ... bench: 19,620,300 ns/iter (+/- 915,700)
|
||||
test bench_search_iter ... bench: 19,234,900 ns/iter (+/- 657,200)
|
||||
```
|
||||
|
||||
The iterator version was slightly faster! We won’t explain the benchmark code
|
||||
here, because the point is not to prove that the two versions are equivalent
|
||||
but to get a general sense of how these two implementations compare
|
||||
performance-wise.
|
||||
|
||||
For a more comprehensive benchmark, you should check using various texts of
|
||||
various sizes as the `contents`, different words and words of different lengths
|
||||
as the `query`, and all kinds of other variations. The point is this:
|
||||
iterators, although a high-level abstraction, get compiled down to roughly the
|
||||
same code as if you’d written the lower-level code yourself. Iterators are one
|
||||
of Rust’s *zero-cost abstractions*, by which we mean using the abstraction
|
||||
imposes no additional runtime overhead. This is analogous to how Bjarne
|
||||
Stroustrup, the original designer and implementor of C++, defines
|
||||
*zero-overhead* in “Foundations of C++” (2012):
|
||||
|
||||
> In general, C++ implementations obey the zero-overhead principle: What you
|
||||
> don’t use, you don’t pay for. And further: What you do use, you couldn’t hand
|
||||
> code any better.
|
||||
|
||||
As another example, the following code is taken from an audio decoder. The
|
||||
decoding algorithm uses the linear prediction mathematical operation to
|
||||
estimate future values based on a linear function of the previous samples. This
|
||||
code uses an iterator chain to do some math on three variables in scope: a
|
||||
`buffer` slice of data, an array of 12 `coefficients`, and an amount by which
|
||||
to shift data in `qlp_shift`. We’ve declared the variables within this example
|
||||
but not given them any values; although this code doesn’t have much meaning
|
||||
outside of its context, it’s still a concise, real-world example of how Rust
|
||||
translates high-level ideas to low-level code.
|
||||
|
||||
```rust,ignore
|
||||
let buffer: &mut [i32];
|
||||
let coefficients: [i64; 12];
|
||||
let qlp_shift: i16;
|
||||
|
||||
for i in 12..buffer.len() {
|
||||
let prediction = coefficients.iter()
|
||||
.zip(&buffer[i - 12..i])
|
||||
.map(|(&c, &s)| c * s as i64)
|
||||
.sum::<i64>() >> qlp_shift;
|
||||
let delta = buffer[i];
|
||||
buffer[i] = prediction as i32 + delta;
|
||||
}
|
||||
```
|
||||
|
||||
To calculate the value of `prediction`, this code iterates through each of the
|
||||
12 values in `coefficients` and uses the `zip` method to pair the coefficient
|
||||
values with the previous 12 values in `buffer`. Then, for each pair, we
|
||||
multiply the values together, sum all the results, and shift the bits in the
|
||||
sum `qlp_shift` bits to the right.
|
||||
|
||||
Calculations in applications like audio decoders often prioritize performance
|
||||
most highly. Here, we’re creating an iterator, using two adaptors, and then
|
||||
consuming the value. What assembly code would this Rust code compile to? Well,
|
||||
as of this writing, it compiles down to the same assembly you’d write by hand.
|
||||
There’s no loop at all corresponding to the iteration over the values in
|
||||
`coefficients`: Rust knows that there are 12 iterations, so it “unrolls” the
|
||||
loop. *Unrolling* is an optimization that removes the overhead of the loop
|
||||
controlling code and instead generates repetitive code for each iteration of
|
||||
the loop.
|
||||
|
||||
All of the coefficients get stored in registers, which means accessing the
|
||||
values is very fast. There are no bounds checks on the array access at runtime.
|
||||
All these optimizations that Rust is able to apply make the resulting code
|
||||
extremely efficient. Now that you know this, you can use iterators and closures
|
||||
without fear! They make code seem like it’s higher level but don’t impose a
|
||||
runtime performance penalty for doing so.
|
||||
|
||||
## Summary
|
||||
|
||||
Closures and iterators are Rust features inspired by functional programming
|
||||
language ideas. They contribute to Rust’s capability to clearly express
|
||||
high-level ideas at low-level performance. The implementations of closures and
|
||||
iterators are such that runtime performance is not affected. This is part of
|
||||
Rust’s goal to strive to provide zero-cost abstractions.
|
||||
|
||||
Now that we’ve improved the expressiveness of our I/O project, let’s look at
|
||||
some more features of `cargo` that will help us share the project with the
|
||||
world.
|
||||
15
2018-edition/src/ch14-00-more-about-cargo.md
Normal file
15
2018-edition/src/ch14-00-more-about-cargo.md
Normal file
@@ -0,0 +1,15 @@
|
||||
# More About Cargo and Crates.io
|
||||
|
||||
So far we’ve used only the most basic features of Cargo to build, run, and test
|
||||
our code, but it can do a lot more. In this chapter, we’ll discuss some of its
|
||||
other, more advanced features to show you how to do the following:
|
||||
|
||||
* Customize your build through release profiles
|
||||
* Publish libraries on [crates.io](https://crates.io)<!-- ignore -->
|
||||
* Organize large projects with workspaces
|
||||
* Install binaries from [crates.io](https://crates.io)<!-- ignore -->
|
||||
* Extend Cargo using custom commands
|
||||
|
||||
Cargo can do even more than what we cover in this chapter, so for a full
|
||||
explanation of all its features, see [its
|
||||
documentation](https://doc.rust-lang.org/cargo/).
|
||||
69
2018-edition/src/ch14-01-release-profiles.md
Normal file
69
2018-edition/src/ch14-01-release-profiles.md
Normal file
@@ -0,0 +1,69 @@
|
||||
## Customizing Builds with Release Profiles
|
||||
|
||||
In Rust, *release profiles* are predefined and customizable profiles with
|
||||
different configurations that allow a programmer to have more control over
|
||||
various options for compiling code. Each profile is configured independently of
|
||||
the others.
|
||||
|
||||
Cargo has two main profiles: the `dev` profile Cargo uses when you run `cargo
|
||||
build` and the `release` profile Cargo uses when you run `cargo build
|
||||
--release`. The `dev` profile is defined with good defaults for development,
|
||||
and the `release` profile has good defaults for release builds.
|
||||
|
||||
These profile names might be familiar from the output of your builds:
|
||||
|
||||
```text
|
||||
$ cargo build
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
$ cargo build --release
|
||||
Finished release [optimized] target(s) in 0.0 secs
|
||||
```
|
||||
|
||||
The `dev` and `release` shown in this build output indicate that the compiler
|
||||
is using different profiles.
|
||||
|
||||
Cargo has default settings for each of the profiles that apply when there
|
||||
aren’t any `[profile.*]` sections in the project’s *Cargo.toml* file. By adding
|
||||
`[profile.*]` sections for any profile you want to customize, you can override
|
||||
any subset of the default settings. For example, here are the default values
|
||||
for the `opt-level` setting for the `dev` and `release` profiles:
|
||||
|
||||
<span class="filename">Filename: Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[profile.dev]
|
||||
opt-level = 0
|
||||
|
||||
[profile.release]
|
||||
opt-level = 3
|
||||
```
|
||||
|
||||
The `opt-level` setting controls the number of optimizations Rust will apply to
|
||||
your code, with a range of 0 to 3. Applying more optimizations extends
|
||||
compiling time, so if you’re in development and compiling your code often,
|
||||
you'll want faster compiling even if the resulting code runs slower. That is
|
||||
the reason the default `opt-level` for `dev` is `0`. When you’re ready to
|
||||
release your code, it’s best to spend more time compiling. You’ll only compile
|
||||
in release mode once, but you'll run the compiled program many times, so
|
||||
release mode trades longer compile time for code that runs faster. That is why
|
||||
the default `opt-level` for the `release` profile is `3`.
|
||||
|
||||
You can override any default setting by adding a different value for it in
|
||||
*Cargo.toml*. For example, if we want to use optimization level 1 in the
|
||||
development profile, we can add these two lines to our project’s *Cargo.toml*
|
||||
file:
|
||||
|
||||
<span class="filename">Filename: Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[profile.dev]
|
||||
opt-level = 1
|
||||
```
|
||||
|
||||
This code overrides the default setting of `0`. Now when we run `cargo build`,
|
||||
Cargo will use the defaults for the `dev` profile plus our customization to
|
||||
`opt-level`. Because we set `opt-level` to `1`, Cargo will apply more
|
||||
optimizations than the default, but not as many as in a release build.
|
||||
|
||||
For the full list of configuration options and defaults for each profile, see
|
||||
[Cargo’s documentation](https://doc.rust-lang.org/cargo/).
|
||||
516
2018-edition/src/ch14-02-publishing-to-crates-io.md
Normal file
516
2018-edition/src/ch14-02-publishing-to-crates-io.md
Normal file
@@ -0,0 +1,516 @@
|
||||
## Publishing a Crate to Crates.io
|
||||
|
||||
We’ve used packages from [crates.io](https://crates.io)<!-- ignore --> as
|
||||
dependencies of our project, but you can also share your code with other people
|
||||
by publishing your own packages. The crate registry at
|
||||
[crates.io](https://crates.io)<!-- ignore --> distributes the source code of
|
||||
your packages, so it primarily hosts code that is open source.
|
||||
|
||||
Rust and Cargo have features that help make your published package easier for
|
||||
people to use and to find in the first place. We’ll talk about some of these
|
||||
features next and then explain how to publish a package.
|
||||
|
||||
### Making Useful Documentation Comments
|
||||
|
||||
Accurately documenting your packages will help other users know how and when to
|
||||
use them, so it’s worth investing the time to write documentation. In Chapter
|
||||
3, we discussed how to comment Rust code using two slashes, `//`. Rust also has
|
||||
a particular kind of comment for documentation, known conveniently as a
|
||||
*documentation comment*, that will generate HTML documentation. The HTML
|
||||
displays the contents of documentation comments for public API items intended
|
||||
for programmers interested in knowing how to *use* your crate as opposed to how
|
||||
your crate is *implemented*.
|
||||
|
||||
Documentation comments use three slashes, `///`, instead of two and support
|
||||
Markdown notation for formatting the text. Place documentation comments just
|
||||
before the item they’re documenting. Listing 14-1 shows documentation comments
|
||||
for an `add_one` function in a crate named `my_crate`:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
/// Adds one to the number given.
|
||||
///
|
||||
/// # Examples
|
||||
///
|
||||
/// ```
|
||||
/// let five = 5;
|
||||
///
|
||||
/// assert_eq!(6, my_crate::add_one(5));
|
||||
/// ```
|
||||
pub fn add_one(x: i32) -> i32 {
|
||||
x + 1
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 14-1: A documentation comment for a
|
||||
function</span>
|
||||
|
||||
Here, we give a description of what the `add_one` function does, start a
|
||||
section with the heading `Examples`, and then provide code that demonstrates
|
||||
how to use the `add_one` function. We can generate the HTML documentation from
|
||||
this documentation comment by running `cargo doc`. This command runs the
|
||||
`rustdoc` tool distributed with Rust and puts the generated HTML documentation
|
||||
in the *target/doc* directory.
|
||||
|
||||
For convenience, running `cargo doc --open` will build the HTML for your
|
||||
current crate’s documentation (as well as the documentation for all of your
|
||||
crate’s dependencies) and open the result in a web browser. Navigate to the
|
||||
`add_one` function and you’ll see how the text in the documentation comments is
|
||||
rendered, as shown in Figure 14-1:
|
||||
|
||||
<img alt="Rendered HTML documentation for the `add_one` function of `my_crate`" src="img/trpl14-01.png" class="center" />
|
||||
|
||||
<span class="caption">Figure 14-1: HTML documentation for the `add_one`
|
||||
function</span>
|
||||
|
||||
#### Commonly Used Sections
|
||||
|
||||
We used the `# Examples` Markdown heading in Listing 14-1 to create a section
|
||||
in the HTML with the title “Examples.” Here are some other sections that crate
|
||||
authors commonly use in their documentation:
|
||||
|
||||
* **Panics**: The scenarios in which the function being documented could
|
||||
panic. Callers of the function who don’t want their programs to panic should
|
||||
make sure they don’t call the function in these situations.
|
||||
* **Errors**: If the function returns a `Result`, describing the kinds of
|
||||
errors that might occur and what conditions might cause those errors to be
|
||||
returned can be helpful to callers so they can write code to handle the
|
||||
different kinds of errors in different ways.
|
||||
* **Safety**: If the function is `unsafe` to call (we discuss unsafety in
|
||||
Chapter 19), there should be a section explaining why the function is unsafe
|
||||
and covering the invariants that the function expects callers to uphold.
|
||||
|
||||
Most documentation comments don’t need all of these sections, but this is a
|
||||
good checklist to remind you of the aspects of your code that people calling
|
||||
your code will be interested in knowing about.
|
||||
|
||||
#### Documentation Comments as Tests
|
||||
|
||||
Adding example code blocks in your documentation comments can help demonstrate
|
||||
how to use your library, and doing so has an additional bonus: running `cargo
|
||||
test` will run the code examples in your documentation as tests! Nothing is
|
||||
better than documentation with examples. But nothing is worse than examples
|
||||
that don’t work because the code has changed since the documentation was
|
||||
written. If we run `cargo test` with the documentation for the `add_one`
|
||||
function from Listing 14-1, we will see a section in the test results like this:
|
||||
|
||||
```text
|
||||
Doc-tests my_crate
|
||||
|
||||
running 1 test
|
||||
test src/lib.rs - add_one (line 5) ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
Now if we change either the function or the example so the `assert_eq!` in the
|
||||
example panics and run `cargo test` again, we’ll see that the doc tests catch
|
||||
that the example and the code are out of sync with each other!
|
||||
|
||||
#### Commenting Contained Items
|
||||
|
||||
Another style of doc comment, `//!`, adds documentation to the item that
|
||||
contains the comments rather than adding documentation to the items following
|
||||
the comments. We typically use these doc comments inside the crate root file
|
||||
(*src/lib.rs* by convention) or inside a module to document the crate or the
|
||||
module as a whole.
|
||||
|
||||
For example, if we want to add documentation that describes the purpose of the
|
||||
`my_crate` crate that contains the `add_one` function, we can add documentation
|
||||
comments that start with `//!` to the beginning of the *src/lib.rs* file, as
|
||||
shown in Listing 14-2:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
//! # My Crate
|
||||
//!
|
||||
//! `my_crate` is a collection of utilities to make performing certain
|
||||
//! calculations more convenient.
|
||||
|
||||
/// Adds one to the number given.
|
||||
// --snip--
|
||||
```
|
||||
|
||||
<span class="caption">Listing 14-2: Documentation for the `my_crate` crate as a
|
||||
whole</span>
|
||||
|
||||
Notice there isn’t any code after the last line that begins with `//!`. Because
|
||||
we started the comments with `//!` instead of `///`, we’re documenting the item
|
||||
that contains this comment rather than an item that follows this comment. In
|
||||
this case, the item that contains this comment is the *src/lib.rs* file, which
|
||||
is the crate root. These comments describe the entire crate.
|
||||
|
||||
When we run `cargo doc --open`, these comments will display on the front
|
||||
page of the documentation for `my_crate` above the list of public items in the
|
||||
crate, as shown in Figure 14-2:
|
||||
|
||||
<img alt="Rendered HTML documentation with a comment for the crate as a whole" src="img/trpl14-02.png" class="center" />
|
||||
|
||||
<span class="caption">Figure 14-2: Rendered documentation for `my_crate`,
|
||||
including the comment describing the crate as a whole</span>
|
||||
|
||||
Documentation comments within items are useful for describing crates and
|
||||
modules especially. Use them to explain the overall purpose of the container to
|
||||
help your users understand the crate's organization.
|
||||
|
||||
### Exporting a Convenient Public API with `pub use`
|
||||
|
||||
In Chapter 7, we covered how to organize our code into modules using the `mod`
|
||||
keyword, how to make items public using the `pub` keyword, and how to bring
|
||||
items into a scope with the `use` keyword. However, the structure that makes
|
||||
sense to you while you’re developing a crate might not be very convenient for
|
||||
your users. You might want to organize your structs in a hierarchy containing
|
||||
multiple levels, but then people who want to use a type you’ve defined deep in
|
||||
the hierarchy might have trouble finding out that type exists. They might also
|
||||
be annoyed at having to enter `use`
|
||||
`my_crate::some_module::another_module::UsefulType;` rather than `use`
|
||||
`my_crate::UsefulType;`.
|
||||
|
||||
The structure of your public API is a major consideration when publishing a
|
||||
crate. People who use your crate are less familiar with the structure than you
|
||||
are and might have difficulty finding the pieces they want to use if your crate
|
||||
has a large module hierarchy.
|
||||
|
||||
The good news is that if the structure *isn’t* convenient for others to use
|
||||
from another library, you don’t have to rearrange your internal organization:
|
||||
instead, you can re-export items to make a public structure that’s different
|
||||
from your private structure by using `pub use`. Re-exporting takes a public
|
||||
item in one location and makes it public in another location, as if it were
|
||||
defined in the other location instead.
|
||||
|
||||
For example, say we made a library named `art` for modeling artistic concepts.
|
||||
Within this library are two modules: a `kinds` module containing two enums
|
||||
named `PrimaryColor` and `SecondaryColor` and a `utils` module containing a
|
||||
function named `mix`, as shown in Listing 14-3:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
//! # Art
|
||||
//!
|
||||
//! A library for modeling artistic concepts.
|
||||
|
||||
pub mod kinds {
|
||||
/// The primary colors according to the RYB color model.
|
||||
pub enum PrimaryColor {
|
||||
Red,
|
||||
Yellow,
|
||||
Blue,
|
||||
}
|
||||
|
||||
/// The secondary colors according to the RYB color model.
|
||||
pub enum SecondaryColor {
|
||||
Orange,
|
||||
Green,
|
||||
Purple,
|
||||
}
|
||||
}
|
||||
|
||||
pub mod utils {
|
||||
use kinds::*;
|
||||
|
||||
/// Combines two primary colors in equal amounts to create
|
||||
/// a secondary color.
|
||||
pub fn mix(c1: PrimaryColor, c2: PrimaryColor) -> SecondaryColor {
|
||||
// --snip--
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 14-3: An `art` library with items organized into
|
||||
`kinds` and `utils` modules</span>
|
||||
|
||||
Figure 14-3 shows what the front page of the documentation for this crate
|
||||
generated by `cargo doc` would look like:
|
||||
|
||||
<img alt="Rendered documentation for the `art` crate that lists the `kinds` and `utils` modules" src="img/trpl14-03.png" class="center" />
|
||||
|
||||
<span class="caption">Figure 14-3: Front page of the documentation for `art`
|
||||
that lists the `kinds` and `utils` modules</span>
|
||||
|
||||
Note that the `PrimaryColor` and `SecondaryColor` types aren’t listed on the
|
||||
front page, nor is the `mix` function. We have to click `kinds` and `utils` to
|
||||
see them.
|
||||
|
||||
Another crate that depends on this library would need `use` statements that
|
||||
import the items from `art`, specifying the module structure that’s currently
|
||||
defined. Listing 14-4 shows an example of a crate that uses the `PrimaryColor`
|
||||
and `mix` items from the `art` crate:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate art;
|
||||
|
||||
use art::kinds::PrimaryColor;
|
||||
use art::utils::mix;
|
||||
|
||||
fn main() {
|
||||
let red = PrimaryColor::Red;
|
||||
let yellow = PrimaryColor::Yellow;
|
||||
mix(red, yellow);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 14-4: A crate using the `art` crate’s items with
|
||||
its internal structure exported</span>
|
||||
|
||||
The author of the code in Listing 14-4, which uses the `art` crate, had to
|
||||
figure out that `PrimaryColor` is in the `kinds` module and `mix` is in the
|
||||
`utils` module. The module structure of the `art` crate is more relevant to
|
||||
developers working on the `art` crate than to developers using the `art` crate.
|
||||
The internal structure that organizes parts of the crate into the `kinds`
|
||||
module and the `utils` module doesn’t contain any useful information for
|
||||
someone trying to understand how to use the `art` crate. Instead, the `art`
|
||||
crate’s module structure causes confusion because developers have to figure out
|
||||
where to look, and the structure is inconvenient because developers must
|
||||
specify the module names in the `use` statements.
|
||||
|
||||
To remove the internal organization from the public API, we can modify the
|
||||
`art` crate code in Listing 14-3 to add `pub use` statements to re-export the
|
||||
items at the top level, as shown in Listing 14-5:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
//! # Art
|
||||
//!
|
||||
//! A library for modeling artistic concepts.
|
||||
|
||||
pub use kinds::PrimaryColor;
|
||||
pub use kinds::SecondaryColor;
|
||||
pub use utils::mix;
|
||||
|
||||
pub mod kinds {
|
||||
// --snip--
|
||||
}
|
||||
|
||||
pub mod utils {
|
||||
// --snip--
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 14-5: Adding `pub use` statements to re-export
|
||||
items</span>
|
||||
|
||||
The API documentation that `cargo doc` generates for this crate will now list
|
||||
and link re-exports on the front page, as shown in Figure 14-4, making the
|
||||
`PrimaryColor` and `SecondaryColor` types and the `mix` function easier to find.
|
||||
|
||||
<img alt="Rendered documentation for the `art` crate with the re-exports on the front page" src="img/trpl14-04.png" class="center" />
|
||||
|
||||
<span class="caption">Figure 14-4: The front page of the documentation for `art`
|
||||
that lists the re-exports</span>
|
||||
|
||||
The `art` crate users can still see and use the internal structure from Listing
|
||||
14-3 as demonstrated in Listing 14-4, or they can use the more convenient
|
||||
structure in Listing 14-5, as shown in Listing 14-6:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate art;
|
||||
|
||||
use art::PrimaryColor;
|
||||
use art::mix;
|
||||
|
||||
fn main() {
|
||||
// --snip--
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 14-6: A program using the re-exported items from
|
||||
the `art` crate</span>
|
||||
|
||||
In cases where there are many nested modules, re-exporting the types at the top
|
||||
level with `pub use` can make a significant difference in the experience of
|
||||
people who use the crate.
|
||||
|
||||
Creating a useful public API structure is more of an art than a science, and
|
||||
you can iterate to find the API that works best for your users. Choosing `pub
|
||||
use` gives you flexibility in how you structure your crate internally and
|
||||
decouples that internal structure from what you present to your users. Look at
|
||||
some of the code of crates you’ve installed to see if their internal structure
|
||||
differs from their public API.
|
||||
|
||||
### Setting Up a Crates.io Account
|
||||
|
||||
Before you can publish any crates, you need to create an account on
|
||||
[crates.io](https://crates.io)<!-- ignore --> and get an API token. To do so,
|
||||
visit the home page at [crates.io](https://crates.io)<!-- ignore --> and log in
|
||||
via a GitHub account. (The GitHub account is currently a requirement, but the
|
||||
site might support other ways of creating an account in the future.) Once
|
||||
you’re logged in, visit your account settings at
|
||||
[https://crates.io/me/](https://crates.io/me/)<!-- ignore --> and retrieve your
|
||||
API key. Then run the `cargo login` command with your API key, like this:
|
||||
|
||||
```text
|
||||
$ cargo login abcdefghijklmnopqrstuvwxyz012345
|
||||
```
|
||||
|
||||
This command will inform Cargo of your API token and store it locally in
|
||||
*~/.cargo/credentials*. Note that this token is a *secret*: do not share it
|
||||
with anyone else. If you do share it with anyone for any reason, you should
|
||||
revoke it and generate a new token on [crates.io](https://crates.io)<!-- ignore
|
||||
-->.
|
||||
|
||||
### Adding Metadata to a New Crate
|
||||
|
||||
Now that you have an account, let’s say you have a crate you want to publish.
|
||||
Before publishing, you’ll need to add some metadata to your crate by adding it
|
||||
to the `[package]` section of the crate’s *Cargo.toml* file.
|
||||
|
||||
Your crate will need a unique name. While you’re working on a crate locally,
|
||||
you can name a crate whatever you’d like. However, crate names on
|
||||
[crates.io](https://crates.io)<!-- ignore --> are allocated on a first-come,
|
||||
first-served basis. Once a crate name is taken, no one else can publish a crate
|
||||
with that name. Search for the name you want to use on the site to find out
|
||||
whether it has been used. If it hasn’t, edit the name in the *Cargo.toml* file
|
||||
under `[package]` to use the name for publishing, like so:
|
||||
|
||||
<span class="filename">Filename: Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[package]
|
||||
name = "guessing_game"
|
||||
```
|
||||
|
||||
Even if you’ve chosen a unique name, when you run `cargo publish` to publish
|
||||
the crate at this point, you’ll get a warning and then an error:
|
||||
|
||||
```text
|
||||
$ cargo publish
|
||||
Updating registry `https://github.com/rust-lang/crates.io-index`
|
||||
warning: manifest has no description, license, license-file, documentation,
|
||||
homepage or repository.
|
||||
--snip--
|
||||
error: api errors: missing or empty metadata fields: description, license.
|
||||
```
|
||||
|
||||
The reason is that you’re missing some crucial information: a description and
|
||||
license are required so people will know what your crate does and under what
|
||||
terms they can use it. To rectify this error, you need to include this
|
||||
information in the *Cargo.toml* file.
|
||||
|
||||
Add a description that is just a sentence or two, because it will appear with
|
||||
your crate in search results. For the `license` field, you need to give a
|
||||
*license identifier value*. The [Linux Foundation’s Software Package Data
|
||||
Exchange (SPDX)][spdx] lists the identifiers you can use for this value. For
|
||||
example, to specify that you’ve licensed your crate using the MIT License, add
|
||||
the `MIT` identifier:
|
||||
|
||||
[spdx]: http://spdx.org/licenses/
|
||||
|
||||
<span class="filename">Filename: Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[package]
|
||||
name = "guessing_game"
|
||||
license = "MIT"
|
||||
```
|
||||
|
||||
If you want to use a license that doesn’t appear in the SPDX, you need to place
|
||||
the text of that license in a file, include the file in your project, and then
|
||||
use `license-file` to specify the name of that file instead of using the
|
||||
`license` key.
|
||||
|
||||
Guidance on which license is appropriate for your project is beyond the scope
|
||||
of this book. Many people in the Rust community license their projects in the
|
||||
same way as Rust by using a dual license of `MIT OR Apache-2.0`. This practice
|
||||
demonstrates that you can also specify multiple license identifiers separated
|
||||
by `OR` to have multiple licenses for your project.
|
||||
|
||||
With a unique name, the version, the author details that `cargo new` added
|
||||
when you created the crate, your description, and a license added, the
|
||||
*Cargo.toml* file for a project that is ready to publish might look like this:
|
||||
|
||||
<span class="filename">Filename: Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[package]
|
||||
name = "guessing_game"
|
||||
version = "0.1.0"
|
||||
authors = ["Your Name <you@example.com>"]
|
||||
description = "A fun game where you guess what number the computer has chosen."
|
||||
license = "MIT OR Apache-2.0"
|
||||
|
||||
[dependencies]
|
||||
```
|
||||
|
||||
[Cargo’s documentation](https://doc.rust-lang.org/cargo/) describes other
|
||||
metadata you can specify to ensure others can discover and use your crate more
|
||||
easily.
|
||||
|
||||
### Publishing to Crates.io
|
||||
|
||||
Now that you’ve created an account, saved your API token, chosen a name for
|
||||
your crate, and specified the required metadata, you’re ready to publish!
|
||||
Publishing a crate uploads a specific version to
|
||||
[crates.io](https://crates.io)<!-- ignore --> for others to use.
|
||||
|
||||
Be careful when publishing a crate because a publish is *permanent*. The
|
||||
version can never be overwritten, and the code cannot be deleted. One major
|
||||
goal of [crates.io](https://crates.io)<!-- ignore --> is to act as a permanent
|
||||
archive of code so that builds of all projects that depend on crates from
|
||||
[crates.io](https://crates.io)<!-- ignore --> will continue to work. Allowing
|
||||
version deletions would make fulfilling that goal impossible. However, there is
|
||||
no limit to the number of crate versions you can publish.
|
||||
|
||||
Run the `cargo publish` command again. It should succeed now:
|
||||
|
||||
```text
|
||||
$ cargo publish
|
||||
Updating registry `https://github.com/rust-lang/crates.io-index`
|
||||
Packaging guessing_game v0.1.0 (file:///projects/guessing_game)
|
||||
Verifying guessing_game v0.1.0 (file:///projects/guessing_game)
|
||||
Compiling guessing_game v0.1.0
|
||||
(file:///projects/guessing_game/target/package/guessing_game-0.1.0)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.19 secs
|
||||
Uploading guessing_game v0.1.0 (file:///projects/guessing_game)
|
||||
```
|
||||
|
||||
Congratulations! You’ve now shared your code with the Rust community, and
|
||||
anyone can easily add your crate as a dependency of their project.
|
||||
|
||||
### Publishing a New Version of an Existing Crate
|
||||
|
||||
When you’ve made changes to your crate and are ready to release a new version,
|
||||
you change the `version` value specified in your *Cargo.toml* file and
|
||||
republish. Use the [Semantic Versioning rules][semver] to decide what an
|
||||
appropriate next version number is based on the kinds of changes you’ve made.
|
||||
Then run `cargo publish` to upload the new version.
|
||||
|
||||
[semver]: http://semver.org/
|
||||
|
||||
### Removing Versions from Crates.io with `cargo yank`
|
||||
|
||||
Although you can’t remove previous versions of a crate, you can prevent any
|
||||
future projects from adding them as a new dependency. This is useful when a
|
||||
crate version is broken for one reason or another. In such situations, Cargo
|
||||
supports *yanking* a crate version.
|
||||
|
||||
Yanking a version prevents new projects from starting to depend on that version
|
||||
while allowing all existing projects that depend on it to continue to download
|
||||
and depend on that version. Essentially, a yank means that all projects with a
|
||||
*Cargo.lock* will not break, and any future *Cargo.lock* files generated will
|
||||
not use the yanked version.
|
||||
|
||||
To yank a version of a crate, run `cargo yank` and specify which version you
|
||||
want to yank:
|
||||
|
||||
```text
|
||||
$ cargo yank --vers 1.0.1
|
||||
```
|
||||
|
||||
By adding `--undo` to the command, you can also undo a yank and allow projects
|
||||
to start depending on a version again:
|
||||
|
||||
```text
|
||||
$ cargo yank --vers 1.0.1 --undo
|
||||
```
|
||||
|
||||
A yank *does not* delete any code. For example, the yank feature is not
|
||||
intended for deleting accidentally uploaded secrets. If that happens, you must
|
||||
reset those secrets immediately.
|
||||
336
2018-edition/src/ch14-03-cargo-workspaces.md
Normal file
336
2018-edition/src/ch14-03-cargo-workspaces.md
Normal file
@@ -0,0 +1,336 @@
|
||||
## Cargo Workspaces
|
||||
|
||||
In Chapter 12, we built a package that included a binary crate and a library
|
||||
crate. As your project develops, you might find that the library crate
|
||||
continues to get bigger and you want to split up your package further into
|
||||
multiple library crates. In this situation, Cargo offers a feature called
|
||||
*workspaces* that can help manage multiple related packages that are developed
|
||||
in tandem.
|
||||
|
||||
### Creating a Workspace
|
||||
|
||||
A *workspace* is a set of packages that share the same *Cargo.lock* and output
|
||||
directory. Let’s make a project using a workspace—we’ll use trivial code so we
|
||||
can concentrate on the structure of the workspace. There are multiple ways to
|
||||
structure a workspace; we’re going to show one common way. We’ll have a
|
||||
workspace containing a binary and two libraries. The binary, which will provide
|
||||
the main functionality, will depend on the two libraries. One library will
|
||||
provide an `add_one` function, and a second library an `add_two` function.
|
||||
These three crates will be part of the same workspace. We’ll start by creating
|
||||
a new directory for the workspace:
|
||||
|
||||
```text
|
||||
$ mkdir add
|
||||
$ cd add
|
||||
```
|
||||
|
||||
Next, in the *add* directory, we create the *Cargo.toml* file that will
|
||||
configure the entire workspace. This file won’t have a `[package]` section or
|
||||
the metadata we’ve seen in other *Cargo.toml* files. Instead, it will start
|
||||
with a `[workspace]` section that will allow us to add members to the workspace
|
||||
by specifying the path to our binary crate; in this case, that path is *adder*:
|
||||
|
||||
<span class="filename">Filename: Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[workspace]
|
||||
|
||||
members = [
|
||||
"adder",
|
||||
]
|
||||
```
|
||||
|
||||
Next, we’ll create the `adder` binary crate by running `cargo new` within the
|
||||
*add* directory:
|
||||
|
||||
```text
|
||||
$ cargo new --bin adder
|
||||
Created binary (application) `adder` project
|
||||
```
|
||||
|
||||
At this point, we can build the workspace by running `cargo build`. The files
|
||||
in your *add* directory should look like this:
|
||||
|
||||
```text
|
||||
├── Cargo.lock
|
||||
├── Cargo.toml
|
||||
├── adder
|
||||
│ ├── Cargo.toml
|
||||
│ └── src
|
||||
│ └── main.rs
|
||||
└── target
|
||||
```
|
||||
|
||||
The workspace has one *target* directory at the top level for the compiled
|
||||
artifacts to be placed into; the `adder` crate doesn’t have its own *target*
|
||||
directory. Even if we were to run `cargo build` from inside the *adder*
|
||||
directory, the compiled artifacts would still end up in *add/target* rather
|
||||
than *add/adder/target*. Cargo structures the *target* directory in a workspace
|
||||
like this because the crates in a workspace are meant to depend on each other.
|
||||
If each crate had its own *target* directory, each crate would have to
|
||||
recompile each of the other crates in the workspace to have the artifacts in
|
||||
its own *target* directory. By sharing one *target* directory, the crates can
|
||||
avoid unnecessary rebuilding.
|
||||
|
||||
### Creating the Second Crate in the Workspace
|
||||
|
||||
Next, let’s create another member crate in the workspace and call it `add-one`.
|
||||
Change the top-level *Cargo.toml* to specify the *add-one* path in the
|
||||
`members` list:
|
||||
|
||||
<span class="filename">Filename: Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[workspace]
|
||||
|
||||
members = [
|
||||
"adder",
|
||||
"add-one",
|
||||
]
|
||||
```
|
||||
|
||||
Then generate a new library crate named `add-one`:
|
||||
|
||||
```text
|
||||
$ cargo new add-one
|
||||
Created library `add-one` project
|
||||
```
|
||||
|
||||
Your *add* directory should now have these directories and files:
|
||||
|
||||
```text
|
||||
├── Cargo.lock
|
||||
├── Cargo.toml
|
||||
├── add-one
|
||||
│ ├── Cargo.toml
|
||||
│ └── src
|
||||
│ └── lib.rs
|
||||
├── adder
|
||||
│ ├── Cargo.toml
|
||||
│ └── src
|
||||
│ └── main.rs
|
||||
└── target
|
||||
```
|
||||
|
||||
In the *add-one/src/lib.rs* file, let’s add an `add_one` function:
|
||||
|
||||
<span class="filename">Filename: add-one/src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub fn add_one(x: i32) -> i32 {
|
||||
x + 1
|
||||
}
|
||||
```
|
||||
|
||||
Now that we have a library crate in the workspace, we can have the binary crate
|
||||
`adder` depend on the library crate `add-one`. First, we’ll need to add a path
|
||||
dependency on `add-one` to *adder/Cargo.toml*.
|
||||
|
||||
<span class="filename">Filename: adder/Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[dependencies]
|
||||
|
||||
add-one = { path = "../add-one" }
|
||||
```
|
||||
|
||||
Cargo doesn’t assume that crates in a workspace will depend on each other, so
|
||||
we need to be explicit about the dependency relationships between the crates.
|
||||
|
||||
Next, let’s use the `add_one` function from the `add-one` crate in the `adder`
|
||||
crate. Open the *adder/src/main.rs* file and add an `extern crate` line at
|
||||
the top to bring the new `add-one` library crate into scope. Then change the
|
||||
`main` function to call the `add_one` function, as in Listing 14-7:
|
||||
|
||||
<span class="filename">Filename: adder/src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
extern crate add_one;
|
||||
|
||||
fn main() {
|
||||
let num = 10;
|
||||
println!("Hello, world! {} plus one is {}!", num, add_one::add_one(num));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 14-7: Using the `add-one` library crate from the
|
||||
`adder` crate</span>
|
||||
|
||||
Let’s build the workspace by running `cargo build` in the top-level *add*
|
||||
directory!
|
||||
|
||||
```text
|
||||
$ cargo build
|
||||
Compiling add-one v0.1.0 (file:///projects/add/add-one)
|
||||
Compiling adder v0.1.0 (file:///projects/add/adder)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.68 secs
|
||||
```
|
||||
|
||||
To run the binary crate from the *add* directory, we need to specify which
|
||||
package in the workspace we want to use by using the `-p` argument and the
|
||||
package name with `cargo run`:
|
||||
|
||||
```text
|
||||
$ cargo run -p adder
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running `target/debug/adder`
|
||||
Hello, world! 10 plus one is 11!
|
||||
```
|
||||
|
||||
This runs the code in *adder/src/main.rs*, which depends on the `add-one` crate.
|
||||
|
||||
#### Depending on an External Crate in a Workspace
|
||||
|
||||
Notice that the workspace has only one *Cargo.lock* file at the top level of
|
||||
the workspace rather than having a *Cargo.lock* in each crate’s directory. This
|
||||
ensures that all crates are using the same version of all dependencies. If we
|
||||
add the `rand` crate to the *adder/Cargo.toml* and *add-one/Cargo.toml*
|
||||
files, Cargo will resolve both of those to one version of `rand` and record
|
||||
that in the one *Cargo.lock*. Making all crates in the workspace use the same
|
||||
dependencies means the crates in the workspace will always be compatible with
|
||||
each other. Let’s add the `rand` crate to the `[dependencies]` section in the
|
||||
*add-one/Cargo.toml* file to be able to use the `rand` crate in the `add-one`
|
||||
crate:
|
||||
|
||||
<span class="filename">Filename: add-one/Cargo.toml</span>
|
||||
|
||||
```toml
|
||||
[dependencies]
|
||||
|
||||
rand = "0.3.14"
|
||||
```
|
||||
|
||||
We can now add `extern crate rand;` to the *add-one/src/lib.rs* file, and
|
||||
building the whole workspace by running `cargo build` in the *add* directory
|
||||
will bring in and compile the `rand` crate:
|
||||
|
||||
```text
|
||||
$ cargo build
|
||||
Updating registry `https://github.com/rust-lang/crates.io-index`
|
||||
Downloading rand v0.3.14
|
||||
--snip--
|
||||
Compiling rand v0.3.14
|
||||
Compiling add-one v0.1.0 (file:///projects/add/add-one)
|
||||
Compiling adder v0.1.0 (file:///projects/add/adder)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 10.18 secs
|
||||
```
|
||||
|
||||
The top-level *Cargo.lock* now contains information about the dependency of
|
||||
`add-one` on `rand`. However, even though `rand` is used somewhere in the
|
||||
workspace, we can’t use it in other crates in the workspace unless we add
|
||||
`rand` to their *Cargo.toml* files as well. For example, if we add `extern
|
||||
crate rand;` to the *adder/src/main.rs* file for the `adder` crate, we’ll get
|
||||
an error:
|
||||
|
||||
```text
|
||||
$ cargo build
|
||||
Compiling adder v0.1.0 (file:///projects/add/adder)
|
||||
error: use of unstable library feature 'rand': use `rand` from crates.io (see
|
||||
issue #27703)
|
||||
--> adder/src/main.rs:1:1
|
||||
|
|
||||
1 | extern crate rand;
|
||||
```
|
||||
|
||||
To fix this, edit the *Cargo.toml* file for the `adder` crate and indicate that
|
||||
`rand` is a dependency for that crate as well. Building the `adder` crate will
|
||||
add `rand` to the list of dependencies for `adder` in *Cargo.lock*, but no
|
||||
additional copies of `rand` will be downloaded. Cargo has ensured that every
|
||||
crate in the workspace using the `rand` crate will be using the same version.
|
||||
Using the same version of `rand` across the workspace saves space because we
|
||||
won’t have multiple copies and ensures that the crates in the workspace will be
|
||||
compatible with each other.
|
||||
|
||||
#### Adding a Test to a Workspace
|
||||
|
||||
For another enhancement, let’s add a test of the `add_one::add_one` function
|
||||
within the `add_one` crate:
|
||||
|
||||
<span class="filename">Filename: add-one/src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub fn add_one(x: i32) -> i32 {
|
||||
x + 1
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
#[test]
|
||||
fn it_works() {
|
||||
assert_eq!(3, add_one(2));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
Now run `cargo test` in the top-level *add* directory:
|
||||
|
||||
```text
|
||||
$ cargo test
|
||||
Compiling add-one v0.1.0 (file:///projects/add/add-one)
|
||||
Compiling adder v0.1.0 (file:///projects/add/adder)
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.27 secs
|
||||
Running target/debug/deps/add_one-f0253159197f7841
|
||||
|
||||
running 1 test
|
||||
test tests::it_works ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Running target/debug/deps/adder-f88af9d2cc175a5e
|
||||
|
||||
running 0 tests
|
||||
|
||||
test result: ok. 0 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Doc-tests add-one
|
||||
|
||||
running 0 tests
|
||||
|
||||
test result: ok. 0 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
The first section of the output shows that the `it_works` test in the `add-one`
|
||||
crate passed. The next section shows that zero tests were found in the `adder`
|
||||
crate, and then the last section shows zero documentation tests were found in
|
||||
the `add-one` crate. Running `cargo test` in a workspace structured like this
|
||||
one will run the tests for all the crates in the workspace.
|
||||
|
||||
We can also run tests for one particular crate in a workspace from the
|
||||
top-level directory by using the `-p` flag and specifying the name of the crate
|
||||
we want to test:
|
||||
|
||||
```text
|
||||
$ cargo test -p add-one
|
||||
Finished dev [unoptimized + debuginfo] target(s) in 0.0 secs
|
||||
Running target/debug/deps/add_one-b3235fea9a156f74
|
||||
|
||||
running 1 test
|
||||
test tests::it_works ... ok
|
||||
|
||||
test result: ok. 1 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
|
||||
Doc-tests add-one
|
||||
|
||||
running 0 tests
|
||||
|
||||
test result: ok. 0 passed; 0 failed; 0 ignored; 0 measured; 0 filtered out
|
||||
```
|
||||
|
||||
This output shows `cargo test` only ran the tests for the `add-one` crate and
|
||||
didn’t run the `adder` crate tests.
|
||||
|
||||
If you publish the crates in the workspace to *https://crates.io/*, each crate
|
||||
in the workspace will need to be published separately. The `cargo publish`
|
||||
command does not have an `--all` flag or a `-p` flag, so you must change to
|
||||
each crate’s directory and run `cargo publish` on each crate in the workspace
|
||||
to publish the crates.
|
||||
|
||||
For additional practice, add an `add-two` crate to this workspace in a similar
|
||||
way as the `add-one` crate!
|
||||
|
||||
As your project grows, consider using a workspace: it’s easier to understand
|
||||
smaller, individual components than one big blob of code. Furthermore, keeping
|
||||
the crates in a workspace can make coordination between them easier if they are
|
||||
often changed at the same time.
|
||||
37
2018-edition/src/ch14-04-installing-binaries.md
Normal file
37
2018-edition/src/ch14-04-installing-binaries.md
Normal file
@@ -0,0 +1,37 @@
|
||||
## Installing Binaries from Crates.io with `cargo install`
|
||||
|
||||
The `cargo install` command allows you to install and use binary crates
|
||||
locally. This isn’t intended to replace system packages; it’s meant to be a
|
||||
convenient way for Rust developers to install tools that others have shared on
|
||||
[crates.io](https://crates.io)<!-- ignore -->. Note that you can only install
|
||||
packages that have binary targets. A *binary target* is the runnable program
|
||||
that is created if the crate has a *src/main.rs* file or another file specified
|
||||
as a binary, as opposed to a library target that isn’t runnable on its own but
|
||||
is suitable for including within other programs. Usually, crates have
|
||||
information in the *README* file about whether a crate is a library, has a
|
||||
binary target, or both.
|
||||
|
||||
All binaries installed with `cargo install` are stored in the installation
|
||||
root’s *bin* folder. If you installed Rust using *rustup.rs* and don’t have any
|
||||
custom configurations, this directory will be *$HOME/.cargo/bin*. Ensure that
|
||||
directory is in your `$PATH` to be able to run programs you’ve installed with
|
||||
`cargo install`.
|
||||
|
||||
For example, in Chapter 12 we mentioned that there’s a Rust implementation of
|
||||
the `grep` tool called `ripgrep` for searching files. If we want to install
|
||||
`ripgrep`, we can run the following:
|
||||
|
||||
```text
|
||||
$ cargo install ripgrep
|
||||
Updating registry `https://github.com/rust-lang/crates.io-index`
|
||||
Downloading ripgrep v0.3.2
|
||||
--snip--
|
||||
Compiling ripgrep v0.3.2
|
||||
Finished release [optimized + debuginfo] target(s) in 97.91 secs
|
||||
Installing ~/.cargo/bin/rg
|
||||
```
|
||||
|
||||
The last line of the output shows the location and the name of the installed
|
||||
binary, which in the case of `ripgrep` is `rg`. As long as the installation
|
||||
directory is in your `$PATH`, as mentioned previously, you can then run `rg
|
||||
--help` and start using a faster, rustier tool for searching files!
|
||||
17
2018-edition/src/ch14-05-extending-cargo.md
Normal file
17
2018-edition/src/ch14-05-extending-cargo.md
Normal file
@@ -0,0 +1,17 @@
|
||||
## Extending Cargo with Custom Commands
|
||||
|
||||
Cargo is designed so you can extend it with new subcommands without having to
|
||||
modify Cargo. If a binary in your `$PATH` is named `cargo-something`, you can
|
||||
run it as if it was a Cargo subcommand by running `cargo something`. Custom
|
||||
commands like this are also listed when you run `cargo --list`. Being able to
|
||||
use `cargo install` to install extensions and then run them just like the
|
||||
built-in Cargo tools is a super convenient benefit of Cargo’s design!
|
||||
|
||||
## Summary
|
||||
|
||||
Sharing code with Cargo and [crates.io](https://crates.io)<!-- ignore --> is
|
||||
part of what makes the Rust ecosystem useful for many different tasks. Rust’s
|
||||
standard library is small and stable, but crates are easy to share, use, and
|
||||
improve on a timeline different from that of the language. Don’t be shy about
|
||||
sharing code that’s useful to you on [crates.io](https://crates.io)<!-- ignore
|
||||
-->; it’s likely that it will be useful to someone else as well!
|
||||
56
2018-edition/src/ch15-00-smart-pointers.md
Normal file
56
2018-edition/src/ch15-00-smart-pointers.md
Normal file
@@ -0,0 +1,56 @@
|
||||
# Smart Pointers
|
||||
|
||||
A *pointer* is a general concept for a variable that contains an address in
|
||||
memory. This address refers to, or “points at,” some other data. The most
|
||||
common kind of pointer in Rust is a reference, which you learned about in
|
||||
Chapter 4. References are indicated by the `&` symbol and borrow the value they
|
||||
point to. They don’t have any special capabilities other than referring to
|
||||
data. Also, they don’t have any overhead and are the kind of pointer we use
|
||||
most often.
|
||||
|
||||
*Smart pointers*, on the other hand, are data structures that not only act like
|
||||
a pointer but also have additional metadata and capabilities. The concept of
|
||||
smart pointers isn’t unique to Rust: smart pointers originated in C++ and exist
|
||||
in other languages as well. In Rust, the different smart pointers defined in
|
||||
the standard library provide functionality beyond that provided by references.
|
||||
One example that we’ll explore in this chapter is the *reference counting*
|
||||
smart pointer type. This pointer enables you to have multiple owners of data by
|
||||
keeping track of the number of owners and, when no owners remain, cleaning up
|
||||
the data.
|
||||
|
||||
In Rust, which uses the concept of ownership and borrowing, an additional
|
||||
difference between references and smart pointers is that references are
|
||||
pointers that only borrow data; in contrast, in many cases, smart pointers
|
||||
*own* the data they point to.
|
||||
|
||||
We’ve already encountered a few smart pointers in this book, such as `String`
|
||||
and `Vec<T>` in Chapter 8, although we didn’t call them smart pointers at the
|
||||
time. Both these types count as smart pointers because they own some memory and
|
||||
allow you to manipulate it. They also have metadata (such as their capacity)
|
||||
and extra capabilities or guarantees (such as with `String` ensuring its data
|
||||
will always be valid UTF-8).
|
||||
|
||||
Smart pointers are usually implemented using structs. The characteristic that
|
||||
distinguishes a smart pointer from an ordinary struct is that smart pointers
|
||||
implement the `Deref` and `Drop` traits. The `Deref` trait allows an instance
|
||||
of the smart pointer struct to behave like a reference so you can write code
|
||||
that works with either references or smart pointers. The `Drop` trait allows
|
||||
you to customize the code that is run when an instance of the smart pointer
|
||||
goes out of scope. In this chapter, we’ll discuss both traits and demonstrate
|
||||
why they’re important to smart pointers.
|
||||
|
||||
Given that the smart pointer pattern is a general design pattern used
|
||||
frequently in Rust, this chapter won’t cover every existing smart pointer. Many
|
||||
libraries have their own smart pointers, and you can even write your own. We’ll
|
||||
cover the most common smart pointers in the standard library:
|
||||
|
||||
* `Box<T>` for allocating values on the heap
|
||||
* `Rc<T>`, a reference counting type that enables multiple ownership
|
||||
* `Ref<T>` and `RefMut<T>`, accessed through `RefCell<T>`, a type that enforces
|
||||
the borrowing rules at runtime instead of compile time
|
||||
|
||||
In addition, we’ll cover the *interior mutability* pattern where an immutable
|
||||
type exposes an API for mutating an interior value. We’ll also discuss
|
||||
*reference cycles*: how they can leak memory and how to prevent them.
|
||||
|
||||
Let’s dive in!
|
||||
280
2018-edition/src/ch15-01-box.md
Normal file
280
2018-edition/src/ch15-01-box.md
Normal file
@@ -0,0 +1,280 @@
|
||||
## Using `Box<T>` to Point to Data on the Heap
|
||||
|
||||
The most straightforward smart pointer is a *box*, whose type is written
|
||||
`Box<T>`. Boxes allow you to store data on the heap rather than the stack. What
|
||||
remains on the stack is the pointer to the heap data. Refer to Chapter 4 to
|
||||
review the difference between the stack and the heap.
|
||||
|
||||
Boxes don’t have performance overhead, other than storing their data on the
|
||||
heap instead of on the stack. But they don’t have many extra capabilities
|
||||
either. You’ll use them most often in these situations:
|
||||
|
||||
* When you have a type whose size can’t be known at compile time and you want
|
||||
to use a value of that type in a context that requires an exact size
|
||||
* When you have a large amount of data and you want to transfer ownership but
|
||||
ensure the data won’t be copied when you do so
|
||||
* When you want to own a value and you care only that it’s a type that
|
||||
implements a particular trait rather than being of a specific type
|
||||
|
||||
We’ll demonstrate the first situation in the “Enabling Recursive Types with
|
||||
Boxes” section. In the second case, transferring ownership of a large amount of
|
||||
data can take a long time because the data is copied around on the stack. To
|
||||
improve performance in this situation, we can store the large amount of data on
|
||||
the heap in a box. Then, only the small amount of pointer data is copied around
|
||||
on the stack, while the data it references stays in one place on the heap. The
|
||||
third case is known as a *trait object*, and Chapter 17 devotes an entire
|
||||
section, “Using Trait Objects That Allow for Values of Different Types,” just
|
||||
to that topic. So what you learn here you’ll apply again in Chapter 17!
|
||||
|
||||
### Using a `Box<T>` to Store Data on the Heap
|
||||
|
||||
Before we discuss this use case for `Box<T>`, we’ll cover the syntax and how to
|
||||
interact with values stored within a `Box<T>`.
|
||||
|
||||
Listing 15-1 shows how to use a box to store an `i32` value on the heap:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let b = Box::new(5);
|
||||
println!("b = {}", b);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-1: Storing an `i32` value on the heap using a
|
||||
box</span>
|
||||
|
||||
We define the variable `b` to have the value of a `Box` that points to the
|
||||
value `5`, which is allocated on the heap. This program will print `b = 5`; in
|
||||
this case, we can access the data in the box similar to how we would if this
|
||||
data were on the stack. Just like any owned value, when a box goes out of
|
||||
scope, as `b` does at the end of `main`, it will be deallocated. The
|
||||
deallocation happens for the box (stored on the stack) and the data it points
|
||||
to (stored on the heap).
|
||||
|
||||
Putting a single value on the heap isn’t very useful, so you won’t use boxes by
|
||||
themselves in this way very often. Having values like a single `i32` on the
|
||||
stack, where they’re stored by default, is more appropriate in the majority of
|
||||
situations. Let’s look at a case where boxes allow us to define types that we
|
||||
wouldn’t be allowed to if we didn’t have boxes.
|
||||
|
||||
### Enabling Recursive Types with Boxes
|
||||
|
||||
At compile time, Rust needs to know how much space a type takes up. One type
|
||||
whose size can’t be known at compile time is a *recursive type*, where a value
|
||||
can have as part of itself another value of the same type. Because this nesting
|
||||
of values could theoretically continue infinitely, Rust doesn’t know how much
|
||||
space a value of a recursive type needs. However, boxes have a known size, so
|
||||
by inserting a box in a recursive type definition, you can have recursive types.
|
||||
|
||||
Let’s explore the *cons list*, which is a data type common in functional
|
||||
programming languages, as an example of a recursive type. The cons list type
|
||||
we’ll define is straightforward except for the recursion; therefore, the
|
||||
concepts in the example we’ll work with will be useful any time you get into
|
||||
more complex situations involving recursive types.
|
||||
|
||||
#### More Information About the Cons List
|
||||
|
||||
A *cons list* is a data structure that comes from the Lisp programming language
|
||||
and its dialects. In Lisp, the `cons` function (short for “construct function”)
|
||||
constructs a new pair from its two arguments, which usually are a single value
|
||||
and another pair. These pairs containing pairs form a list.
|
||||
|
||||
The cons function concept has made its way into more general functional
|
||||
programming jargon: “to cons *x* onto *y*” informally means to construct a new
|
||||
container instance by putting the element *x* at the start of this new
|
||||
container, followed by the container *y*.
|
||||
|
||||
Each item in a cons list contains two elements: the value of the current item
|
||||
and the next item. The last item in the list contains only a value called `Nil`
|
||||
without a next item. A cons list is produced by recursively calling the `cons`
|
||||
function. The canonical name to denote the base case of the recursion is `Nil`.
|
||||
Note that this is not the same as the “null” or “nil” concept in Chapter 6,
|
||||
which is an invalid or absent value.
|
||||
|
||||
Although functional programming languages use cons lists frequently, the cons
|
||||
list isn’t a commonly used data structure in Rust. Most of the time when you
|
||||
have a list of items in Rust, `Vec<T>` is a better choice to use. Other, more
|
||||
complex recursive data types *are* useful in various situations, but by
|
||||
starting with the cons list, we can explore how boxes let us define a recursive
|
||||
data type without much distraction.
|
||||
|
||||
Listing 15-2 contains an enum definition for a cons list. Note that this code
|
||||
won’t compile yet because the `List` type doesn’t have a known size, which
|
||||
we’ll demonstrate.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
enum List {
|
||||
Cons(i32, List),
|
||||
Nil,
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-2: The first attempt at defining an enum to
|
||||
represent a cons list data structure of `i32` values</span>
|
||||
|
||||
> Note: We’re implementing a cons list that holds only `i32` values for the
|
||||
> purposes of this example. We could have implemented it using generics, as we
|
||||
> discussed in Chapter 10, to define a cons list type that could store values of
|
||||
> any type.
|
||||
|
||||
Using the `List` type to store the list `1, 2, 3` would look like the code in
|
||||
Listing 15-3:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use List::{Cons, Nil};
|
||||
|
||||
fn main() {
|
||||
let list = Cons(1, Cons(2, Cons(3, Nil)));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-3: Using the `List` enum to store the list `1,
|
||||
2, 3`</span>
|
||||
|
||||
The first `Cons` value holds `1` and another `List` value. This `List` value is
|
||||
another `Cons` value that holds `2` and another `List` value. This `List` value
|
||||
is one more `Cons` value that holds `3` and a `List` value, which is finally
|
||||
`Nil`, the non-recursive variant that signals the end of the list.
|
||||
|
||||
If we try to compile the code in Listing 15-3, we get the error shown in
|
||||
Listing 15-4:
|
||||
|
||||
```text
|
||||
error[E0072]: recursive type `List` has infinite size
|
||||
--> src/main.rs:1:1
|
||||
|
|
||||
1 | enum List {
|
||||
| ^^^^^^^^^ recursive type has infinite size
|
||||
2 | Cons(i32, List),
|
||||
| ----- recursive without indirection
|
||||
|
|
||||
= help: insert indirection (e.g., a `Box`, `Rc`, or `&`) at some point to
|
||||
make `List` representable
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-4: The error we get when attempting to define
|
||||
a recursive enum</span>
|
||||
|
||||
The error shows this type “has infinite size.” The reason is that we’ve defined
|
||||
`List` with a variant that is recursive: it holds another value of itself
|
||||
directly. As a result, Rust can’t figure out how much space it needs to store a
|
||||
`List` value. Let’s break down why we get this error a bit. First, let’s look
|
||||
at how Rust decides how much space it needs to store a value of a non-recursive
|
||||
type.
|
||||
|
||||
#### Computing the Size of a Non-Recursive Type
|
||||
|
||||
Recall the `Message` enum we defined in Listing 6-2 when we discussed enum
|
||||
definitions in Chapter 6:
|
||||
|
||||
```rust
|
||||
enum Message {
|
||||
Quit,
|
||||
Move { x: i32, y: i32 },
|
||||
Write(String),
|
||||
ChangeColor(i32, i32, i32),
|
||||
}
|
||||
```
|
||||
|
||||
To determine how much space to allocate for a `Message` value, Rust goes
|
||||
through each of the variants to see which variant needs the most space. Rust
|
||||
sees that `Message::Quit` doesn’t need any space, `Message::Move` needs enough
|
||||
space to store two `i32` values, and so forth. Because only one variant will be
|
||||
used, the most space a `Message` value will need is the space it would take to
|
||||
store the largest of its variants.
|
||||
|
||||
Contrast this with what happens when Rust tries to determine how much space a
|
||||
recursive type like the `List` enum in Listing 15-2 needs. The compiler starts
|
||||
by looking at the `Cons` variant, which holds a value of type `i32` and a value
|
||||
of type `List`. Therefore, `Cons` needs an amount of space equal to the size of
|
||||
an `i32` plus the size of a `List`. To figure out how much memory the `List`
|
||||
type needs, the compiler looks at the variants, starting with the `Cons`
|
||||
variant. The `Cons` variant holds a value of type `i32` and a value of type
|
||||
`List`, and this process continues infinitely, as shown in Figure 15-1.
|
||||
|
||||
<img alt="An infinite Cons list" src="img/trpl15-01.svg" class="center" style="width: 50%;" />
|
||||
|
||||
<span class="caption">Figure 15-1: An infinite `List` consisting of infinite
|
||||
`Cons` variants</span>
|
||||
|
||||
#### Using `Box<T>` to Get a Recursive Type with a Known Size
|
||||
|
||||
Rust can’t figure out how much space to allocate for recursively defined types,
|
||||
so the compiler gives the error in Listing 15-4. But the error does include
|
||||
this helpful suggestion:
|
||||
|
||||
```text
|
||||
= help: insert indirection (e.g., a `Box`, `Rc`, or `&`) at some point to
|
||||
make `List` representable
|
||||
```
|
||||
|
||||
In this suggestion, “indirection” means that instead of storing a value
|
||||
directly, we’ll change the data structure to store the value indirectly by
|
||||
storing a pointer to the value instead.
|
||||
|
||||
Because a `Box<T>` is a pointer, Rust always knows how much space a `Box<T>`
|
||||
needs: a pointer’s size doesn’t change based on the amount of data it’s
|
||||
pointing to. This means we can put a `Box<T>` inside the `Cons` variant instead
|
||||
of another `List` value directly. The `Box<T>` will point to the next `List`
|
||||
value that will be on the heap rather than inside the `Cons` variant.
|
||||
Conceptually, we still have a list, created with lists “holding” other lists,
|
||||
but this implementation is now more like placing the items next to one another
|
||||
rather than inside one another.
|
||||
|
||||
We can change the definition of the `List` enum in Listing 15-2 and the usage
|
||||
of the `List` in Listing 15-3 to the code in Listing 15-5, which will compile:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
enum List {
|
||||
Cons(i32, Box<List>),
|
||||
Nil,
|
||||
}
|
||||
|
||||
use List::{Cons, Nil};
|
||||
|
||||
fn main() {
|
||||
let list = Cons(1,
|
||||
Box::new(Cons(2,
|
||||
Box::new(Cons(3,
|
||||
Box::new(Nil))))));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-5: Definition of `List` that uses `Box<T>` in
|
||||
order to have a known size</span>
|
||||
|
||||
The `Cons` variant will need the size of an `i32` plus the space to store the
|
||||
box’s pointer data. The `Nil` variant stores no values, so it needs less space
|
||||
than the `Cons` variant. We now know that any `List` value will take up the
|
||||
size of an `i32` plus the size of a box’s pointer data. By using a box, we’ve
|
||||
broken the infinite, recursive chain, so the compiler can figure out the size
|
||||
it needs to store a `List` value. Figure 15-2 shows what the `Cons` variant
|
||||
looks like now.
|
||||
|
||||
<img alt="A finite Cons list" src="img/trpl15-02.svg" class="center" />
|
||||
|
||||
<span class="caption">Figure 15-2: A `List` that is not infinitely sized
|
||||
because `Cons` holds a `Box`</span>
|
||||
|
||||
Boxes provide only the indirection and heap allocation; they don’t have any
|
||||
other special capabilities, like those we’ll see with the other smart pointer
|
||||
types. They also don’t have any performance overhead that these special
|
||||
capabilities incur, so they can be useful in cases like the cons list where the
|
||||
indirection is the only feature we need. We’ll look at more use cases for boxes
|
||||
in Chapter 17, too.
|
||||
|
||||
The `Box<T>` type is a smart pointer because it implements the `Deref` trait,
|
||||
which allows `Box<T>` values to be treated like references. When a `Box<T>`
|
||||
value goes out of scope, the heap data that the box is pointing to is cleaned
|
||||
up as well because of the `Drop` trait implementation. Let’s explore these two
|
||||
traits in more detail. These two traits will be even more important to the
|
||||
functionality provided by the other smart pointer types we’ll discuss in the
|
||||
rest of this chapter.
|
||||
377
2018-edition/src/ch15-02-deref.md
Normal file
377
2018-edition/src/ch15-02-deref.md
Normal file
@@ -0,0 +1,377 @@
|
||||
## Treating Smart Pointers Like Regular References with the `Deref` Trait
|
||||
|
||||
Implementing the `Deref` trait allows you to customize the behavior of the
|
||||
*dereference operator*, `*` (as opposed to the multiplication or glob
|
||||
operator). By implementing `Deref` in such a way that a smart pointer can be
|
||||
treated like a regular reference, you can write code that operates on
|
||||
references and use that code with smart pointers too.
|
||||
|
||||
Let’s first look at how the dereference operator works with regular references.
|
||||
Then we’ll try to define a custom type that behaves like `Box<T>`, and see why
|
||||
the dereference operator doesn’t work like a reference on our newly defined
|
||||
type. We’ll explore how implementing the `Deref` trait makes it possible for
|
||||
smart pointers to work in a similar way as references. Then we’ll look at
|
||||
Rust’s *deref coercion* feature and how it lets us work with either references
|
||||
or smart pointers.
|
||||
|
||||
### Following the Pointer to the Value with the Dereference Operator
|
||||
|
||||
A regular reference is a type of pointer, and one way to think of a pointer is
|
||||
as an arrow to a value stored somewhere else. In Listing 15-6, we create a
|
||||
reference to an `i32` value and then use the dereference operator to follow the
|
||||
reference to the data:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let x = 5;
|
||||
let y = &x;
|
||||
|
||||
assert_eq!(5, x);
|
||||
assert_eq!(5, *y);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-6: Using the dereference operator to follow a
|
||||
reference to an `i32` value</span>
|
||||
|
||||
The variable `x` holds an `i32` value, `5`. We set `y` equal to a reference to
|
||||
`x`. We can assert that `x` is equal to `5`. However, if we want to make an
|
||||
assertion about the value in `y`, we have to use `*y` to follow the reference
|
||||
to the value it’s pointing to (hence *dereference*). Once we dereference `y`,
|
||||
we have access to the integer value `y` is pointing to that we can compare with
|
||||
`5`.
|
||||
|
||||
If we tried to write `assert_eq!(5, y);` instead, we would get this compilation
|
||||
error:
|
||||
|
||||
```text
|
||||
error[E0277]: the trait bound `{integer}: std::cmp::PartialEq<&{integer}>` is
|
||||
not satisfied
|
||||
--> src/main.rs:6:5
|
||||
|
|
||||
6 | assert_eq!(5, y);
|
||||
| ^^^^^^^^^^^^^^^^^ can't compare `{integer}` with `&{integer}`
|
||||
|
|
||||
= help: the trait `std::cmp::PartialEq<&{integer}>` is not implemented for
|
||||
`{integer}`
|
||||
```
|
||||
|
||||
Comparing a number and a reference to a number isn’t allowed because they’re
|
||||
different types. We must use the dereference operator to follow the reference
|
||||
to the value it’s pointing to.
|
||||
|
||||
### Using `Box<T>` Like a Reference
|
||||
|
||||
We can rewrite the code in Listing 15-6 to use a `Box<T>` instead of a
|
||||
reference; the dereference operator will work as shown in Listing 15-7:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn main() {
|
||||
let x = 5;
|
||||
let y = Box::new(x);
|
||||
|
||||
assert_eq!(5, x);
|
||||
assert_eq!(5, *y);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-7: Using the dereference operator on a
|
||||
`Box<i32>`</span>
|
||||
|
||||
The only difference between Listing 15-7 and Listing 15-6 is that here we set
|
||||
`y` to be an instance of a box pointing to the value in `x` rather than a
|
||||
reference pointing to the value of `x`. In the last assertion, we can use the
|
||||
dereference operator to follow the box’s pointer in the same way that we did
|
||||
when `y` was a reference. Next, we’ll explore what is special about `Box<T>`
|
||||
that enables us to use the dereference operator by defining our own box type.
|
||||
|
||||
### Defining Our Own Smart Pointer
|
||||
|
||||
Let’s build a smart pointer similar to the `Box<T>` type provided by the
|
||||
standard library to experience how smart pointers behave differently than
|
||||
references by default. Then we’ll look at how to add the ability to use the
|
||||
dereference operator.
|
||||
|
||||
The `Box<T>` type is ultimately defined as a tuple struct with one element, so
|
||||
Listing 15-8 defines a `MyBox<T>` type in the same way. We’ll also define a
|
||||
`new` function to match the `new` function defined on `Box<T>`.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct MyBox<T>(T);
|
||||
|
||||
impl<T> MyBox<T> {
|
||||
fn new(x: T) -> MyBox<T> {
|
||||
MyBox(x)
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-8: Defining a `MyBox<T>` type</span>
|
||||
|
||||
We define a struct named `MyBox` and declare a generic parameter `T`, because
|
||||
we want our type to hold values of any type. The `MyBox` type is a tuple struct
|
||||
with one element of type `T`. The `MyBox::new` function takes one parameter of
|
||||
type `T` and returns a `MyBox` instance that holds the value passed in.
|
||||
|
||||
Let’s try adding the `main` function in Listing 15-7 to Listing 15-8 and
|
||||
changing it to use the `MyBox<T>` type we’ve defined instead of `Box<T>`. The
|
||||
code in Listing 15-9 won’t compile because Rust doesn’t know how to dereference
|
||||
`MyBox`.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let x = 5;
|
||||
let y = MyBox::new(x);
|
||||
|
||||
assert_eq!(5, x);
|
||||
assert_eq!(5, *y);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-9: Attempting to use `MyBox<T>` in the same
|
||||
way we used references and `Box<T>`</span>
|
||||
|
||||
Here’s the resulting compilation error:
|
||||
|
||||
```text
|
||||
error[E0614]: type `MyBox<{integer}>` cannot be dereferenced
|
||||
--> src/main.rs:14:19
|
||||
|
|
||||
14 | assert_eq!(5, *y);
|
||||
| ^^
|
||||
```
|
||||
|
||||
Our `MyBox<T>` type can’t be dereferenced because we haven’t implemented that
|
||||
ability on our type. To enable dereferencing with the `*` operator, we
|
||||
implement the `Deref` trait.
|
||||
|
||||
### Treating a Type Like a Reference by Implementing the `Deref` Trait
|
||||
|
||||
As discussed in Chapter 10, to implement a trait, we need to provide
|
||||
implementations for the trait’s required methods. The `Deref` trait, provided
|
||||
by the standard library, requires us to implement one method named `deref` that
|
||||
borrows `self` and returns a reference to the inner data. Listing 15-10
|
||||
contains an implementation of `Deref` to add to the definition of `MyBox`:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::ops::Deref;
|
||||
|
||||
# struct MyBox<T>(T);
|
||||
impl<T> Deref for MyBox<T> {
|
||||
type Target = T;
|
||||
|
||||
fn deref(&self) -> &T {
|
||||
&self.0
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-10: Implementing `Deref` on `MyBox<T>`</span>
|
||||
|
||||
The `type Target = T;` syntax defines an associated type for the `Deref` trait
|
||||
to use. Associated types are a slightly different way of declaring a generic
|
||||
parameter, but you don’t need to worry about them for now; we’ll cover them in
|
||||
more detail in Chapter 19.
|
||||
|
||||
We fill in the body of the `deref` method with `&self.0` so `deref` returns a
|
||||
reference to the value we want to access with the `*` operator. The `main`
|
||||
function in Listing 15-9 that calls `*` on the `MyBox<T>` value now compiles,
|
||||
and the assertions pass!
|
||||
|
||||
Without the `Deref` trait, the compiler can only dereference `&` references.
|
||||
The `deref` method gives the compiler the ability to take a value of any type
|
||||
that implements `Deref` and call the `deref` method to get a `&` reference that
|
||||
it knows how to dereference.
|
||||
|
||||
When we entered `*y` in Listing 15-9, behind the scenes Rust actually ran this
|
||||
code:
|
||||
|
||||
```rust,ignore
|
||||
*(y.deref())
|
||||
```
|
||||
|
||||
Rust substitutes the `*` operator with a call to the `deref` method and then a
|
||||
plain dereference so we don’t have to think about whether or not we need to
|
||||
call the `deref` method. This Rust feature lets us write code that functions
|
||||
identically whether we have a regular reference or a type that implements
|
||||
`Deref`.
|
||||
|
||||
The reason the `deref` method returns a reference to a value and that the plain
|
||||
dereference outside the parentheses in `*(y.deref())` is still necessary is the
|
||||
ownership system. If the `deref` method returned the value directly instead of
|
||||
a reference to the value, the value would be moved out of `self`. We don’t want
|
||||
to take ownership of the inner value inside `MyBox<T>` in this case or in most
|
||||
cases where we use the dereference operator.
|
||||
|
||||
Note that the `*` operator is replaced with a call to the `deref` method and
|
||||
then a call to the `*` operator just once, each time we use a `*` in our code.
|
||||
Because the substitution of the `*` operator does not recurse infinitely, we
|
||||
end up with data of type `i32`, which matches the `5` in `assert_eq!` in
|
||||
Listing 15-9.
|
||||
|
||||
### Implicit Deref Coercions with Functions and Methods
|
||||
|
||||
*Deref coercion* is a convenience that Rust performs on arguments to functions
|
||||
and methods. Deref coercion converts a reference to a type that implements
|
||||
`Deref` into a reference to a type that `Deref` can convert the original type
|
||||
into. Deref coercion happens automatically when we pass a reference to a
|
||||
particular type’s value as an argument to a function or method that doesn’t
|
||||
match the parameter type in the function or method definition. A sequence of
|
||||
calls to the `deref` method converts the type we provided into the type the
|
||||
parameter needs.
|
||||
|
||||
Deref coercion was added to Rust so that programmers writing function and
|
||||
method calls don’t need to add as many explicit references and dereferences
|
||||
with `&` and `*`. The deref coercion feature also lets us write more code that
|
||||
can work for either references or smart pointers.
|
||||
|
||||
To see deref coercion in action, let’s use the `MyBox<T>` type we defined in
|
||||
Listing 15-8 as well as the implementation of `Deref` that we added in Listing
|
||||
15-10. Listing 15-11 shows the definition of a function that has a string slice
|
||||
parameter:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
fn hello(name: &str) {
|
||||
println!("Hello, {}!", name);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-11: A `hello` function that has the parameter
|
||||
`name` of type `&str`</span>
|
||||
|
||||
We can call the `hello` function with a string slice as an argument, such as
|
||||
`hello("Rust");` for example. Deref coercion makes it possible to call `hello`
|
||||
with a reference to a value of type `MyBox<String>`, as shown in Listing 15-12:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::ops::Deref;
|
||||
#
|
||||
# struct MyBox<T>(T);
|
||||
#
|
||||
# impl<T> MyBox<T> {
|
||||
# fn new(x: T) -> MyBox<T> {
|
||||
# MyBox(x)
|
||||
# }
|
||||
# }
|
||||
#
|
||||
# impl<T> Deref for MyBox<T> {
|
||||
# type Target = T;
|
||||
#
|
||||
# fn deref(&self) -> &T {
|
||||
# &self.0
|
||||
# }
|
||||
# }
|
||||
#
|
||||
# fn hello(name: &str) {
|
||||
# println!("Hello, {}!", name);
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let m = MyBox::new(String::from("Rust"));
|
||||
hello(&m);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-12: Calling `hello` with a reference to a
|
||||
`MyBox<String>` value, which works because of deref coercion</span>
|
||||
|
||||
Here we’re calling the `hello` function with the argument `&m`, which is a
|
||||
reference to a `MyBox<String>` value. Because we implemented the `Deref` trait
|
||||
on `MyBox<T>` in Listing 15-10, Rust can turn `&MyBox<String>` into `&String`
|
||||
by calling `deref`. The standard library provides an implementation of `Deref`
|
||||
on `String` that returns a string slice, and this is in the API documentation
|
||||
for `Deref`. Rust calls `deref` again to turn the `&String` into `&str`, which
|
||||
matches the `hello` function’s definition.
|
||||
|
||||
If Rust didn’t implement deref coercion, we would have to write the code in
|
||||
Listing 15-13 instead of the code in Listing 15-12 to call `hello` with a value
|
||||
of type `&MyBox<String>`.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::ops::Deref;
|
||||
#
|
||||
# struct MyBox<T>(T);
|
||||
#
|
||||
# impl<T> MyBox<T> {
|
||||
# fn new(x: T) -> MyBox<T> {
|
||||
# MyBox(x)
|
||||
# }
|
||||
# }
|
||||
#
|
||||
# impl<T> Deref for MyBox<T> {
|
||||
# type Target = T;
|
||||
#
|
||||
# fn deref(&self) -> &T {
|
||||
# &self.0
|
||||
# }
|
||||
# }
|
||||
#
|
||||
# fn hello(name: &str) {
|
||||
# println!("Hello, {}!", name);
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let m = MyBox::new(String::from("Rust"));
|
||||
hello(&(*m)[..]);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-13: The code we would have to write if Rust
|
||||
didn’t have deref coercion</span>
|
||||
|
||||
The `(*m)` dereferences the `MyBox<String>` into a `String`. Then the `&` and
|
||||
`[..]` take a string slice of the `String` that is equal to the whole string to
|
||||
match the signature of `hello`. The code without deref coercions is harder to
|
||||
read, write, and understand with all of these symbols involved. Deref coercion
|
||||
allows Rust to handle these conversions for us automatically.
|
||||
|
||||
When the `Deref` trait is defined for the types involved, Rust will analyze the
|
||||
types and use `Deref::deref` as many times as necessary to get a reference to
|
||||
match the parameter’s type. The number of times that `Deref::deref` needs to be
|
||||
inserted is resolved at compile time, so there is no runtime penalty for taking
|
||||
advantage of deref coercion!
|
||||
|
||||
### How Deref Coercion Interacts with Mutability
|
||||
|
||||
Similar to how you use the `Deref` trait to override the `*` operator on
|
||||
immutable references, you can use the `DerefMut` trait to override the `*`
|
||||
operator on mutable references.
|
||||
|
||||
Rust does deref coercion when it finds types and trait implementations in three
|
||||
cases:
|
||||
|
||||
* From `&T` to `&U` when `T: Deref<Target=U>`
|
||||
* From `&mut T` to `&mut U` when `T: DerefMut<Target=U>`
|
||||
* From `&mut T` to `&U` when `T: Deref<Target=U>`
|
||||
|
||||
The first two cases are the same except for mutability. The first case states
|
||||
that if you have a `&T`, and `T` implements `Deref` to some type `U`, you can
|
||||
get a `&U` transparently. The second case states that the same deref coercion
|
||||
happens for mutable references.
|
||||
|
||||
The third case is trickier: Rust will also coerce a mutable reference to an
|
||||
immutable one. But the reverse is *not* possible: immutable references will
|
||||
never coerce to mutable references. Because of the borrowing rules, if you have
|
||||
a mutable reference, that mutable reference must be the only reference to that
|
||||
data (otherwise, the program wouldn’t compile). Converting one mutable
|
||||
reference to one immutable reference will never break the borrowing rules.
|
||||
Converting an immutable reference to a mutable reference would require that
|
||||
there is only one immutable reference to that data, and the borrowing rules
|
||||
don’t guarantee that. Therefore, Rust can’t make the assumption that converting
|
||||
an immutable reference to a mutable reference is possible.
|
||||
189
2018-edition/src/ch15-03-drop.md
Normal file
189
2018-edition/src/ch15-03-drop.md
Normal file
@@ -0,0 +1,189 @@
|
||||
## Running Code on Cleanup with the `Drop` Trait
|
||||
|
||||
The second trait important to the smart pointer pattern is `Drop`, which lets
|
||||
you customize what happens when a value is about to go out of scope. You can
|
||||
provide an implementation for the `Drop` trait on any type, and the code you
|
||||
specify can be used to release resources like files or network connections.
|
||||
We’re introducing `Drop` in the context of smart pointers because the
|
||||
functionality of the `Drop` trait is almost always used when implementing a
|
||||
smart pointer. For example, `Box<T>` customizes `Drop` to deallocate the space
|
||||
on the heap that the box points to.
|
||||
|
||||
In some languages, the programmer must call code to free memory or resources
|
||||
every time they finish using an instance of a smart pointer. If they forget,
|
||||
the system might become overloaded and crash. In Rust, you can specify that a
|
||||
particular bit of code be run whenever a value goes out of scope, and the
|
||||
compiler will insert this code automatically. As a result, you don’t need to be
|
||||
careful about placing cleanup code everywhere in a program that an instance of
|
||||
a particular type is finished with—you still won’t leak resources!
|
||||
|
||||
Specify the code to run when a value goes out of scope by implementing the
|
||||
`Drop` trait. The `Drop` trait requires you to implement one method named
|
||||
`drop` that takes a mutable reference to `self`. To see when Rust calls `drop`,
|
||||
let’s implement `drop` with `println!` statements for now.
|
||||
|
||||
Listing 15-14 shows a `CustomSmartPointer` struct whose only custom
|
||||
functionality is that it will print `Dropping CustomSmartPointer!` when the
|
||||
instance goes out of scope. This example demonstrates when Rust runs the `drop`
|
||||
function.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
struct CustomSmartPointer {
|
||||
data: String,
|
||||
}
|
||||
|
||||
impl Drop for CustomSmartPointer {
|
||||
fn drop(&mut self) {
|
||||
println!("Dropping CustomSmartPointer with data `{}`!", self.data);
|
||||
}
|
||||
}
|
||||
|
||||
fn main() {
|
||||
let c = CustomSmartPointer { data: String::from("my stuff") };
|
||||
let d = CustomSmartPointer { data: String::from("other stuff") };
|
||||
println!("CustomSmartPointers created.");
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-14: A `CustomSmartPointer` struct that
|
||||
implements the `Drop` trait where we would put our cleanup code</span>
|
||||
|
||||
The `Drop` trait is included in the prelude, so we don’t need to import it. We
|
||||
implement the `Drop` trait on `CustomSmartPointer` and provide an
|
||||
implementation for the `drop` method that calls `println!`. The body of the
|
||||
`drop` function is where you would place any logic that you wanted to run when
|
||||
an instance of your type goes out of scope. We’re printing some text here to
|
||||
demonstrate when Rust will call `drop`.
|
||||
|
||||
In `main`, we create two instances of `CustomSmartPointer` and then print
|
||||
`CustomSmartPointers created.`. At the end of `main`, our instances of
|
||||
`CustomSmartPointer` will go out of scope, and Rust will call the code we put
|
||||
in the `drop` method, printing our final message. Note that we didn’t need to
|
||||
call the `drop` method explicitly.
|
||||
|
||||
When we run this program, we’ll see the following output:
|
||||
|
||||
```text
|
||||
CustomSmartPointers created.
|
||||
Dropping CustomSmartPointer with data `other stuff`!
|
||||
Dropping CustomSmartPointer with data `my stuff`!
|
||||
```
|
||||
|
||||
Rust automatically called `drop` for us when our instances went out of scope,
|
||||
calling the code we specified. Variables are dropped in the reverse order of
|
||||
their creation, so `d` was dropped before `c`. This example gives you a visual
|
||||
guide to how the `drop` method works; usually you would specify the cleanup
|
||||
code that your type needs to run rather than a print message.
|
||||
|
||||
### Dropping a Value Early with `std::mem::drop`
|
||||
|
||||
Unfortunately, it’s not straightforward to disable the automatic `drop`
|
||||
functionality. Disabling `drop` isn’t usually necessary; the whole point of the
|
||||
`Drop` trait is that it’s taken care of automatically. Occasionally, however,
|
||||
you might want to clean up a value early. One example is when using smart
|
||||
pointers that manage locks: you might want to force the `drop` method that
|
||||
releases the lock to run so other code in the same scope can acquire the lock.
|
||||
Rust doesn’t let you call the `Drop` trait’s `drop` method manually; instead
|
||||
you have to call the `std::mem::drop` function provided by the standard library
|
||||
if you want to force a value to be dropped before the end of its scope.
|
||||
|
||||
If we try to call the `Drop` trait’s `drop` method manually by modifying the
|
||||
`main` function from Listing 15-14, as shown in Listing 15-15, we’ll get a
|
||||
compiler error:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let c = CustomSmartPointer { data: String::from("some data") };
|
||||
println!("CustomSmartPointer created.");
|
||||
c.drop();
|
||||
println!("CustomSmartPointer dropped before the end of main.");
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-15: Attempting to call the `drop` method from
|
||||
the `Drop` trait manually to clean up early</span>
|
||||
|
||||
When we try to compile this code, we’ll get this error:
|
||||
|
||||
```text
|
||||
error[E0040]: explicit use of destructor method
|
||||
--> src/main.rs:14:7
|
||||
|
|
||||
14 | c.drop();
|
||||
| ^^^^ explicit destructor calls not allowed
|
||||
```
|
||||
|
||||
This error message states that we’re not allowed to explicitly call `drop`. The
|
||||
error message uses the term *destructor*, which is the general programming term
|
||||
for a function that cleans up an instance. A *destructor* is analogous to a
|
||||
*constructor*, which creates an instance. The `drop` function in Rust is one
|
||||
particular destructor.
|
||||
|
||||
Rust doesn’t let us call `drop` explicitly because Rust would still
|
||||
automatically call `drop` on the value at the end of `main`. This would be a
|
||||
*double free* error because Rust would be trying to clean up the same value
|
||||
twice.
|
||||
|
||||
We can’t disable the automatic insertion of `drop` when a value goes out of
|
||||
scope, and we can’t call the `drop` method explicitly. So, if we need to force
|
||||
a value to be cleaned up early, we can use the `std::mem::drop` function.
|
||||
|
||||
The `std::mem::drop` function is different than the `drop` method in the `Drop`
|
||||
trait. We call it by passing the value we want to force to be dropped early as
|
||||
an argument. The function is in the prelude, so we can modify `main` in Listing
|
||||
15-15 to call the `drop` function, as shown in Listing 15-16:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# struct CustomSmartPointer {
|
||||
# data: String,
|
||||
# }
|
||||
#
|
||||
# impl Drop for CustomSmartPointer {
|
||||
# fn drop(&mut self) {
|
||||
# println!("Dropping CustomSmartPointer!");
|
||||
# }
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let c = CustomSmartPointer { data: String::from("some data") };
|
||||
println!("CustomSmartPointer created.");
|
||||
drop(c);
|
||||
println!("CustomSmartPointer dropped before the end of main.");
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-16: Calling `std::mem::drop` to explicitly
|
||||
drop a value before it goes out of scope</span>
|
||||
|
||||
Running this code will print the following:
|
||||
|
||||
```text
|
||||
CustomSmartPointer created.
|
||||
Dropping CustomSmartPointer with data `some data`!
|
||||
CustomSmartPointer dropped before the end of main.
|
||||
```
|
||||
|
||||
The text ```Dropping CustomSmartPointer with data `some data`!``` is printed
|
||||
between the `CustomSmartPointer created.` and `CustomSmartPointer dropped
|
||||
before the end of main.` text, showing that the `drop` method code is called to
|
||||
drop `c` at that point.
|
||||
|
||||
You can use code specified in a `Drop` trait implementation in many ways to
|
||||
make cleanup convenient and safe: for instance, you could use it to create your
|
||||
own memory allocator! With the `Drop` trait and Rust’s ownership system, you
|
||||
don’t have to remember to clean up because Rust does it automatically.
|
||||
|
||||
You also don’t have to worry about problems resulting from accidentally
|
||||
cleaning up values still in use: the ownership system that makes sure
|
||||
references are always valid also ensures that `drop` gets called only once when
|
||||
the value is no longer being used.
|
||||
|
||||
Now that we’ve examined `Box<T>` and some of the characteristics of smart
|
||||
pointers, let’s look at a few other smart pointers defined in the standard
|
||||
library.
|
||||
217
2018-edition/src/ch15-04-rc.md
Normal file
217
2018-edition/src/ch15-04-rc.md
Normal file
@@ -0,0 +1,217 @@
|
||||
## `Rc<T>`, the Reference Counted Smart Pointer
|
||||
|
||||
In the majority of cases, ownership is clear: you know exactly which variable
|
||||
owns a given value. However, there are cases when a single value might have
|
||||
multiple owners. For example, in graph data structures, multiple edges might
|
||||
point to the same node, and that node is conceptually owned by all of the edges
|
||||
that point to it. A node shouldn’t be cleaned up unless it doesn’t have any
|
||||
edges pointing to it.
|
||||
|
||||
To enable multiple ownership, Rust has a type called `Rc<T>`, which is an
|
||||
abbreviation for *reference counting*. The `Rc<T>` type keeps track of the
|
||||
number of references to a value which determines whether or not a value is
|
||||
still in use. If there are zero references to a value, the value can be cleaned
|
||||
up without any references becoming invalid.
|
||||
|
||||
Imagine `Rc<T>` as a TV in a family room. When one person enters to watch TV,
|
||||
they turn it on. Others can come into the room and watch the TV. When the last
|
||||
person leaves the room, they turn off the TV because it’s no longer being used.
|
||||
If someone turns off the TV while others are still watching it, there would be
|
||||
uproar from the remaining TV watchers!
|
||||
|
||||
We use the `Rc<T>` type when we want to allocate some data on the heap for
|
||||
multiple parts of our program to read and we can’t determine at compile time
|
||||
which part will finish using the data last. If we knew which part would finish
|
||||
last, we could just make that part the data’s owner, and the normal ownership
|
||||
rules enforced at compile time would take effect.
|
||||
|
||||
Note that `Rc<T>` is only for use in single-threaded scenarios. When we discuss
|
||||
concurrency in Chapter 16, we’ll cover how to do reference counting in
|
||||
multithreaded programs.
|
||||
|
||||
### Using `Rc<T>` to Share Data
|
||||
|
||||
Let’s return to our cons list example in Listing 15-5. Recall that we defined
|
||||
it using `Box<T>`. This time, we’ll create two lists that both share ownership
|
||||
of a third list. Conceptually, this looks similar to Figure 15-3:
|
||||
|
||||
<img alt="Two lists that share ownership of a third list" src="img/trpl15-03.svg" class="center" />
|
||||
|
||||
<span class="caption">Figure 15-3: Two lists, `b` and `c`, sharing ownership of
|
||||
a third list, `a`</span>
|
||||
|
||||
We’ll create list `a` that contains 5 and then 10. Then we’ll make two more
|
||||
lists: `b` that starts with 3 and `c` that starts with 4. Both `b` and `c`
|
||||
lists will then continue on to the first `a` list containing 5 and 10. In other
|
||||
words, both lists will share the first list containing 5 and 10.
|
||||
|
||||
Trying to implement this scenario using our definition of `List` with `Box<T>`
|
||||
won’t work, as shown in Listing 15-17:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
enum List {
|
||||
Cons(i32, Box<List>),
|
||||
Nil,
|
||||
}
|
||||
|
||||
use List::{Cons, Nil};
|
||||
|
||||
fn main() {
|
||||
let a = Cons(5,
|
||||
Box::new(Cons(10,
|
||||
Box::new(Nil))));
|
||||
let b = Cons(3, Box::new(a));
|
||||
let c = Cons(4, Box::new(a));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-17: Demonstrating we’re not allowed to have
|
||||
two lists using `Box<T>` that try to share ownership of a third list</span>
|
||||
|
||||
When we compile this code, we get this error:
|
||||
|
||||
```text
|
||||
error[E0382]: use of moved value: `a`
|
||||
--> src/main.rs:13:30
|
||||
|
|
||||
12 | let b = Cons(3, Box::new(a));
|
||||
| - value moved here
|
||||
13 | let c = Cons(4, Box::new(a));
|
||||
| ^ value used here after move
|
||||
|
|
||||
= note: move occurs because `a` has type `List`, which does not implement
|
||||
the `Copy` trait
|
||||
```
|
||||
|
||||
The `Cons` variants own the data they hold, so when we create the `b` list, `a`
|
||||
is moved into `b` and `b` owns `a`. Then, when we try to use `a` again when
|
||||
creating `c`, we’re not allowed to because `a` has been moved.
|
||||
|
||||
We could change the definition of `Cons` to hold references instead, but then
|
||||
we would have to specify lifetime parameters. By specifying lifetime
|
||||
parameters, we would be specifying that every element in the list will live at
|
||||
least as long as the entire list. The borrow checker wouldn’t let us compile
|
||||
`let a = Cons(10, &Nil);` for example, because the temporary `Nil` value would
|
||||
be dropped before `a` could take a reference to it.
|
||||
|
||||
Instead, we’ll change our definition of `List` to use `Rc<T>` in place of
|
||||
`Box<T>`, as shown in Listing 15-18. Each `Cons` variant will now hold a value
|
||||
and an `Rc<T>` pointing to a `List`. When we create `b`, instead of taking
|
||||
ownership of `a`, we’ll clone the `Rc<List>` that `a` is holding, thereby
|
||||
increasing the number of references from one to two and letting `a` and `b`
|
||||
share ownership of the data in that `Rc<List>`. We’ll also clone `a` when
|
||||
creating `c`, increasing the number of references from two to three. Every time
|
||||
we call `Rc::clone`, the reference count to the data within the `Rc<List>` will
|
||||
increase, and the data won’t be cleaned up unless there are zero references to
|
||||
it.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
enum List {
|
||||
Cons(i32, Rc<List>),
|
||||
Nil,
|
||||
}
|
||||
|
||||
use List::{Cons, Nil};
|
||||
use std::rc::Rc;
|
||||
|
||||
fn main() {
|
||||
let a = Rc::new(Cons(5, Rc::new(Cons(10, Rc::new(Nil)))));
|
||||
let b = Cons(3, Rc::clone(&a));
|
||||
let c = Cons(4, Rc::clone(&a));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-18: A definition of `List` that uses
|
||||
`Rc<T>`</span>
|
||||
|
||||
We need to add a `use` statement to bring `Rc<T>` into scope because it’s not
|
||||
in the prelude. In `main`, we create the list holding 5 and 10 and store it in
|
||||
a new `Rc<List>` in `a`. Then when we create `b` and `c`, we call the
|
||||
`Rc::clone` function and pass a reference to the `Rc<List>` in `a` as an
|
||||
argument.
|
||||
|
||||
We could have called `a.clone()` rather than `Rc::clone(&a)`, but Rust’s
|
||||
convention is to use `Rc::clone` in this case. The implementation of
|
||||
`Rc::clone` doesn’t make a deep copy of all the data like most types’
|
||||
implementations of `clone` do. The call to `Rc::clone` only increments the
|
||||
reference count, which doesn’t take much time. Deep copies of data can take a
|
||||
lot of time. By using `Rc::clone` for reference counting, we can visually
|
||||
distinguish between the deep-copy kinds of clones and the kinds of clones that
|
||||
increase the reference count. When looking for performance problems in the
|
||||
code, we only need to consider the deep-copy clones and can disregard calls to
|
||||
`Rc::clone`.
|
||||
|
||||
### Cloning an `Rc<T>` Increases the Reference Count
|
||||
|
||||
Let’s change our working example in Listing 15-18 so we can see the reference
|
||||
counts changing as we create and drop references to the `Rc<List>` in `a`.
|
||||
|
||||
In Listing 15-19, we’ll change `main` so it has an inner scope around list `c`;
|
||||
then we can see how the reference count changes when `c` goes out of scope.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# enum List {
|
||||
# Cons(i32, Rc<List>),
|
||||
# Nil,
|
||||
# }
|
||||
#
|
||||
# use List::{Cons, Nil};
|
||||
# use std::rc::Rc;
|
||||
#
|
||||
fn main() {
|
||||
let a = Rc::new(Cons(5, Rc::new(Cons(10, Rc::new(Nil)))));
|
||||
println!("count after creating a = {}", Rc::strong_count(&a));
|
||||
let b = Cons(3, Rc::clone(&a));
|
||||
println!("count after creating b = {}", Rc::strong_count(&a));
|
||||
{
|
||||
let c = Cons(4, Rc::clone(&a));
|
||||
println!("count after creating c = {}", Rc::strong_count(&a));
|
||||
}
|
||||
println!("count after c goes out of scope = {}", Rc::strong_count(&a));
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-19: Printing the reference count</span>
|
||||
|
||||
At each point in the program where the reference count changes, we print the
|
||||
reference count, which we can get by calling the `Rc::strong_count` function.
|
||||
This function is named `strong_count` rather than `count` because the `Rc<T>`
|
||||
type also has a `weak_count`; we’ll see what `weak_count` is used for in the
|
||||
“Preventing Reference Cycles” section.
|
||||
|
||||
This code prints the following:
|
||||
|
||||
```text
|
||||
count after creating a = 1
|
||||
count after creating b = 2
|
||||
count after creating c = 3
|
||||
count after c goes out of scope = 2
|
||||
```
|
||||
|
||||
We can see that the `Rc<List>` in `a` has an initial reference count of 1; then
|
||||
each time we call `clone`, the count goes up by 1. When `c` goes out of scope,
|
||||
the count goes down by 1. We don’t have to call a function to decrease the
|
||||
reference count like we have to call `Rc::clone` to increase the reference
|
||||
count: the implementation of the `Drop` trait decreases the reference count
|
||||
automatically when an `Rc<T>` value goes out of scope.
|
||||
|
||||
What we can’t see in this example is that when `b` and then `a` go out of scope
|
||||
at the end of `main`, the count is then 0, and the `Rc<List>` is cleaned up
|
||||
completely at that point. Using `Rc<T>` allows a single value to have
|
||||
multiple owners, and the count ensures that the value remains valid as long as
|
||||
any of the owners still exist.
|
||||
|
||||
Via immutable references, `Rc<T>` allows you to share data between multiple
|
||||
parts of your program for reading only. If `Rc<T>` allowed you to have multiple
|
||||
mutable references too, you might violate one of the borrowing rules discussed
|
||||
in Chapter 4: multiple mutable borrows to the same place can cause data races
|
||||
and inconsistencies. But being able to mutate data is very useful! In the next
|
||||
section, we’ll discuss the interior mutability pattern and the `RefCell<T>`
|
||||
type that you can use in conjunction with an `Rc<T>` to work with this
|
||||
immutability restriction.
|
||||
483
2018-edition/src/ch15-05-interior-mutability.md
Normal file
483
2018-edition/src/ch15-05-interior-mutability.md
Normal file
@@ -0,0 +1,483 @@
|
||||
## `RefCell<T>` and the Interior Mutability Pattern
|
||||
|
||||
<!-- NEXT PARAGRAPH WRAPPED WEIRD INTENTIONALLY SEE #199 -->
|
||||
|
||||
*Interior mutability* is a design pattern in Rust that allows you to mutate
|
||||
data even when there are immutable references to that data; normally, this
|
||||
action is disallowed by the borrowing rules. To mutate data, the pattern uses
|
||||
`unsafe` code inside a data structure to bend Rust’s usual rules that govern
|
||||
mutation and borrowing. We haven’t yet covered unsafe code; we will in
|
||||
Chapter 19. We can use types that use the interior mutability pattern when we
|
||||
can ensure that the borrowing rules will be followed at runtime, even though
|
||||
the compiler can’t guarantee that. The `unsafe` code involved is then wrapped
|
||||
in a safe API, and the outer type is still immutable.
|
||||
|
||||
Let’s explore this concept by looking at the `RefCell<T>` type that follows the
|
||||
interior mutability pattern.
|
||||
|
||||
### Enforcing Borrowing Rules at Runtime with `RefCell<T>`
|
||||
|
||||
Unlike `Rc<T>`, the `RefCell<T>` type represents single ownership over the data
|
||||
it holds. So, what makes `RefCell<T>` different from a type like `Box<T>`?
|
||||
Recall the borrowing rules you learned in Chapter 4:
|
||||
|
||||
* At any given time, you can have *either* (but not both of) one mutable
|
||||
reference or any number of immutable references.
|
||||
* References must always be valid.
|
||||
|
||||
With references and `Box<T>`, the borrowing rules’ invariants are enforced at
|
||||
compile time. With `RefCell<T>`, these invariants are enforced *at runtime*.
|
||||
With references, if you break these rules, you’ll get a compiler error. With
|
||||
`RefCell<T>`, if you break these rules, your program will panic and exit.
|
||||
|
||||
The advantages of checking the borrowing rules at compile time are that errors
|
||||
will be caught sooner in the development process, and there is no impact on
|
||||
runtime performance because all the analysis is completed beforehand. For those
|
||||
reasons, checking the borrowing rules at compile time is the best choice in the
|
||||
majority of cases, which is why this is Rust’s default.
|
||||
|
||||
The advantage of checking the borrowing rules at runtime instead is that
|
||||
certain memory-safe scenarios are then allowed, whereas they are disallowed by
|
||||
the compile-time checks. Static analysis, like the Rust compiler, is inherently
|
||||
conservative. Some properties of code are impossible to detect by analyzing the
|
||||
code: the most famous example is the Halting Problem, which is beyond the scope
|
||||
of this book but is an interesting topic to research.
|
||||
|
||||
Because some analysis is impossible, if the Rust compiler can’t be sure the
|
||||
code complies with the ownership rules, it might reject a correct program; in
|
||||
this way, it’s conservative. If Rust accepted an incorrect program, users
|
||||
wouldn’t be able to trust in the guarantees Rust makes. However, if Rust
|
||||
rejects a correct program, the programmer will be inconvenienced, but nothing
|
||||
catastrophic can occur. The `RefCell<T>` type is useful when you’re sure your
|
||||
code follows the borrowing rules but the compiler is unable to understand and
|
||||
guarantee that.
|
||||
|
||||
Similar to `Rc<T>`, `RefCell<T>` is only for use in single-threaded scenarios
|
||||
and will give you a compile-time error if you try using it in a multithreaded
|
||||
context. We’ll talk about how to get the functionality of `RefCell<T>` in a
|
||||
multithreaded program in Chapter 16.
|
||||
|
||||
Here is a recap of the reasons to choose `Box<T>`, `Rc<T>`, or `RefCell<T>`:
|
||||
|
||||
* `Rc<T>` enables multiple owners of the same data; `Box<T>` and `RefCell<T>`
|
||||
have single owners.
|
||||
* `Box<T>` allows immutable or mutable borrows checked at compile time; `Rc<T>`
|
||||
allows only immutable borrows checked at compile time; `RefCell<T>` allows
|
||||
immutable or mutable borrows checked at runtime.
|
||||
* Because `RefCell<T>` allows mutable borrows checked at runtime, you can
|
||||
mutate the value inside the `RefCell<T>` even when the `RefCell<T>` is
|
||||
immutable.
|
||||
|
||||
Mutating the value inside an immutable value is the *interior mutability*
|
||||
pattern. Let’s look at a situation in which interior mutability is useful and
|
||||
examine how it’s possible.
|
||||
|
||||
### Interior Mutability: A Mutable Borrow to an Immutable Value
|
||||
|
||||
A consequence of the borrowing rules is that when you have an immutable value,
|
||||
you can’t borrow it mutably. For example, this code won’t compile:
|
||||
|
||||
```rust,ignore
|
||||
fn main() {
|
||||
let x = 5;
|
||||
let y = &mut x;
|
||||
}
|
||||
```
|
||||
|
||||
If you tried to compile this code, you’d get the following error:
|
||||
|
||||
```text
|
||||
error[E0596]: cannot borrow immutable local variable `x` as mutable
|
||||
--> src/main.rs:3:18
|
||||
|
|
||||
2 | let x = 5;
|
||||
| - consider changing this to `mut x`
|
||||
3 | let y = &mut x;
|
||||
| ^ cannot borrow mutably
|
||||
```
|
||||
|
||||
However, there are situations in which it would be useful for a value to mutate
|
||||
itself in its methods but appear immutable to other code. Code outside the
|
||||
value’s methods would not be able to mutate the value. Using `RefCell<T>` is
|
||||
one way to get the ability to have interior mutability. But `RefCell<T>`
|
||||
doesn’t get around the borrowing rules completely: the borrow checker in the
|
||||
compiler allows this interior mutability, and the borrowing rules are checked
|
||||
at runtime instead. If you violate the rules, you’ll get a `panic!` instead of
|
||||
a compiler error.
|
||||
|
||||
Let’s work through a practical example where we can use `RefCell<T>` to mutate
|
||||
an immutable value and see why that is useful.
|
||||
|
||||
#### A Use Case for Interior Mutability: Mock Objects
|
||||
|
||||
A *test double* is the general programming concept for a type used in place of
|
||||
another type during testing. *Mock objects* are specific types of test doubles
|
||||
that record what happens during a test so you can assert that the correct
|
||||
actions took place.
|
||||
|
||||
Rust doesn’t have objects in the same sense as other languages have objects,
|
||||
and Rust doesn’t have mock object functionality built into the standard library
|
||||
as some other languages do. However, you can definitely create a struct that
|
||||
will serve the same purposes as a mock object.
|
||||
|
||||
Here’s the scenario we’ll test: we’ll create a library that tracks a value
|
||||
against a maximum value and sends messages based on how close to the maximum
|
||||
value the current value is. This library could be used to keep track of a
|
||||
user’s quota for the number of API calls they’re allowed to make, for example.
|
||||
|
||||
Our library will only provide the functionality of tracking how close to the
|
||||
maximum a value is and what the messages should be at what times. Applications
|
||||
that use our library will be expected to provide the mechanism for sending the
|
||||
messages: the application could put a message in the application, send an
|
||||
email, send a text message, or something else. The library doesn’t need to know
|
||||
that detail. All it needs is something that implements a trait we’ll provide
|
||||
called `Messenger`. Listing 15-20 shows the library code:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
pub trait Messenger {
|
||||
fn send(&self, msg: &str);
|
||||
}
|
||||
|
||||
pub struct LimitTracker<'a, T: 'a + Messenger> {
|
||||
messenger: &'a T,
|
||||
value: usize,
|
||||
max: usize,
|
||||
}
|
||||
|
||||
impl<'a, T> LimitTracker<'a, T>
|
||||
where T: Messenger {
|
||||
pub fn new(messenger: &T, max: usize) -> LimitTracker<T> {
|
||||
LimitTracker {
|
||||
messenger,
|
||||
value: 0,
|
||||
max,
|
||||
}
|
||||
}
|
||||
|
||||
pub fn set_value(&mut self, value: usize) {
|
||||
self.value = value;
|
||||
|
||||
let percentage_of_max = self.value as f64 / self.max as f64;
|
||||
|
||||
if percentage_of_max >= 0.75 && percentage_of_max < 0.9 {
|
||||
self.messenger.send("Warning: You've used up over 75% of your quota!");
|
||||
} else if percentage_of_max >= 0.9 && percentage_of_max < 1.0 {
|
||||
self.messenger.send("Urgent warning: You've used up over 90% of your quota!");
|
||||
} else if percentage_of_max >= 1.0 {
|
||||
self.messenger.send("Error: You are over your quota!");
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-20: A library to keep track of how close a
|
||||
value is to a maximum value and warn when the value is at certain levels</span>
|
||||
|
||||
One important part of this code is that the `Messenger` trait has one method
|
||||
called `send` that takes an immutable reference to `self` and the text of the
|
||||
message. This is the interface our mock object needs to have. The other
|
||||
important part is that we want to test the behavior of the `set_value` method
|
||||
on the `LimitTracker`. We can change what we pass in for the `value` parameter,
|
||||
but `set_value` doesn’t return anything for us to make assertions on. We want
|
||||
to be able to say that if we create a `LimitTracker` with something that
|
||||
implements the `Messenger` trait and a particular value for `max`, when we pass
|
||||
different numbers for `value`, the messenger is told to send the appropriate
|
||||
messages.
|
||||
|
||||
We need a mock object that, instead of sending an email or text message when we
|
||||
call `send`, will only keep track of the messages it’s told to send. We can
|
||||
create a new instance of the mock object, create a `LimitTracker` that uses the
|
||||
mock object, call the `set_value` method on `LimitTracker`, and then check that
|
||||
the mock object has the messages we expect. Listing 15-21 shows an attempt to
|
||||
implement a mock object to do just that, but the borrow checker won’t allow it:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
|
||||
struct MockMessenger {
|
||||
sent_messages: Vec<String>,
|
||||
}
|
||||
|
||||
impl MockMessenger {
|
||||
fn new() -> MockMessenger {
|
||||
MockMessenger { sent_messages: vec![] }
|
||||
}
|
||||
}
|
||||
|
||||
impl Messenger for MockMessenger {
|
||||
fn send(&self, message: &str) {
|
||||
self.sent_messages.push(String::from(message));
|
||||
}
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn it_sends_an_over_75_percent_warning_message() {
|
||||
let mock_messenger = MockMessenger::new();
|
||||
let mut limit_tracker = LimitTracker::new(&mock_messenger, 100);
|
||||
|
||||
limit_tracker.set_value(80);
|
||||
|
||||
assert_eq!(mock_messenger.sent_messages.len(), 1);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-21: An attempt to implement a `MockMessenger`
|
||||
that isn’t allowed by the borrow checker</span>
|
||||
|
||||
This test code defines a `MockMessenger` struct that has a `sent_messages`
|
||||
field with a `Vec` of `String` values to keep track of the messages it’s told
|
||||
to send. We also define an associated function `new` to make it convenient to
|
||||
create new `MockMessenger` values that start with an empty list of messages. We
|
||||
then implement the `Messenger` trait for `MockMessenger` so we can give a
|
||||
`MockMessenger` to a `LimitTracker`. In the definition of the `send` method, we
|
||||
take the message passed in as a parameter and store it in the `MockMessenger`
|
||||
list of `sent_messages`.
|
||||
|
||||
In the test, we’re testing what happens when the `LimitTracker` is told to set
|
||||
`value` to something that is more than 75 percent of the `max` value. First, we
|
||||
create a new `MockMessenger`, which will start with an empty list of messages.
|
||||
Then we create a new `LimitTracker` and give it a reference to the new
|
||||
`MockMessenger` and a `max` value of 100. We call the `set_value` method on the
|
||||
`LimitTracker` with a value of 80, which is more than 75 percent of 100. Then
|
||||
we assert that the list of messages that the `MockMessenger` is keeping track
|
||||
of should now have one message in it.
|
||||
|
||||
However, there’s one problem with this test, as shown here:
|
||||
|
||||
```text
|
||||
error[E0596]: cannot borrow immutable field `self.sent_messages` as mutable
|
||||
--> src/lib.rs:52:13
|
||||
|
|
||||
51 | fn send(&self, message: &str) {
|
||||
| ----- use `&mut self` here to make mutable
|
||||
52 | self.sent_messages.push(String::from(message));
|
||||
| ^^^^^^^^^^^^^^^^^^ cannot mutably borrow immutable field
|
||||
```
|
||||
|
||||
We can’t modify the `MockMessenger` to keep track of the messages, because the
|
||||
`send` method takes an immutable reference to `self`. We also can’t take the
|
||||
suggestion from the error text to use `&mut self` instead, because then the
|
||||
signature of `send` wouldn’t match the signature in the `Messenger` trait
|
||||
definition (feel free to try and see what error message you get).
|
||||
|
||||
This is a situation in which interior mutability can help! We’ll store the
|
||||
`sent_messages` within a `RefCell<T>`, and then the `send` message will be
|
||||
able to modify `sent_messages` to store the messages we’ve seen. Listing 15-22
|
||||
shows what that looks like:
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::*;
|
||||
use std::cell::RefCell;
|
||||
|
||||
struct MockMessenger {
|
||||
sent_messages: RefCell<Vec<String>>,
|
||||
}
|
||||
|
||||
impl MockMessenger {
|
||||
fn new() -> MockMessenger {
|
||||
MockMessenger { sent_messages: RefCell::new(vec![]) }
|
||||
}
|
||||
}
|
||||
|
||||
impl Messenger for MockMessenger {
|
||||
fn send(&self, message: &str) {
|
||||
self.sent_messages.borrow_mut().push(String::from(message));
|
||||
}
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn it_sends_an_over_75_percent_warning_message() {
|
||||
// --snip--
|
||||
# let mock_messenger = MockMessenger::new();
|
||||
# let mut limit_tracker = LimitTracker::new(&mock_messenger, 100);
|
||||
# limit_tracker.set_value(75);
|
||||
|
||||
assert_eq!(mock_messenger.sent_messages.borrow().len(), 1);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-22: Using `RefCell<T>` to mutate an inner
|
||||
value while the outer value is considered immutable</span>
|
||||
|
||||
The `sent_messages` field is now of type `RefCell<Vec<String>>` instead of
|
||||
`Vec<String>`. In the `new` function, we create a new `RefCell<Vec<String>>`
|
||||
instance around the empty vector.
|
||||
|
||||
For the implementation of the `send` method, the first parameter is still an
|
||||
immutable borrow of `self`, which matches the trait definition. We call
|
||||
`borrow_mut` on the `RefCell<Vec<String>>` in `self.sent_messages` to get a
|
||||
mutable reference to the value inside the `RefCell<Vec<String>>`, which is
|
||||
the vector. Then we can call `push` on the mutable reference to the vector to
|
||||
keep track of the messages sent during the test.
|
||||
|
||||
The last change we have to make is in the assertion: to see how many items are
|
||||
in the inner vector, we call `borrow` on the `RefCell<Vec<String>>` to get an
|
||||
immutable reference to the vector.
|
||||
|
||||
Now that you’ve seen how to use `RefCell<T>`, let’s dig into how it works!
|
||||
|
||||
#### Keeping Track of Borrows at Runtime with `RefCell<T>`
|
||||
|
||||
When creating immutable and mutable references, we use the `&` and `&mut`
|
||||
syntax, respectively. With `RefCell<T>`, we use the `borrow` and `borrow_mut`
|
||||
methods, which are part of the safe API that belongs to `RefCell<T>`. The
|
||||
`borrow` method returns the smart pointer type `Ref<T>`, and `borrow_mut`
|
||||
returns the smart pointer type `RefMut<T>`. Both types implement `Deref`, so we
|
||||
can treat them like regular references.
|
||||
|
||||
The `RefCell<T>` keeps track of how many `Ref<T>` and `RefMut<T>` smart
|
||||
pointers are currently active. Every time we call `borrow`, the `RefCell<T>`
|
||||
increases its count of how many immutable borrows are active. When a `Ref<T>`
|
||||
value goes out of scope, the count of immutable borrows goes down by one. Just
|
||||
like the compile-time borrowing rules, `RefCell<T>` lets us have many immutable
|
||||
borrows or one mutable borrow at any point in time.
|
||||
|
||||
If we try to violate these rules, rather than getting a compiler error as we
|
||||
would with references, the implementation of `RefCell<T>` will panic at
|
||||
runtime. Listing 15-23 shows a modification of the implementation of `send` in
|
||||
Listing 15-22. We’re deliberately trying to create two mutable borrows active
|
||||
for the same scope to illustrate that `RefCell<T>` prevents us from doing this
|
||||
at runtime.
|
||||
|
||||
<span class="filename">Filename: src/lib.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
impl Messenger for MockMessenger {
|
||||
fn send(&self, message: &str) {
|
||||
let mut one_borrow = self.sent_messages.borrow_mut();
|
||||
let mut two_borrow = self.sent_messages.borrow_mut();
|
||||
|
||||
one_borrow.push(String::from(message));
|
||||
two_borrow.push(String::from(message));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-23: Creating two mutable references in the
|
||||
same scope to see that `RefCell<T>` will panic</span>
|
||||
|
||||
We create a variable `one_borrow` for the `RefMut<T>` smart pointer returned
|
||||
from `borrow_mut`. Then we create another mutable borrow in the same way in the
|
||||
variable `two_borrow`. This makes two mutable references in the same scope,
|
||||
which isn’t allowed. When we run the tests for our library, the code in Listing
|
||||
15-23 will compile without any errors, but the test will fail:
|
||||
|
||||
```text
|
||||
---- tests::it_sends_an_over_75_percent_warning_message stdout ----
|
||||
thread 'tests::it_sends_an_over_75_percent_warning_message' panicked at
|
||||
'already borrowed: BorrowMutError', src/libcore/result.rs:906:4
|
||||
note: Run with `RUST_BACKTRACE=1` for a backtrace.
|
||||
```
|
||||
|
||||
Notice that the code panicked with the message `already borrowed:
|
||||
BorrowMutError`. This is how `RefCell<T>` handles violations of the borrowing
|
||||
rules at runtime.
|
||||
|
||||
Catching borrowing errors at runtime rather than compile time means that you
|
||||
would find a mistake in your code later in the development process and possibly
|
||||
not until your code was deployed to production. Also, your code would incur a
|
||||
small runtime performance penalty as a result of keeping track of the borrows
|
||||
at runtime rather than compile time. However, using `RefCell<T>` makes it
|
||||
possible to write a mock object that can modify itself to keep track of the
|
||||
messages it has seen while you’re using it in a context where only immutable
|
||||
values are allowed. You can use `RefCell<T>` despite its trade-offs to get more
|
||||
functionality than regular references provide.
|
||||
|
||||
### Having Multiple Owners of Mutable Data by Combining `Rc<T>` and `RefCell<T>`
|
||||
|
||||
A common way to use `RefCell<T>` is in combination with `Rc<T>`. Recall that
|
||||
`Rc<T>` lets you have multiple owners of some data, but it only gives immutable
|
||||
access to that data. If you have an `Rc<T>` that holds a `RefCell<T>`, you can
|
||||
get a value that can have multiple owners *and* that you can mutate!
|
||||
|
||||
For example, recall the cons list example in Listing 15-18 where we used
|
||||
`Rc<T>` to allow multiple lists to share ownership of another list. Because
|
||||
`Rc<T>` holds only immutable values, we can’t change any of the values in the
|
||||
list once we’ve created them. Let’s add in `RefCell<T>` to gain the ability to
|
||||
change the values in the lists. Listing 15-24 shows that by using a
|
||||
`RefCell<T>` in the `Cons` definition, we can modify the value stored in all
|
||||
the lists:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
#[derive(Debug)]
|
||||
enum List {
|
||||
Cons(Rc<RefCell<i32>>, Rc<List>),
|
||||
Nil,
|
||||
}
|
||||
|
||||
use List::{Cons, Nil};
|
||||
use std::rc::Rc;
|
||||
use std::cell::RefCell;
|
||||
|
||||
fn main() {
|
||||
let value = Rc::new(RefCell::new(5));
|
||||
|
||||
let a = Rc::new(Cons(Rc::clone(&value), Rc::new(Nil)));
|
||||
|
||||
let b = Cons(Rc::new(RefCell::new(6)), Rc::clone(&a));
|
||||
let c = Cons(Rc::new(RefCell::new(10)), Rc::clone(&a));
|
||||
|
||||
*value.borrow_mut() += 10;
|
||||
|
||||
println!("a after = {:?}", a);
|
||||
println!("b after = {:?}", b);
|
||||
println!("c after = {:?}", c);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-24: Using `Rc<RefCell<i32>>` to create a
|
||||
`List` that we can mutate</span>
|
||||
|
||||
We create a value that is an instance of `Rc<RefCell<i32>>` and store it in a
|
||||
variable named `value` so we can access it directly later. Then we create a
|
||||
`List` in `a` with a `Cons` variant that holds `value`. We need to clone
|
||||
`value` so both `a` and `value` have ownership of the inner `5` value rather
|
||||
than transferring ownership from `value` to `a` or having `a` borrow from
|
||||
`value`.
|
||||
|
||||
We wrap the list `a` in an `Rc<T>` so when we create lists `b` and `c`, they
|
||||
can both refer to `a`, which is what we did in Listing 15-18.
|
||||
|
||||
After we’ve created the lists in `a`, `b`, and `c`, we add 10 to the value in
|
||||
`value`. We do this by calling `borrow_mut` on `value`, which uses the
|
||||
automatic dereferencing feature we discussed in Chapter 5 (see the section
|
||||
“Where’s the `->` Operator?”) to dereference the `Rc<T>` to the inner
|
||||
`RefCell<T>` value. The `borrow_mut` method returns a `RefMut<T>` smart
|
||||
pointer, and we use the dereference operator on it and change the inner value.
|
||||
|
||||
When we print `a`, `b`, and `c`, we can see that they all have the modified
|
||||
value of 15 rather than 5:
|
||||
|
||||
```text
|
||||
a after = Cons(RefCell { value: 15 }, Nil)
|
||||
b after = Cons(RefCell { value: 6 }, Cons(RefCell { value: 15 }, Nil))
|
||||
c after = Cons(RefCell { value: 10 }, Cons(RefCell { value: 15 }, Nil))
|
||||
```
|
||||
|
||||
This technique is pretty neat! By using `RefCell<T>`, we have an outwardly
|
||||
immutable `List` value. But we can use the methods on `RefCell<T>` that provide
|
||||
access to its interior mutability so we can modify our data when we need to.
|
||||
The runtime checks of the borrowing rules protect us from data races, and it’s
|
||||
sometimes worth trading a bit of speed for this flexibility in our data
|
||||
structures.
|
||||
|
||||
The standard library has other types that provide interior mutability, such as
|
||||
`Cell<T>`, which is similar except that instead of giving references to the
|
||||
inner value, the value is copied in and out of the `Cell<T>`. There’s also
|
||||
`Mutex<T>`, which offers interior mutability that’s safe to use across threads;
|
||||
we’ll discuss its use in Chapter 16. Check out the standard library docs for
|
||||
more details on the differences between these types.
|
||||
498
2018-edition/src/ch15-06-reference-cycles.md
Normal file
498
2018-edition/src/ch15-06-reference-cycles.md
Normal file
@@ -0,0 +1,498 @@
|
||||
## Reference Cycles Can Leak Memory
|
||||
|
||||
Rust’s memory safety guarantees make it difficult, but not impossible, to
|
||||
accidentally create memory that is never cleaned up (known as a *memory leak*).
|
||||
Preventing memory leaks entirely is not one of Rust’s guarantees in the same
|
||||
way that disallowing data races at compile time is, meaning memory leaks are
|
||||
memory safe in Rust. We can see that Rust allows memory leaks by using `Rc<T>`
|
||||
and `RefCell<T>`: it’s possible to create references where items refer to each
|
||||
other in a cycle. This creates memory leaks because the reference count of each
|
||||
item in the cycle will never reach 0, and the values will never be dropped.
|
||||
|
||||
### Creating a Reference Cycle
|
||||
|
||||
Let’s look at how a reference cycle might happen and how to prevent it,
|
||||
starting with the definition of the `List` enum and a `tail` method in Listing
|
||||
15-25:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
<!-- Hidden fn main is here to disable the automatic wrapping in fn main that
|
||||
doc tests do; the `use List` fails if this listing is put within a main -->
|
||||
|
||||
```rust
|
||||
# fn main() {}
|
||||
use std::rc::Rc;
|
||||
use std::cell::RefCell;
|
||||
use List::{Cons, Nil};
|
||||
|
||||
#[derive(Debug)]
|
||||
enum List {
|
||||
Cons(i32, RefCell<Rc<List>>),
|
||||
Nil,
|
||||
}
|
||||
|
||||
impl List {
|
||||
fn tail(&self) -> Option<&RefCell<Rc<List>>> {
|
||||
match *self {
|
||||
Cons(_, ref item) => Some(item),
|
||||
Nil => None,
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-25: A cons list definition that holds a
|
||||
`RefCell<T>` so we can modify what a `Cons` variant is referring to</span>
|
||||
|
||||
We’re using another variation of the `List` definition in Listing 15-5. The
|
||||
second element in the `Cons` variant is now `RefCell<Rc<List>>`, meaning that
|
||||
instead of having the ability to modify the `i32` value as we did in Listing
|
||||
15-24, we want to modify which `List` value a `Cons` variant is pointing to.
|
||||
We’re also adding a `tail` method to make it convenient for us to access the
|
||||
second item if we have a `Cons` variant.
|
||||
|
||||
In Listing 15-26, we’re adding a `main` function that uses the definitions in
|
||||
Listing 15-25. This code creates a list in `a` and a list in `b` that points to
|
||||
the list in `a`. Then it modifies the list in `a` to point to `b`, creating a
|
||||
reference cycle. There are `println!` statements along the way to show what the
|
||||
reference counts are at various points in this process.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use List::{Cons, Nil};
|
||||
# use std::rc::Rc;
|
||||
# use std::cell::RefCell;
|
||||
# #[derive(Debug)]
|
||||
# enum List {
|
||||
# Cons(i32, RefCell<Rc<List>>),
|
||||
# Nil,
|
||||
# }
|
||||
#
|
||||
# impl List {
|
||||
# fn tail(&self) -> Option<&RefCell<Rc<List>>> {
|
||||
# match *self {
|
||||
# Cons(_, ref item) => Some(item),
|
||||
# Nil => None,
|
||||
# }
|
||||
# }
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let a = Rc::new(Cons(5, RefCell::new(Rc::new(Nil))));
|
||||
|
||||
println!("a initial rc count = {}", Rc::strong_count(&a));
|
||||
println!("a next item = {:?}", a.tail());
|
||||
|
||||
let b = Rc::new(Cons(10, RefCell::new(Rc::clone(&a))));
|
||||
|
||||
println!("a rc count after b creation = {}", Rc::strong_count(&a));
|
||||
println!("b initial rc count = {}", Rc::strong_count(&b));
|
||||
println!("b next item = {:?}", b.tail());
|
||||
|
||||
if let Some(link) = a.tail() {
|
||||
*link.borrow_mut() = Rc::clone(&b);
|
||||
}
|
||||
|
||||
println!("b rc count after changing a = {}", Rc::strong_count(&b));
|
||||
println!("a rc count after changing a = {}", Rc::strong_count(&a));
|
||||
|
||||
// Uncomment the next line to see that we have a cycle;
|
||||
// it will overflow the stack
|
||||
// println!("a next item = {:?}", a.tail());
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-26: Creating a reference cycle of two `List`
|
||||
values pointing to each other</span>
|
||||
|
||||
We create an `Rc<List>` instance holding a `List` value in the variable `a`
|
||||
with an initial list of `5, Nil`. We then create an `Rc<List>` instance
|
||||
holding another `List` value in the variable `b` that contains the value 10 and
|
||||
points to the list in `a`.
|
||||
|
||||
We modify `a` so it points to `b` instead of `Nil`, creating a cycle. We
|
||||
do that by using the `tail` method to get a reference to the
|
||||
`RefCell<Rc<List>>` in `a`, which we put in the variable `link`. Then we use
|
||||
the `borrow_mut` method on the `RefCell<Rc<List>>` to change the value inside
|
||||
from an `Rc<List>` that holds a `Nil` value to the `Rc<List>` in `b`.
|
||||
|
||||
When we run this code, keeping the last `println!` commented out for the
|
||||
moment, we’ll get this output:
|
||||
|
||||
```text
|
||||
a initial rc count = 1
|
||||
a next item = Some(RefCell { value: Nil })
|
||||
a rc count after b creation = 2
|
||||
b initial rc count = 1
|
||||
b next item = Some(RefCell { value: Cons(5, RefCell { value: Nil }) })
|
||||
b rc count after changing a = 2
|
||||
a rc count after changing a = 2
|
||||
```
|
||||
|
||||
The reference count of the `Rc<List>` instances in both `a` and `b` are 2
|
||||
after we change the list in `a` to point to `b`. At the end of `main`, Rust
|
||||
will try to drop `b` first, which will decrease the count in each of the
|
||||
`Rc<List>` instances in `a` and `b` by 1.
|
||||
|
||||
However, because `a` is still referencing the `Rc<List>` that was in `b`, that
|
||||
`Rc<List>` has a count of 1 rather than 0, so the memory the `Rc<List>` has on
|
||||
the heap won’t be dropped. The memory will just sit there with a count of 1,
|
||||
forever. To visualize this reference cycle, we’ve created a diagram in Figure
|
||||
15-4.
|
||||
|
||||
<img alt="Reference cycle of lists" src="img/trpl15-04.svg" class="center" />
|
||||
|
||||
<span class="caption">Figure 15-4: A reference cycle of lists `a` and `b`
|
||||
pointing to each other</span>
|
||||
|
||||
If you uncomment the last `println!` and run the program, Rust will try to
|
||||
print this cycle with `a` pointing to `b` pointing to `a` and so forth until it
|
||||
overflows the stack.
|
||||
|
||||
In this case, right after we create the reference cycle, the program ends. The
|
||||
consequences of this cycle aren’t very dire. However, if a more complex program
|
||||
allocated lots of memory in a cycle and held onto it for a long time, the
|
||||
program would use more memory than it needed and might overwhelm the system,
|
||||
causing it to run out of available memory.
|
||||
|
||||
Creating reference cycles is not easily done, but it’s not impossible either.
|
||||
If you have `RefCell<T>` values that contain `Rc<T>` values or similar nested
|
||||
combinations of types with interior mutability and reference counting, you must
|
||||
ensure that you don’t create cycles; you can’t rely on Rust to catch them.
|
||||
Creating a reference cycle would be a logic bug in your program that you should
|
||||
use automated tests, code reviews, and other software development practices to
|
||||
minimize.
|
||||
|
||||
Another solution for avoiding reference cycles is reorganizing your data
|
||||
structures so that some references express ownership and some references don’t.
|
||||
As a result, you can have cycles made up of some ownership relationships and
|
||||
some non-ownership relationships, and only the ownership relationships affect
|
||||
whether or not a value can be dropped. In Listing 15-25, we always want `Cons`
|
||||
variants to own their list, so reorganizing the data structure isn’t possible.
|
||||
Let’s look at an example using graphs made up of parent nodes and child nodes
|
||||
to see when non-ownership relationships are an appropriate way to prevent
|
||||
reference cycles.
|
||||
|
||||
### Preventing Reference Cycles: Turning an `Rc<T>` into a `Weak<T>`
|
||||
|
||||
So far, we’ve demonstrated that calling `Rc::clone` increases the
|
||||
`strong_count` of an `Rc<T>` instance, and an `Rc<T>` instance is only cleaned
|
||||
up if its `strong_count` is 0. You can also create a *weak reference* to the
|
||||
value within an `Rc<T>` instance by calling `Rc::downgrade` and passing a
|
||||
reference to the `Rc<T>`. When you call `Rc::downgrade`, you get a smart
|
||||
pointer of type `Weak<T>`. Instead of increasing the `strong_count` in the
|
||||
`Rc<T>` instance by 1, calling `Rc::downgrade` increases the `weak_count` by 1.
|
||||
The `Rc<T>` type uses `weak_count` to keep track of how many `Weak<T>`
|
||||
references exist, similar to `strong_count`. The difference is the `weak_count`
|
||||
doesn’t need to be 0 for the `Rc<T>` instance to be cleaned up.
|
||||
|
||||
Strong references are how you can share ownership of an `Rc<T>` instance. Weak
|
||||
references don’t express an ownership relationship. They won’t cause a
|
||||
reference cycle because any cycle involving some weak references will be broken
|
||||
once the strong reference count of values involved is 0.
|
||||
|
||||
Because the value that `Weak<T>` references might have been dropped, to do
|
||||
anything with the value that a `Weak<T>` is pointing to, you must make sure the
|
||||
value still exists. Do this by calling the `upgrade` method on a `Weak<T>`
|
||||
instance, which will return an `Option<Rc<T>>`. You’ll get a result of `Some`
|
||||
if the `Rc<T>` value has not been dropped yet and a result of `None` if the
|
||||
`Rc<T>` value has been dropped. Because `upgrade` returns an `Option<T>`, Rust
|
||||
will ensure that the `Some` case and the `None` case are handled, and there
|
||||
won’t be an invalid pointer.
|
||||
|
||||
As an example, rather than using a list whose items know only about the next
|
||||
item, we’ll create a tree whose items know about their children items *and*
|
||||
their parent items.
|
||||
|
||||
#### Creating a Tree Data Structure: a `Node` with Child Nodes
|
||||
|
||||
To start, we’ll build a tree with nodes that know about their child nodes.
|
||||
We’ll create a struct named `Node` that holds its own `i32` value as well as
|
||||
references to its children `Node` values:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::rc::Rc;
|
||||
use std::cell::RefCell;
|
||||
|
||||
#[derive(Debug)]
|
||||
struct Node {
|
||||
value: i32,
|
||||
children: RefCell<Vec<Rc<Node>>>,
|
||||
}
|
||||
```
|
||||
|
||||
We want a `Node` to own its children, and we want to share that ownership with
|
||||
variables so we can access each `Node` in the tree directly. To do this, we
|
||||
define the `Vec<T>` items to be values of type `Rc<Node>`. We also want to
|
||||
modify which nodes are children of another node, so we have a `RefCell<T>` in
|
||||
`children` around the `Vec<Rc<Node>>`.
|
||||
|
||||
Next, we’ll use our struct definition and create one `Node` instance named
|
||||
`leaf` with the value 3 and no children, and another instance named `branch`
|
||||
with the value 5 and `leaf` as one of its children, as shown in Listing 15-27:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::rc::Rc;
|
||||
# use std::cell::RefCell;
|
||||
#
|
||||
# #[derive(Debug)]
|
||||
# struct Node {
|
||||
# value: i32,
|
||||
# children: RefCell<Vec<Rc<Node>>>,
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let leaf = Rc::new(Node {
|
||||
value: 3,
|
||||
children: RefCell::new(vec![]),
|
||||
});
|
||||
|
||||
let branch = Rc::new(Node {
|
||||
value: 5,
|
||||
children: RefCell::new(vec![Rc::clone(&leaf)]),
|
||||
});
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-27: Creating a `leaf` node with no children
|
||||
and a `branch` node with `leaf` as one of its children</span>
|
||||
|
||||
We clone the `Rc<Node>` in `leaf` and store that in `branch`, meaning the
|
||||
`Node` in `leaf` now has two owners: `leaf` and `branch`. We can get from
|
||||
`branch` to `leaf` through `branch.children`, but there’s no way to get from
|
||||
`leaf` to `branch`. The reason is that `leaf` has no reference to `branch` and
|
||||
doesn’t know they’re related. We want `leaf` to know that `branch` is its
|
||||
parent. We’ll do that next.
|
||||
|
||||
#### Adding a Reference from a Child to Its Parent
|
||||
|
||||
To make the child node aware of its parent, we need to add a `parent` field to
|
||||
our `Node` struct definition. The trouble is in deciding what the type of
|
||||
`parent` should be. We know it can’t contain an `Rc<T>`, because that would
|
||||
create a reference cycle with `leaf.parent` pointing to `branch` and
|
||||
`branch.children` pointing to `leaf`, which would cause their `strong_count`
|
||||
values to never be 0.
|
||||
|
||||
Thinking about the relationships another way, a parent node should own its
|
||||
children: if a parent node is dropped, its child nodes should be dropped as
|
||||
well. However, a child should not own its parent: if we drop a child node, the
|
||||
parent should still exist. This is a case for weak references!
|
||||
|
||||
So instead of `Rc<T>`, we’ll make the type of `parent` use `Weak<T>`,
|
||||
specifically a `RefCell<Weak<Node>>`. Now our `Node` struct definition looks
|
||||
like this:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::rc::{Rc, Weak};
|
||||
use std::cell::RefCell;
|
||||
|
||||
#[derive(Debug)]
|
||||
struct Node {
|
||||
value: i32,
|
||||
parent: RefCell<Weak<Node>>,
|
||||
children: RefCell<Vec<Rc<Node>>>,
|
||||
}
|
||||
```
|
||||
|
||||
A node will be able to refer to its parent node but doesn’t own its parent.
|
||||
In Listing 15-28, we update `main` to use this new definition so the `leaf`
|
||||
node will have a way to refer to its parent, `branch`:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::rc::{Rc, Weak};
|
||||
# use std::cell::RefCell;
|
||||
#
|
||||
# #[derive(Debug)]
|
||||
# struct Node {
|
||||
# value: i32,
|
||||
# parent: RefCell<Weak<Node>>,
|
||||
# children: RefCell<Vec<Rc<Node>>>,
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let leaf = Rc::new(Node {
|
||||
value: 3,
|
||||
parent: RefCell::new(Weak::new()),
|
||||
children: RefCell::new(vec![]),
|
||||
});
|
||||
|
||||
println!("leaf parent = {:?}", leaf.parent.borrow().upgrade());
|
||||
|
||||
let branch = Rc::new(Node {
|
||||
value: 5,
|
||||
parent: RefCell::new(Weak::new()),
|
||||
children: RefCell::new(vec![Rc::clone(&leaf)]),
|
||||
});
|
||||
|
||||
*leaf.parent.borrow_mut() = Rc::downgrade(&branch);
|
||||
|
||||
println!("leaf parent = {:?}", leaf.parent.borrow().upgrade());
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-28: A `leaf` node with a weak reference to its
|
||||
parent node `branch`</span>
|
||||
|
||||
Creating the `leaf` node looks similar to how creating the `leaf` node looked
|
||||
in Listing 15-27 with the exception of the `parent` field: `leaf` starts out
|
||||
without a parent, so we create a new, empty `Weak<Node>` reference instance.
|
||||
|
||||
At this point, when we try to get a reference to the parent of `leaf` by using
|
||||
the `upgrade` method, we get a `None` value. We see this in the output from the
|
||||
first `println!` statement:
|
||||
|
||||
```text
|
||||
leaf parent = None
|
||||
```
|
||||
|
||||
When we create the `branch` node, it will also have a new `Weak<Node>`
|
||||
reference in the `parent` field, because `branch` doesn’t have a parent node.
|
||||
We still have `leaf` as one of the children of `branch`. Once we have the
|
||||
`Node` instance in `branch`, we can modify `leaf` to give it a `Weak<Node>`
|
||||
reference to its parent. We use the `borrow_mut` method on the
|
||||
`RefCell<Weak<Node>>` in the `parent` field of `leaf`, and then we use the
|
||||
`Rc::downgrade` function to create a `Weak<Node>` reference to `branch` from
|
||||
the `Rc<Node>` in `branch.`
|
||||
|
||||
When we print the parent of `leaf` again, this time we’ll get a `Some` variant
|
||||
holding `branch`: now `leaf` can access its parent! When we print `leaf`, we
|
||||
also avoid the cycle that eventually ended in a stack overflow like we had in
|
||||
Listing 15-26; the `Weak<Node>` references are printed as `(Weak)`:
|
||||
|
||||
```text
|
||||
leaf parent = Some(Node { value: 5, parent: RefCell { value: (Weak) },
|
||||
children: RefCell { value: [Node { value: 3, parent: RefCell { value: (Weak) },
|
||||
children: RefCell { value: [] } }] } })
|
||||
```
|
||||
|
||||
The lack of infinite output indicates that this code didn’t create a reference
|
||||
cycle. We can also tell this by looking at the values we get from calling
|
||||
`Rc::strong_count` and `Rc::weak_count`.
|
||||
|
||||
#### Visualizing Changes to `strong_count` and `weak_count`
|
||||
|
||||
Let’s look at how the `strong_count` and `weak_count` values of the `Rc<Node>`
|
||||
instances change by creating a new inner scope and moving the creation of
|
||||
`branch` into that scope. By doing so, we can see what happens when `branch` is
|
||||
created and then dropped when it goes out of scope. The modifications are shown
|
||||
in Listing 15-29:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::rc::{Rc, Weak};
|
||||
# use std::cell::RefCell;
|
||||
#
|
||||
# #[derive(Debug)]
|
||||
# struct Node {
|
||||
# value: i32,
|
||||
# parent: RefCell<Weak<Node>>,
|
||||
# children: RefCell<Vec<Rc<Node>>>,
|
||||
# }
|
||||
#
|
||||
fn main() {
|
||||
let leaf = Rc::new(Node {
|
||||
value: 3,
|
||||
parent: RefCell::new(Weak::new()),
|
||||
children: RefCell::new(vec![]),
|
||||
});
|
||||
|
||||
println!(
|
||||
"leaf strong = {}, weak = {}",
|
||||
Rc::strong_count(&leaf),
|
||||
Rc::weak_count(&leaf),
|
||||
);
|
||||
|
||||
{
|
||||
let branch = Rc::new(Node {
|
||||
value: 5,
|
||||
parent: RefCell::new(Weak::new()),
|
||||
children: RefCell::new(vec![Rc::clone(&leaf)]),
|
||||
});
|
||||
|
||||
*leaf.parent.borrow_mut() = Rc::downgrade(&branch);
|
||||
|
||||
println!(
|
||||
"branch strong = {}, weak = {}",
|
||||
Rc::strong_count(&branch),
|
||||
Rc::weak_count(&branch),
|
||||
);
|
||||
|
||||
println!(
|
||||
"leaf strong = {}, weak = {}",
|
||||
Rc::strong_count(&leaf),
|
||||
Rc::weak_count(&leaf),
|
||||
);
|
||||
}
|
||||
|
||||
println!("leaf parent = {:?}", leaf.parent.borrow().upgrade());
|
||||
println!(
|
||||
"leaf strong = {}, weak = {}",
|
||||
Rc::strong_count(&leaf),
|
||||
Rc::weak_count(&leaf),
|
||||
);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 15-29: Creating `branch` in an inner scope and
|
||||
examining strong and weak reference counts</span>
|
||||
|
||||
After `leaf` is created, its `Rc<Node>` has a strong count of 1 and a weak
|
||||
count of 0. In the inner scope, we create `branch` and associate it with
|
||||
`leaf`, at which point when we print the counts, the `Rc<Node>` in `branch`
|
||||
will have a strong count of 1 and a weak count of 1 (for `leaf.parent` pointing
|
||||
to `branch` with a `Weak<Node>`). When we print the counts in `leaf`, we’ll see
|
||||
it will have a strong count of 2, because `branch` now has a clone of the
|
||||
`Rc<Node>` of `leaf` stored in `branch.children`, but will still have a weak
|
||||
count of 0.
|
||||
|
||||
When the inner scope ends, `branch` goes out of scope and the strong count of
|
||||
the `Rc<Node>` decreases to 0, so its `Node` is dropped. The weak count of 1
|
||||
from `leaf.parent` has no bearing on whether or not `Node` is dropped, so we
|
||||
don’t get any memory leaks!
|
||||
|
||||
If we try to access the parent of `leaf` after the end of the scope, we’ll get
|
||||
`None` again. At the end of the program, the `Rc<Node>` in `leaf` has a strong
|
||||
count of 1 and a weak count of 0, because the variable `leaf` is now the only
|
||||
reference to the `Rc<Node>` again.
|
||||
|
||||
All of the logic that manages the counts and value dropping is built into
|
||||
`Rc<T>` and `Weak<T>` and their implementations of the `Drop` trait. By
|
||||
specifying that the relationship from a child to its parent should be a
|
||||
`Weak<T>` reference in the definition of `Node`, you’re able to have parent
|
||||
nodes point to child nodes and vice versa without creating a reference cycle
|
||||
and memory leaks.
|
||||
|
||||
## Summary
|
||||
|
||||
This chapter covered how to use smart pointers to make different guarantees and
|
||||
trade-offs than those Rust makes by default with regular references. The
|
||||
`Box<T>` type has a known size and points to data allocated on the heap. The
|
||||
`Rc<T>` type keeps track of the number of references to data on the heap so
|
||||
that data can have multiple owners. The `RefCell<T>` type with its interior
|
||||
mutability gives us a type that we can use when we need an immutable type but
|
||||
need to change an inner value of that type; it also enforces the borrowing
|
||||
rules at runtime instead of at compile time.
|
||||
|
||||
Also discussed were the `Deref` and `Drop` traits, which enable a lot of the
|
||||
functionality of smart pointers. We explored reference cycles that can cause
|
||||
memory leaks and how to prevent them using `Weak<T>`.
|
||||
|
||||
If this chapter has piqued your interest and you want to implement your own
|
||||
smart pointers, check out [“The Rustonomicon”][nomicon] for more useful
|
||||
information.
|
||||
|
||||
[nomicon]: https://doc.rust-lang.org/stable/nomicon/
|
||||
|
||||
Next, we’ll talk about concurrency in Rust. You’ll even learn about a few new
|
||||
smart pointers.
|
||||
49
2018-edition/src/ch16-00-concurrency.md
Normal file
49
2018-edition/src/ch16-00-concurrency.md
Normal file
@@ -0,0 +1,49 @@
|
||||
# Fearless Concurrency
|
||||
|
||||
Handling concurrent programming safely and efficiently is another of Rust’s
|
||||
major goals. *Concurrent programming*, where different parts of a program
|
||||
execute independently, and *parallel programming*, where different parts of a
|
||||
program execute at the same time, are becoming increasingly important as more
|
||||
computers take advantage of their multiple processors. Historically,
|
||||
programming in these contexts has been difficult and error prone: Rust hopes to
|
||||
change that.
|
||||
|
||||
Initially, the Rust team thought that ensuring memory safety and preventing
|
||||
concurrency problems were two separate challenges to be solved with different
|
||||
methods. Over time, the team discovered that the ownership and type systems are
|
||||
a powerful set of tools to help manage memory safety *and* concurrency
|
||||
problems! By leveraging ownership and type checking, many concurrency errors
|
||||
are compile-time errors in Rust rather than runtime errors. Therefore, rather
|
||||
than making you spend lots of time trying to reproduce the exact circumstances
|
||||
under which a runtime concurrency bug occurs, incorrect code will refuse to
|
||||
compile and present an error explaining the problem. As a result, you can fix
|
||||
your code while you’re working on it rather than potentially after it has been
|
||||
shipped to production. We’ve nicknamed this aspect of Rust *fearless*
|
||||
*concurrency*. Fearless concurrency allows you to write code that is free of
|
||||
subtle bugs and is easy to refactor without introducing new bugs.
|
||||
|
||||
> Note: For simplicity’s sake, we’ll refer to many of the problems as
|
||||
> *concurrent* rather than being more precise by saying *concurrent and/or
|
||||
> parallel*. If this book were about concurrency and/or parallelism, we’d be
|
||||
> more specific. For this chapter, please mentally substitute *concurrent
|
||||
> and/or parallel* whenever we use *concurrent*.
|
||||
|
||||
Many languages are dogmatic about the solutions they offer for handling
|
||||
concurrent problems. For example, Erlang has elegant functionality for
|
||||
message-passing concurrency but has only obscure ways to share state between
|
||||
threads. Supporting only a subset of possible solutions is a reasonable
|
||||
strategy for higher-level languages, because a higher-level language promises
|
||||
benefits from giving up some control to gain abstractions. However, lower-level
|
||||
languages are expected to provide the solution with the best performance in any
|
||||
given situation and have fewer abstractions over the hardware. Therefore, Rust
|
||||
offers a variety of tools for modeling problems in whatever way is appropriate
|
||||
for your situation and requirements.
|
||||
|
||||
Here are the topics we’ll cover in this chapter:
|
||||
|
||||
* How to create threads to run multiple pieces of code at the same time
|
||||
* *Message-passing* concurrency, where channels send messages between threads
|
||||
* *Shared-state* concurrency, where multiple threads have access to some piece
|
||||
of data
|
||||
* The `Sync` and `Send` traits, which extend Rust’s concurrency guarantees to
|
||||
user-defined types as well as types provided by the standard library
|
||||
399
2018-edition/src/ch16-01-threads.md
Normal file
399
2018-edition/src/ch16-01-threads.md
Normal file
@@ -0,0 +1,399 @@
|
||||
## Using Threads to Run Code Simultaneously
|
||||
|
||||
In most current operating systems, an executed program’s code is run in a
|
||||
*process*, and the operating system manages multiple processes at once. Within
|
||||
your program, you can also have independent parts that run simultaneously. The
|
||||
features that run these independent parts are called *threads*.
|
||||
|
||||
Splitting the computation in your program into multiple threads can improve
|
||||
performance because the program does multiple tasks at the same time, but it
|
||||
also adds complexity. Because threads can run simultaneously, there’s no
|
||||
inherent guarantee about the order in which parts of your code on different
|
||||
threads will run. This can lead to problems, such as:
|
||||
|
||||
* Race conditions, where threads are accessing data or resources in an
|
||||
inconsistent order
|
||||
* Deadlocks, where two threads are waiting for each other to finish using a
|
||||
resource the other thread has, preventing both threads from continuing
|
||||
* Bugs that happen only in certain situations and are hard to reproduce and fix
|
||||
reliably
|
||||
|
||||
Rust attempts to mitigate the negative effects of using threads, but
|
||||
programming in a multithreaded context still takes careful thought and requires
|
||||
a code structure that is different from that in programs running in a single
|
||||
thread.
|
||||
|
||||
Programming languages implement threads in a few different ways. Many operating
|
||||
systems provide an API for creating new threads. This model where a language
|
||||
calls the operating system APIs to create threads is sometimes called *1:1*,
|
||||
meaning one operating system thread per one language thread.
|
||||
|
||||
Many programming languages provide their own special implementation of threads.
|
||||
Programming language-provided threads are known as *green* threads, and
|
||||
languages that use these green threads will execute them in the context of a
|
||||
different number of operating system threads. For this reason, the
|
||||
green-threaded model is called the *M:N* model: there are `M` green threads per
|
||||
`N` operating system threads, where `M` and `N` are not necessarily the same
|
||||
number.
|
||||
|
||||
Each model has its own advantages and trade-offs, and the trade-off most
|
||||
important to Rust is runtime support. *Runtime* is a confusing term and can
|
||||
have different meanings in different contexts.
|
||||
|
||||
In this context, by *runtime* we mean code that is included by the language in
|
||||
every binary. This code can be large or small depending on the language, but
|
||||
every non-assembly language will have some amount of runtime code. For that
|
||||
reason, colloquially when people say a language has “no runtime,” they often
|
||||
mean “small runtime.” Smaller runtimes have fewer features but have the
|
||||
advantage of resulting in smaller binaries, which make it easier to combine the
|
||||
language with other languages in more contexts. Although many languages are
|
||||
okay with increasing the runtime size in exchange for more features, Rust needs
|
||||
to have nearly no runtime and cannot compromise on being able to call into C to
|
||||
maintain performance.
|
||||
|
||||
The green-threading M:N model requires a larger language runtime to manage
|
||||
threads. As such, the Rust standard library only provides an implementation of
|
||||
1:1 threading. Because Rust is such a low-level language, there are crates that
|
||||
implement M:N threading if you would rather trade overhead for aspects such as
|
||||
more control over which threads run when and lower costs of context switching,
|
||||
for example.
|
||||
|
||||
Now that we’ve defined threads in Rust, let’s explore how to use the
|
||||
thread-related API provided by the standard library.
|
||||
|
||||
### Creating a New Thread with `spawn`
|
||||
|
||||
To create a new thread, we call the `thread::spawn` function and pass it a
|
||||
closure (we talked about closures in Chapter 13) containing the code we want to
|
||||
run in the new thread. The example in Listing 16-1 prints some text from a main
|
||||
thread and other text from a new thread:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::thread;
|
||||
use std::time::Duration;
|
||||
|
||||
fn main() {
|
||||
thread::spawn(|| {
|
||||
for i in 1..10 {
|
||||
println!("hi number {} from the spawned thread!", i);
|
||||
thread::sleep(Duration::from_millis(1));
|
||||
}
|
||||
});
|
||||
|
||||
for i in 1..5 {
|
||||
println!("hi number {} from the main thread!", i);
|
||||
thread::sleep(Duration::from_millis(1));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-1: Creating a new thread to print one thing
|
||||
while the main thread prints something else</span>
|
||||
|
||||
Note that with this function, the new thread will be stopped when the main
|
||||
thread ends, whether or not it has finished running. The output from this
|
||||
program might be a little different every time, but it will look similar to the
|
||||
following:
|
||||
|
||||
```text
|
||||
hi number 1 from the main thread!
|
||||
hi number 1 from the spawned thread!
|
||||
hi number 2 from the main thread!
|
||||
hi number 2 from the spawned thread!
|
||||
hi number 3 from the main thread!
|
||||
hi number 3 from the spawned thread!
|
||||
hi number 4 from the main thread!
|
||||
hi number 4 from the spawned thread!
|
||||
hi number 5 from the spawned thread!
|
||||
```
|
||||
|
||||
The calls to `thread::sleep` force a thread to stop its execution for a short
|
||||
duration, allowing a different thread to run. The threads will probably take
|
||||
turns, but that isn’t guaranteed: it depends on how your operating system
|
||||
schedules the threads. In this run, the main thread printed first, even though
|
||||
the print statement from the spawned thread appears first in the code. And even
|
||||
though we told the spawned thread to print until `i` is 9, it only got to 5
|
||||
before the main thread shut down.
|
||||
|
||||
If you run this code and only see output from the main thread, or don’t see any
|
||||
overlap, try increasing the numbers in the ranges to create more opportunities
|
||||
for the operating system to switch between the threads.
|
||||
|
||||
### Waiting for All Threads to Finish Using `join` Handles
|
||||
|
||||
The code in Listing 16-1 not only stops the spawned thread prematurely most of
|
||||
the time due to the main thread ending, but also can't guarantee that the
|
||||
spawned thread will get to run at all. The reason is that there is no guarantee
|
||||
on the order in which threads run!
|
||||
|
||||
We can fix the problem of the spawned thread not getting to run, or not getting
|
||||
to run completely, by saving the return value of `thread::spawn` in a variable.
|
||||
The return type of `thread::spawn` is `JoinHandle`. A `JoinHandle` is an owned
|
||||
value that, when we call the `join` method on it, will wait for its thread to
|
||||
finish. Listing 16-2 shows how to use the `JoinHandle` of the thread we created
|
||||
in Listing 16-1 and call `join` to make sure the spawned thread finishes before
|
||||
`main` exits:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::thread;
|
||||
use std::time::Duration;
|
||||
|
||||
fn main() {
|
||||
let handle = thread::spawn(|| {
|
||||
for i in 1..10 {
|
||||
println!("hi number {} from the spawned thread!", i);
|
||||
thread::sleep(Duration::from_millis(1));
|
||||
}
|
||||
});
|
||||
|
||||
for i in 1..5 {
|
||||
println!("hi number {} from the main thread!", i);
|
||||
thread::sleep(Duration::from_millis(1));
|
||||
}
|
||||
|
||||
handle.join().unwrap();
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-2: Saving a `JoinHandle` from `thread::spawn`
|
||||
to guarantee the thread is run to completion</span>
|
||||
|
||||
Calling `join` on the handle blocks the thread currently running until the
|
||||
thread represented by the handle terminates. *Blocking* a thread means that
|
||||
thread is prevented from performing work or exiting. Because we’ve put the call
|
||||
to `join` after the main thread’s `for` loop, running Listing 16-2 should
|
||||
produce output similar to this:
|
||||
|
||||
```text
|
||||
hi number 1 from the main thread!
|
||||
hi number 2 from the main thread!
|
||||
hi number 1 from the spawned thread!
|
||||
hi number 3 from the main thread!
|
||||
hi number 2 from the spawned thread!
|
||||
hi number 4 from the main thread!
|
||||
hi number 3 from the spawned thread!
|
||||
hi number 4 from the spawned thread!
|
||||
hi number 5 from the spawned thread!
|
||||
hi number 6 from the spawned thread!
|
||||
hi number 7 from the spawned thread!
|
||||
hi number 8 from the spawned thread!
|
||||
hi number 9 from the spawned thread!
|
||||
```
|
||||
|
||||
The two threads continue alternating, but the main thread waits because of the
|
||||
call to `handle.join()` and does not end until the spawned thread is finished.
|
||||
|
||||
But let’s see what happens when we instead move `handle.join()` before the
|
||||
`for` loop in `main`, like this:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::thread;
|
||||
use std::time::Duration;
|
||||
|
||||
fn main() {
|
||||
let handle = thread::spawn(|| {
|
||||
for i in 1..10 {
|
||||
println!("hi number {} from the spawned thread!", i);
|
||||
thread::sleep(Duration::from_millis(1));
|
||||
}
|
||||
});
|
||||
|
||||
handle.join().unwrap();
|
||||
|
||||
for i in 1..5 {
|
||||
println!("hi number {} from the main thread!", i);
|
||||
thread::sleep(Duration::from_millis(1));
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
The main thread will wait for the spawned thread to finish and then run its
|
||||
`for` loop, so the output won’t be interleaved anymore, as shown here:
|
||||
|
||||
```text
|
||||
hi number 1 from the spawned thread!
|
||||
hi number 2 from the spawned thread!
|
||||
hi number 3 from the spawned thread!
|
||||
hi number 4 from the spawned thread!
|
||||
hi number 5 from the spawned thread!
|
||||
hi number 6 from the spawned thread!
|
||||
hi number 7 from the spawned thread!
|
||||
hi number 8 from the spawned thread!
|
||||
hi number 9 from the spawned thread!
|
||||
hi number 1 from the main thread!
|
||||
hi number 2 from the main thread!
|
||||
hi number 3 from the main thread!
|
||||
hi number 4 from the main thread!
|
||||
```
|
||||
|
||||
Small details, such as where `join` is called, can affect whether or not your
|
||||
threads run at the same time.
|
||||
|
||||
### Using `move` Closures with Threads
|
||||
|
||||
The `move` closure is often used alongside `thread::spawn` because it allows
|
||||
you to use data from one thread in another thread.
|
||||
|
||||
In Chapter 13, we mentioned we can use the `move` keyword before the parameter
|
||||
list of a closure to force the closure to take ownership of the values it uses
|
||||
in the environment. This technique is especially useful when creating new
|
||||
threads in order to transfer ownership of values from one thread to another.
|
||||
|
||||
Notice in Listing 16-1 that the closure we pass to `thread::spawn` takes no
|
||||
arguments: we’re not using any data from the main thread in the spawned
|
||||
thread’s code. To use data from the main thread in the spawned thread, the
|
||||
spawned thread’s closure must capture the values it needs. Listing 16-3 shows
|
||||
an attempt to create a vector in the main thread and use it in the spawned
|
||||
thread. However, this won’t yet work, as you’ll see in a moment.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use std::thread;
|
||||
|
||||
fn main() {
|
||||
let v = vec![1, 2, 3];
|
||||
|
||||
let handle = thread::spawn(|| {
|
||||
println!("Here's a vector: {:?}", v);
|
||||
});
|
||||
|
||||
handle.join().unwrap();
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-3: Attempting to use a vector created by the
|
||||
main thread in another thread</span>
|
||||
|
||||
The closure uses `v`, so it will capture `v` and make it part of the closure’s
|
||||
environment. Because `thread::spawn` runs this closure in a new thread, we
|
||||
should be able to access `v` inside that new thread. But when we compile this
|
||||
example, we get the following error:
|
||||
|
||||
```text
|
||||
error[E0373]: closure may outlive the current function, but it borrows `v`,
|
||||
which is owned by the current function
|
||||
--> src/main.rs:6:32
|
||||
|
|
||||
6 | let handle = thread::spawn(|| {
|
||||
| ^^ may outlive borrowed value `v`
|
||||
7 | println!("Here's a vector: {:?}", v);
|
||||
| - `v` is borrowed here
|
||||
|
|
||||
help: to force the closure to take ownership of `v` (and any other referenced
|
||||
variables), use the `move` keyword
|
||||
|
|
||||
6 | let handle = thread::spawn(move || {
|
||||
| ^^^^^^^
|
||||
```
|
||||
|
||||
Rust *infers* how to capture `v`, and because `println!` only needs a reference
|
||||
to `v`, the closure tries to borrow `v`. However, there’s a problem: Rust can’t
|
||||
tell how long the spawned thread will run, so it doesn’t know if the reference
|
||||
to `v` will always be valid.
|
||||
|
||||
Listing 16-4 provides a scenario that’s more likely to have a reference to `v`
|
||||
that won’t be valid:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use std::thread;
|
||||
|
||||
fn main() {
|
||||
let v = vec![1, 2, 3];
|
||||
|
||||
let handle = thread::spawn(|| {
|
||||
println!("Here's a vector: {:?}", v);
|
||||
});
|
||||
|
||||
drop(v); // oh no!
|
||||
|
||||
handle.join().unwrap();
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-4: A thread with a closure that attempts to
|
||||
capture a reference to `v` from a main thread that drops `v`</span>
|
||||
|
||||
If we were allowed to run this code, there’s a possibility the spawned thread
|
||||
would be immediately put in the background without running at all. The spawned
|
||||
thread has a reference to `v` inside, but the main thread immediately drops
|
||||
`v`, using the `drop` function we discussed in Chapter 15. Then, when the
|
||||
spawned thread starts to execute, `v` is no longer valid, so a reference to it
|
||||
is also invalid. Oh no!
|
||||
|
||||
To fix the compiler error in Listing 16-3, we can use the error message’s
|
||||
advice:
|
||||
|
||||
```text
|
||||
help: to force the closure to take ownership of `v` (and any other referenced
|
||||
variables), use the `move` keyword
|
||||
|
|
||||
6 | let handle = thread::spawn(move || {
|
||||
| ^^^^^^^
|
||||
```
|
||||
|
||||
By adding the `move` keyword before the closure, we force the closure to take
|
||||
ownership of the values it’s using rather than allowing Rust to infer that it
|
||||
should borrow the values. The modification to Listing 16-3 shown in Listing
|
||||
16-5 will compile and run as we intend:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::thread;
|
||||
|
||||
fn main() {
|
||||
let v = vec![1, 2, 3];
|
||||
|
||||
let handle = thread::spawn(move || {
|
||||
println!("Here's a vector: {:?}", v);
|
||||
});
|
||||
|
||||
handle.join().unwrap();
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-5: Using the `move` keyword to force a closure
|
||||
to take ownership of the values it uses</span>
|
||||
|
||||
What would happen to the code in Listing 16-4 where the main thread called
|
||||
`drop` if we use a `move` closure? Would `move` fix that case? Unfortunately,
|
||||
no; we would get a different error because what Listing 16-4 is trying to do
|
||||
isn’t allowed for a different reason. If we added `move` to the closure, we
|
||||
would move `v` into the closure’s environment, and we could no longer call
|
||||
`drop` on it in the main thread. We would get this compiler error instead:
|
||||
|
||||
```text
|
||||
error[E0382]: use of moved value: `v`
|
||||
--> src/main.rs:10:10
|
||||
|
|
||||
6 | let handle = thread::spawn(move || {
|
||||
| ------- value moved (into closure) here
|
||||
...
|
||||
10 | drop(v); // oh no!
|
||||
| ^ value used here after move
|
||||
|
|
||||
= note: move occurs because `v` has type `std::vec::Vec<i32>`, which does
|
||||
not implement the `Copy` trait
|
||||
```
|
||||
|
||||
Rust’s ownership rules have saved us again! We got an error from the code in
|
||||
Listing 16-3 because Rust was being conservative and only borrowing `v` for the
|
||||
thread, which meant the main thread could theoretically invalidate the spawned
|
||||
thread’s reference. By telling Rust to move ownership of `v` to the spawned
|
||||
thread, we’re guaranteeing Rust that the main thread won’t use `v` anymore. If
|
||||
we change Listing 16-4 in the same way, we’re then violating the ownership
|
||||
rules when we try to use `v` in the main thread. The `move` keyword overrides
|
||||
Rust’s conservative default of borrowing; it doesn’t let us violate the
|
||||
ownership rules.
|
||||
|
||||
With a basic understanding of threads and the thread API, let’s look at what we
|
||||
can *do* with threads.
|
||||
366
2018-edition/src/ch16-02-message-passing.md
Normal file
366
2018-edition/src/ch16-02-message-passing.md
Normal file
@@ -0,0 +1,366 @@
|
||||
## Using Message Passing to Transfer Data Between Threads
|
||||
|
||||
One increasingly popular approach to ensuring safe concurrency is *message
|
||||
passing*, where threads or actors communicate by sending each other messages
|
||||
containing data. Here’s the idea in a slogan from [the Go language
|
||||
documentation](http://golang.org/doc/effective_go.html): "Do not communicate by
|
||||
sharing memory; instead, share memory by communicating."
|
||||
|
||||
One major tool Rust has for accomplishing message-sending concurrency is the
|
||||
*channel*, a programming concept that Rust’s standard library provides an
|
||||
implementation of. You can imagine a channel in programming as being like a
|
||||
channel of water, such as a stream or a river. If you put something like a
|
||||
rubber duck or boat into a stream, it will travel downstream to the end of the
|
||||
waterway.
|
||||
|
||||
A channel in programming has two halves: a transmitter and a receiver. The
|
||||
transmitter half is the upstream location where you put rubber ducks into the
|
||||
river, and the receiver half is where the rubber duck ends up downstream. One
|
||||
part of your code calls methods on the transmitter with the data you want to
|
||||
send, and another part checks the receiving end for arriving messages. A
|
||||
channel is said to be *closed* if either the transmitter or receiver half is
|
||||
dropped.
|
||||
|
||||
Here, we’ll work up to a program that has one thread to generate values and
|
||||
send them down a channel, and another thread that will receive the values and
|
||||
print them out. We’ll be sending simple values between threads using a channel
|
||||
to illustrate the feature. Once you’re familiar with the technique, you could
|
||||
use channels to implement a chat system or a system where many threads perform
|
||||
parts of a calculation and send the parts to one thread that aggregates the
|
||||
results.
|
||||
|
||||
First, in Listing 16-6, we’ll create a channel but not do anything with it.
|
||||
Note that this won’t compile yet because Rust can’t tell what type of values we
|
||||
want to send over the channel.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::sync::mpsc;
|
||||
|
||||
fn main() {
|
||||
let (tx, rx) = mpsc::channel();
|
||||
# tx.send(()).unwrap();
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-6: Creating a channel and assigning the two
|
||||
halves to `tx` and `rx`</span>
|
||||
|
||||
We create a new channel using the `mpsc::channel` function; `mpsc` stands for
|
||||
*multiple producer, single consumer*. In short, the way Rust’s standard library
|
||||
implements channels means a channel can have multiple *sending* ends that
|
||||
produce values but only one *receiving* end that consumes those values. Imagine
|
||||
multiple streams flowing together into one big river: everything sent down any
|
||||
of the streams will end up in one river at the end. We’ll start with a single
|
||||
producer for now, but we’ll add multiple producers when we get this example
|
||||
working.
|
||||
|
||||
<!-- NEXT PARAGRAPH WRAPPED WEIRD INTENTIONALLY SEE #199 -->
|
||||
|
||||
The `mpsc::channel` function returns a tuple, the first element of which is the
|
||||
sending end and the second element is the receiving end. The abbreviations `tx`
|
||||
and `rx` are traditionally used in many fields for *transmitter* and *receiver*
|
||||
respectively, so we name our variables as such to indicate each end. We’re
|
||||
using a `let` statement with a pattern that destructures the tuples; we’ll
|
||||
discuss the use of patterns in `let` statements and destructuring in
|
||||
Chapter 18. Using a `let` statement this way is a convenient approach to
|
||||
extract the pieces of the tuple returned by `mpsc::channel`.
|
||||
|
||||
Let’s move the transmitting end into a spawned thread and have it send one
|
||||
string so the spawned thread is communicating with the main thread, as shown in
|
||||
Listing 16-7. This is like putting a rubber duck in the river upstream or
|
||||
sending a chat message from one thread to another.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::thread;
|
||||
use std::sync::mpsc;
|
||||
|
||||
fn main() {
|
||||
let (tx, rx) = mpsc::channel();
|
||||
|
||||
thread::spawn(move || {
|
||||
let val = String::from("hi");
|
||||
tx.send(val).unwrap();
|
||||
});
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-7: Moving `tx` to a spawned thread and sending
|
||||
“hi”</span>
|
||||
|
||||
Again, we’re using `thread::spawn` to create a new thread and then using `move`
|
||||
to move `tx` into the closure so the spawned thread owns `tx`. The spawned
|
||||
thread needs to own the transmitting end of the channel to be able to send
|
||||
messages through the channel.
|
||||
|
||||
The transmitting end has a `send` method that takes the value we want to send.
|
||||
The `send` method returns a `Result<T, E>` type, so if the receiving end has
|
||||
already been dropped and there’s nowhere to send a value, the send operation
|
||||
will return an error. In this example, we’re calling `unwrap` to panic in case
|
||||
of an error. But in a real application, we would handle it properly: return to
|
||||
Chapter 9 to review strategies for proper error handling.
|
||||
|
||||
In Listing 16-8, we’ll get the value from the receiving end of the channel in
|
||||
the main thread. This is like retrieving the rubber duck from the water at the
|
||||
end of the river or like getting a chat message.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::thread;
|
||||
use std::sync::mpsc;
|
||||
|
||||
fn main() {
|
||||
let (tx, rx) = mpsc::channel();
|
||||
|
||||
thread::spawn(move || {
|
||||
let val = String::from("hi");
|
||||
tx.send(val).unwrap();
|
||||
});
|
||||
|
||||
let received = rx.recv().unwrap();
|
||||
println!("Got: {}", received);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-8: Receiving the value “hi” in the main thread
|
||||
and printing it</span>
|
||||
|
||||
The receiving end of a channel has two useful methods: `recv` and `try_recv`.
|
||||
We’re using `recv`, short for *receive*, which will block the main thread’s
|
||||
execution and wait until a value is sent down the channel. Once a value is
|
||||
sent, `recv` will return it in a `Result<T, E>`. When the sending end of the
|
||||
channel closes, `recv` will return an error to signal that no more values will
|
||||
be coming.
|
||||
|
||||
The `try_recv` method doesn’t block, but will instead return a `Result<T, E>`
|
||||
immediately: an `Ok` value holding a message if one is available and an `Err`
|
||||
value if there aren’t any messages this time. Using `try_recv` is useful if
|
||||
this thread has other work to do while waiting for messages: we could write a
|
||||
loop that calls `try_recv` every so often, handles a message if one is
|
||||
available, and otherwise does other work for a little while until checking
|
||||
again.
|
||||
|
||||
We’ve used `recv` in this example for simplicity; we don’t have any other work
|
||||
for the main thread to do other than wait for messages, so blocking the main
|
||||
thread is appropriate.
|
||||
|
||||
When we run the code in Listing 16-8, we’ll see the value printed from the main
|
||||
thread:
|
||||
|
||||
```text
|
||||
Got: hi
|
||||
```
|
||||
|
||||
Perfect!
|
||||
|
||||
### Channels and Ownership Transference
|
||||
|
||||
The ownership rules play a vital role in message sending because they help you
|
||||
write safe, concurrent code. Preventing errors in concurrent programming is the
|
||||
advantage of thinking about ownership throughout your Rust programs. Let’s do
|
||||
an experiment to show how channels and ownership work together to prevent
|
||||
problems: we’ll try to use a `val` value in the spawned thread *after* we’ve
|
||||
sent it down the channel. Try compiling the code in Listing 16-9 to see why
|
||||
this code isn't allowed:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use std::thread;
|
||||
use std::sync::mpsc;
|
||||
|
||||
fn main() {
|
||||
let (tx, rx) = mpsc::channel();
|
||||
|
||||
thread::spawn(move || {
|
||||
let val = String::from("hi");
|
||||
tx.send(val).unwrap();
|
||||
println!("val is {}", val);
|
||||
});
|
||||
|
||||
let received = rx.recv().unwrap();
|
||||
println!("Got: {}", received);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-9: Attempting to use `val` after we’ve sent it
|
||||
down the channel</span>
|
||||
|
||||
Here, we try to print `val` after we’ve sent it down the channel via `tx.send`.
|
||||
Allowing this would be a bad idea: once the value has been sent to another
|
||||
thread, that thread could modify or drop it before we try to use the value
|
||||
again. Potentially, the other thread’s modifications could cause errors or
|
||||
unexpected results due to inconsistent or nonexistent data. However, Rust gives
|
||||
us an error if we try to compile the code in Listing 16-9:
|
||||
|
||||
```text
|
||||
error[E0382]: use of moved value: `val`
|
||||
--> src/main.rs:10:31
|
||||
|
|
||||
9 | tx.send(val).unwrap();
|
||||
| --- value moved here
|
||||
10 | println!("val is {}", val);
|
||||
| ^^^ value used here after move
|
||||
|
|
||||
= note: move occurs because `val` has type `std::string::String`, which does
|
||||
not implement the `Copy` trait
|
||||
```
|
||||
|
||||
Our concurrency mistake has caused a compile time error. The `send` function
|
||||
takes ownership of its parameter, and when the value is moved, the receiver
|
||||
takes ownership of it. This stops us from accidentally using the value again
|
||||
after sending it; the ownership system checks that everything is okay.
|
||||
|
||||
### Sending Multiple Values and Seeing the Receiver Waiting
|
||||
|
||||
The code in Listing 16-8 compiled and ran, but it didn’t clearly show us that
|
||||
two separate threads were talking to each other over the channel. In Listing
|
||||
16-10 we’ve made some modifications that will prove the code in Listing 16-8 is
|
||||
running concurrently: the spawned thread will now send multiple messages and
|
||||
pause for a second between each message.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::thread;
|
||||
use std::sync::mpsc;
|
||||
use std::time::Duration;
|
||||
|
||||
fn main() {
|
||||
let (tx, rx) = mpsc::channel();
|
||||
|
||||
thread::spawn(move || {
|
||||
let vals = vec![
|
||||
String::from("hi"),
|
||||
String::from("from"),
|
||||
String::from("the"),
|
||||
String::from("thread"),
|
||||
];
|
||||
|
||||
for val in vals {
|
||||
tx.send(val).unwrap();
|
||||
thread::sleep(Duration::from_secs(1));
|
||||
}
|
||||
});
|
||||
|
||||
for received in rx {
|
||||
println!("Got: {}", received);
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-10: Sending multiple messages and pausing
|
||||
between each</span>
|
||||
|
||||
This time, the spawned thread has a vector of strings that we want to send to
|
||||
the main thread. We iterate over them, sending each individually, and pause
|
||||
between each by calling the `thread::sleep` function with a `Duration` value of
|
||||
1 second.
|
||||
|
||||
In the main thread, we’re not calling the `recv` function explicitly anymore:
|
||||
instead, we’re treating `rx` as an iterator. For each value received, we’re
|
||||
printing it. When the channel is closed, iteration will end.
|
||||
|
||||
When running the code in Listing 16-10, you should see the following output
|
||||
with a 1-second pause in between each line:
|
||||
|
||||
```text
|
||||
Got: hi
|
||||
Got: from
|
||||
Got: the
|
||||
Got: thread
|
||||
```
|
||||
|
||||
Because we don’t have any code that pauses or delays in the `for` loop in the
|
||||
main thread, we can tell that the main thread is waiting to receive values from
|
||||
the spawned thread.
|
||||
|
||||
### Creating Multiple Producers by Cloning the Transmitter
|
||||
|
||||
Earlier we mentioned that `mpsc` was an acronym for *multiple producer,
|
||||
single consumer*. Let’s put `mpsc` to use and expand the code in Listing 16-10
|
||||
to create multiple threads that all send values to the same receiver. We can do
|
||||
so by cloning the transmitting half of the channel, as shown in Listing 16-11:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
# use std::thread;
|
||||
# use std::sync::mpsc;
|
||||
# use std::time::Duration;
|
||||
#
|
||||
# fn main() {
|
||||
// --snip--
|
||||
|
||||
let (tx, rx) = mpsc::channel();
|
||||
|
||||
let tx1 = mpsc::Sender::clone(&tx);
|
||||
thread::spawn(move || {
|
||||
let vals = vec![
|
||||
String::from("hi"),
|
||||
String::from("from"),
|
||||
String::from("the"),
|
||||
String::from("thread"),
|
||||
];
|
||||
|
||||
for val in vals {
|
||||
tx1.send(val).unwrap();
|
||||
thread::sleep(Duration::from_secs(1));
|
||||
}
|
||||
});
|
||||
|
||||
thread::spawn(move || {
|
||||
let vals = vec![
|
||||
String::from("more"),
|
||||
String::from("messages"),
|
||||
String::from("for"),
|
||||
String::from("you"),
|
||||
];
|
||||
|
||||
for val in vals {
|
||||
tx.send(val).unwrap();
|
||||
thread::sleep(Duration::from_secs(1));
|
||||
}
|
||||
});
|
||||
|
||||
for received in rx {
|
||||
println!("Got: {}", received);
|
||||
}
|
||||
|
||||
// --snip--
|
||||
# }
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-11: Sending multiple messages from multiple
|
||||
producers</span>
|
||||
|
||||
This time, before we create the first spawned thread, we call `clone` on the
|
||||
sending end of the channel. This will give us a new sending handle we can pass
|
||||
to the first spawned thread. We pass the original sending end of the channel to
|
||||
a second spawned thread. This gives us two threads, each sending different
|
||||
messages to the receiving end of the channel.
|
||||
|
||||
When you run the code, your output should look something like this:
|
||||
|
||||
```text
|
||||
Got: hi
|
||||
Got: more
|
||||
Got: from
|
||||
Got: messages
|
||||
Got: for
|
||||
Got: the
|
||||
Got: thread
|
||||
Got: you
|
||||
```
|
||||
|
||||
You might see the values in another order; it depends on your system. This is
|
||||
what makes concurrency interesting as well as difficult. If you experiment with
|
||||
`thread::sleep`, giving it various values in the different threads, each run
|
||||
will be more nondeterministic and create different output each time.
|
||||
|
||||
Now that we’ve looked at how channels work, let’s look at a different method of
|
||||
concurrency.
|
||||
426
2018-edition/src/ch16-03-shared-state.md
Normal file
426
2018-edition/src/ch16-03-shared-state.md
Normal file
@@ -0,0 +1,426 @@
|
||||
## Shared-State Concurrency
|
||||
|
||||
Message passing is a fine way of handling concurrency, but it’s not the only
|
||||
one. Consider this part of the slogan from the Go language documentation again:
|
||||
“communicate by sharing memory.”
|
||||
|
||||
What would communicating by sharing memory look like? In addition, why would
|
||||
message-passing enthusiasts not use it and do the opposite instead?
|
||||
|
||||
In a way, channels in any programming language are similar to single ownership,
|
||||
because once you transfer a value down a channel, you should no longer use that
|
||||
value. Shared memory concurrency is like multiple ownership: multiple threads
|
||||
can access the same memory location at the same time. As you saw in Chapter 15,
|
||||
where smart pointers made multiple ownership possible, multiple ownership can
|
||||
add complexity because these different owners need managing. Rust’s type system
|
||||
and ownership rules greatly assist in getting this management correct. For an
|
||||
example, let’s look at mutexes, one of the more common concurrency primitives
|
||||
for shared memory.
|
||||
|
||||
### Using Mutexes to Allow Access to Data from One Thread at a Time
|
||||
|
||||
*Mutex* is an abbreviation for *mutual exclusion*, as in, a mutex allows only
|
||||
one thread to access some data at any given time. To access the data in a
|
||||
mutex, a thread must first signal that it wants access by asking to acquire the
|
||||
mutex’s *lock*. The lock is a data structure that is part of the mutex that
|
||||
keeps track of who currently has exclusive access to the data. Therefore, the
|
||||
mutex is described as *guarding* the data it holds via the locking system.
|
||||
|
||||
Mutexes have a reputation for being difficult to use because you have to
|
||||
remember two rules:
|
||||
|
||||
* You must attempt to acquire the lock before using the data.
|
||||
* When you’re done with the data that the mutex guards, you must unlock the
|
||||
data so other threads can acquire the lock.
|
||||
|
||||
For a real-world metaphor for a mutex, imagine a panel discussion at a
|
||||
conference with only one microphone. Before a panelist can speak, they have to
|
||||
ask or signal that they want to use the microphone. When they get the
|
||||
microphone, they can talk for as long as they want to and then hand the
|
||||
microphone to the next panelist who requests to speak. If a panelist forgets to
|
||||
hand the microphone off when they’re finished with it, no one else is able to
|
||||
speak. If management of the shared microphone goes wrong, the panel won’t work
|
||||
as planned!
|
||||
|
||||
Management of mutexes can be incredibly tricky to get right, which is why so
|
||||
many people are enthusiastic about channels. However, thanks to Rust’s type
|
||||
system and ownership rules, you can’t get locking and unlocking wrong.
|
||||
|
||||
#### The API of `Mutex<T>`
|
||||
|
||||
As an example of how to use a mutex, let’s start by using a mutex in a
|
||||
single-threaded context, as shown in Listing 16-12:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::sync::Mutex;
|
||||
|
||||
fn main() {
|
||||
let m = Mutex::new(5);
|
||||
|
||||
{
|
||||
let mut num = m.lock().unwrap();
|
||||
*num = 6;
|
||||
}
|
||||
|
||||
println!("m = {:?}", m);
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-12: Exploring the API of `Mutex<T>` in a
|
||||
single-threaded context for simplicity</span>
|
||||
|
||||
As with many types, we create a `Mutex<T>` using the associated function `new`.
|
||||
To access the data inside the mutex, we use the `lock` method to acquire the
|
||||
lock. This call will block the current thread so it can’t do any work until
|
||||
it’s our turn to have the lock.
|
||||
|
||||
The call to `lock` would fail if another thread holding the lock panicked. In
|
||||
that case, no one would ever be able to get the lock, so we’ve chosen to
|
||||
`unwrap` and have this thread panic if we’re in that situation.
|
||||
|
||||
After we’ve acquired the lock, we can treat the return value, named `num` in
|
||||
this case, as a mutable reference to the data inside. The type system ensures
|
||||
that we acquire a lock before using the value in `m`: `Mutex<i32>` is not an
|
||||
`i32`, so we *must* acquire the lock to be able to use the `i32` value. We
|
||||
can’t forget; the type system won’t let us access the inner `i32` otherwise.
|
||||
|
||||
As you might suspect, `Mutex<T>` is a smart pointer. More accurately, the call
|
||||
to `lock` *returns* a smart pointer called `MutexGuard`. This smart pointer
|
||||
implements `Deref` to point at our inner data; the smart pointer also has a
|
||||
`Drop` implementation that releases the lock automatically when a `MutexGuard`
|
||||
goes out of scope, which happens at the end of the inner scope in Listing
|
||||
16-12. As a result, we don’t risk forgetting to release the lock and blocking
|
||||
the mutex from being used by other threads because the lock release happens
|
||||
automatically.
|
||||
|
||||
After dropping the lock, we can print the mutex value and see that we were able
|
||||
to change the inner `i32` to 6.
|
||||
|
||||
#### Sharing a `Mutex<T>` Between Multiple Threads
|
||||
|
||||
Now, let’s try to share a value between multiple threads using `Mutex<T>`.
|
||||
We’ll spin up 10 threads and have them each increment a counter value by 1, so
|
||||
the counter goes from 0 to 10. Note that the next few examples will have
|
||||
compiler errors, and we’ll use those errors to learn more about using
|
||||
`Mutex<T>` and how Rust helps us use it correctly. Listing 16-13 has our
|
||||
starting example:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use std::sync::Mutex;
|
||||
use std::thread;
|
||||
|
||||
fn main() {
|
||||
let counter = Mutex::new(0);
|
||||
let mut handles = vec![];
|
||||
|
||||
for _ in 0..10 {
|
||||
let handle = thread::spawn(move || {
|
||||
let mut num = counter.lock().unwrap();
|
||||
|
||||
*num += 1;
|
||||
});
|
||||
handles.push(handle);
|
||||
}
|
||||
|
||||
for handle in handles {
|
||||
handle.join().unwrap();
|
||||
}
|
||||
|
||||
println!("Result: {}", *counter.lock().unwrap());
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-13: Ten threads each increment a counter
|
||||
guarded by a `Mutex<T>`</span>
|
||||
|
||||
We create a `counter` variable to hold an `i32` inside a `Mutex<T>`, as we
|
||||
did in Listing 16-12. Next, we create 10 threads by iterating over a range
|
||||
of numbers. We use `thread::spawn` and give all the threads the same closure,
|
||||
one that moves the counter into the thread, acquires a lock on the `Mutex<T>`
|
||||
by calling the `lock` method, and then adds 1 to the value in the mutex. When a
|
||||
thread finishes running its closure, `num` will go out of scope and release the
|
||||
lock so another thread can acquire it.
|
||||
|
||||
In the main thread, we collect all the join handles. Then, as we did in Listing
|
||||
16-2, we call `join` on each handle to make sure all the threads finish. At
|
||||
that point, the main thread will acquire the lock and print the result of this
|
||||
program.
|
||||
|
||||
We hinted that this example wouldn’t compile. Now let’s find out why!
|
||||
|
||||
```text
|
||||
error[E0382]: capture of moved value: `counter`
|
||||
--> src/main.rs:10:27
|
||||
|
|
||||
9 | let handle = thread::spawn(move || {
|
||||
| ------- value moved (into closure) here
|
||||
10 | let mut num = counter.lock().unwrap();
|
||||
| ^^^^^^^ value captured here after move
|
||||
|
|
||||
= note: move occurs because `counter` has type `std::sync::Mutex<i32>`,
|
||||
which does not implement the `Copy` trait
|
||||
|
||||
error[E0382]: use of moved value: `counter`
|
||||
--> src/main.rs:21:29
|
||||
|
|
||||
9 | let handle = thread::spawn(move || {
|
||||
| ------- value moved (into closure) here
|
||||
...
|
||||
21 | println!("Result: {}", *counter.lock().unwrap());
|
||||
| ^^^^^^^ value used here after move
|
||||
|
|
||||
= note: move occurs because `counter` has type `std::sync::Mutex<i32>`,
|
||||
which does not implement the `Copy` trait
|
||||
|
||||
error: aborting due to 2 previous errors
|
||||
```
|
||||
|
||||
The error message states that the `counter` value is moved into the closure and
|
||||
then captured when we call `lock`. That description sounds like what we wanted,
|
||||
but it’s not allowed!
|
||||
|
||||
Let’s figure this out by simplifying the program. Instead of making 10 threads
|
||||
in a `for` loop, let’s just make two threads without a loop and see what
|
||||
happens. Replace the first `for` loop in Listing 16-13 with this code instead:
|
||||
|
||||
```rust,ignore
|
||||
use std::sync::Mutex;
|
||||
use std::thread;
|
||||
|
||||
fn main() {
|
||||
let counter = Mutex::new(0);
|
||||
let mut handles = vec![];
|
||||
|
||||
let handle = thread::spawn(move || {
|
||||
let mut num = counter.lock().unwrap();
|
||||
|
||||
*num += 1;
|
||||
});
|
||||
handles.push(handle);
|
||||
|
||||
let handle2 = thread::spawn(move || {
|
||||
let mut num2 = counter.lock().unwrap();
|
||||
|
||||
*num2 += 1;
|
||||
});
|
||||
handles.push(handle2);
|
||||
|
||||
for handle in handles {
|
||||
handle.join().unwrap();
|
||||
}
|
||||
|
||||
println!("Result: {}", *counter.lock().unwrap());
|
||||
}
|
||||
```
|
||||
|
||||
We make two threads and change the variable names used with the second thread
|
||||
to `handle2` and `num2`. When we run the code this time, compiling gives us the
|
||||
following:
|
||||
|
||||
```text
|
||||
error[E0382]: capture of moved value: `counter`
|
||||
--> src/main.rs:16:24
|
||||
|
|
||||
8 | let handle = thread::spawn(move || {
|
||||
| ------- value moved (into closure) here
|
||||
...
|
||||
16 | let mut num2 = counter.lock().unwrap();
|
||||
| ^^^^^^^ value captured here after move
|
||||
|
|
||||
= note: move occurs because `counter` has type `std::sync::Mutex<i32>`,
|
||||
which does not implement the `Copy` trait
|
||||
|
||||
error[E0382]: use of moved value: `counter`
|
||||
--> src/main.rs:26:29
|
||||
|
|
||||
8 | let handle = thread::spawn(move || {
|
||||
| ------- value moved (into closure) here
|
||||
...
|
||||
26 | println!("Result: {}", *counter.lock().unwrap());
|
||||
| ^^^^^^^ value used here after move
|
||||
|
|
||||
= note: move occurs because `counter` has type `std::sync::Mutex<i32>`,
|
||||
which does not implement the `Copy` trait
|
||||
|
||||
error: aborting due to 2 previous errors
|
||||
```
|
||||
|
||||
Aha! The first error message indicates that `counter` is moved into the closure
|
||||
for the thread associated with `handle`. That move is preventing us from
|
||||
capturing `counter` when we try to call `lock` on it and store the result in
|
||||
`num2` in the second thread! So Rust is telling us that we can’t move ownership
|
||||
of `counter` into multiple threads. This was hard to see earlier because our
|
||||
threads were in a loop, and Rust can’t point to different threads in different
|
||||
iterations of the loop. Let’s fix the compiler error with a multiple-ownership
|
||||
method we discussed in Chapter 15.
|
||||
|
||||
#### Multiple Ownership with Multiple Threads
|
||||
|
||||
In Chapter 15, we gave a value multiple owners by using the smart pointer
|
||||
`Rc<T>` to create a reference counted value. Let’s do the same here and see
|
||||
what happens. We’ll wrap the `Mutex<T>` in `Rc<T>` in Listing 16-14 and clone
|
||||
the `Rc<T>` before moving ownership to the thread. Now that we’ve seen the
|
||||
errors, we’ll also switch back to using the `for` loop, and we’ll keep the
|
||||
`move` keyword with the closure.
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust,ignore
|
||||
use std::rc::Rc;
|
||||
use std::sync::Mutex;
|
||||
use std::thread;
|
||||
|
||||
fn main() {
|
||||
let counter = Rc::new(Mutex::new(0));
|
||||
let mut handles = vec![];
|
||||
|
||||
for _ in 0..10 {
|
||||
let counter = Rc::clone(&counter);
|
||||
let handle = thread::spawn(move || {
|
||||
let mut num = counter.lock().unwrap();
|
||||
|
||||
*num += 1;
|
||||
});
|
||||
handles.push(handle);
|
||||
}
|
||||
|
||||
for handle in handles {
|
||||
handle.join().unwrap();
|
||||
}
|
||||
|
||||
println!("Result: {}", *counter.lock().unwrap());
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-14: Attempting to use `Rc<T>` to allow
|
||||
multiple threads to own the `Mutex<T>`</span>
|
||||
|
||||
Once again, we compile and get... different errors! The compiler is teaching us
|
||||
a lot.
|
||||
|
||||
```text
|
||||
error[E0277]: the trait bound `std::rc::Rc<std::sync::Mutex<i32>>:
|
||||
std::marker::Send` is not satisfied in `[closure@src/main.rs:11:36:
|
||||
15:10 counter:std::rc::Rc<std::sync::Mutex<i32>>]`
|
||||
--> src/main.rs:11:22
|
||||
|
|
||||
11 | let handle = thread::spawn(move || {
|
||||
| ^^^^^^^^^^^^^ `std::rc::Rc<std::sync::Mutex<i32>>`
|
||||
cannot be sent between threads safely
|
||||
|
|
||||
= help: within `[closure@src/main.rs:11:36: 15:10
|
||||
counter:std::rc::Rc<std::sync::Mutex<i32>>]`, the trait `std::marker::Send` is
|
||||
not implemented for `std::rc::Rc<std::sync::Mutex<i32>>`
|
||||
= note: required because it appears within the type
|
||||
`[closure@src/main.rs:11:36: 15:10 counter:std::rc::Rc<std::sync::Mutex<i32>>]`
|
||||
= note: required by `std::thread::spawn`
|
||||
```
|
||||
|
||||
Wow, that error message is very wordy! Here are some important parts to focus
|
||||
on: the first inline error says `` `std::rc::Rc<std::sync::Mutex<i32>>` cannot
|
||||
be sent between threads safely ``. The reason for this is in the next important
|
||||
part to focus on, the error message. The distilled error message says `` the
|
||||
trait bound `Send` is not satisfied ``. We’ll talk about `Send` in the next
|
||||
section: it’s one of the traits that ensures the types we use with threads are
|
||||
meant for use in concurrent situations.
|
||||
|
||||
Unfortunately, `Rc<T>` is not safe to share across threads. When `Rc<T>`
|
||||
manages the reference count, it adds to the count for each call to `clone` and
|
||||
subtracts from the count when each clone is dropped. But it doesn’t use any
|
||||
concurrency primitives to make sure that changes to the count can’t be
|
||||
interrupted by another thread. This could lead to wrong counts—subtle bugs that
|
||||
could in turn lead to memory leaks or a value being dropped before we’re done
|
||||
with it. What we need is a type exactly like `Rc<T>` but one that makes changes
|
||||
to the reference count in a thread-safe way.
|
||||
|
||||
#### Atomic Reference Counting with `Arc<T>`
|
||||
|
||||
Fortunately, `Arc<T>` *is* a type like `Rc<T>` that is safe to use in
|
||||
concurrent situations. The *a* stands for *atomic*, meaning it’s an *atomically
|
||||
reference counted* type. Atomics are an additional kind of concurrency
|
||||
primitive that we won’t cover in detail here: see the standard library
|
||||
documentation for `std::sync::atomic` for more details. At this point, you just
|
||||
need to know that atomics work like primitive types but are safe to share
|
||||
across threads.
|
||||
|
||||
You might then wonder why all primitive types aren’t atomic and why standard
|
||||
library types aren’t implemented to use `Arc<T>` by default. The reason is that
|
||||
thread safety comes with a performance penalty that you only want to pay when
|
||||
you really need to. If you’re just performing operations on values within a
|
||||
single thread, your code can run faster if it doesn’t have to enforce the
|
||||
guarantees atomics provide.
|
||||
|
||||
Let’s return to our example: `Arc<T>` and `Rc<T>` have the same API, so we fix
|
||||
our program by changing the `use` line, the call to `new`, and the call to
|
||||
`clone`. The code in Listing 16-15 will finally compile and run:
|
||||
|
||||
<span class="filename">Filename: src/main.rs</span>
|
||||
|
||||
```rust
|
||||
use std::sync::{Mutex, Arc};
|
||||
use std::thread;
|
||||
|
||||
fn main() {
|
||||
let counter = Arc::new(Mutex::new(0));
|
||||
let mut handles = vec![];
|
||||
|
||||
for _ in 0..10 {
|
||||
let counter = Arc::clone(&counter);
|
||||
let handle = thread::spawn(move || {
|
||||
let mut num = counter.lock().unwrap();
|
||||
|
||||
*num += 1;
|
||||
});
|
||||
handles.push(handle);
|
||||
}
|
||||
|
||||
for handle in handles {
|
||||
handle.join().unwrap();
|
||||
}
|
||||
|
||||
println!("Result: {}", *counter.lock().unwrap());
|
||||
}
|
||||
```
|
||||
|
||||
<span class="caption">Listing 16-15: Using an `Arc<T>` to wrap the `Mutex<T>`
|
||||
to be able to share ownership across multiple threads</span>
|
||||
|
||||
This code will print the following:
|
||||
|
||||
```text
|
||||
Result: 10
|
||||
```
|
||||
|
||||
We did it! We counted from 0 to 10, which may not seem very impressive, but it
|
||||
did teach us a lot about `Mutex<T>` and thread safety. You could also use this
|
||||
program’s structure to do more complicated operations than just incrementing a
|
||||
counter. Using this strategy, you can divide a calculation into independent
|
||||
parts, split those parts across threads, and then use a `Mutex<T>` to have each
|
||||
thread update the final result with its part.
|
||||
|
||||
### Similarities Between `RefCell<T>`/`Rc<T>` and `Mutex<T>`/`Arc<T>`
|
||||
|
||||
You might have noticed that `counter` is immutable but we could get a mutable
|
||||
reference to the value inside it; this means `Mutex<T>` provides interior
|
||||
mutability, as the `Cell` family does. In the same way we used `RefCell<T>` in
|
||||
Chapter 15 to allow us to mutate contents inside an `Rc<T>`, we use `Mutex<T>`
|
||||
to mutate contents inside an `Arc<T>`.
|
||||
|
||||
Another detail to note is that Rust can’t protect you from all kinds of logic
|
||||
errors when you use `Mutex<T>`. Recall in Chapter 15 that using `Rc<T>` came
|
||||
with the risk of creating reference cycles, where two `Rc<T>` values refer to
|
||||
each other, causing memory leaks. Similarly, `Mutex<T>` comes with the risk of
|
||||
creating *deadlocks*. These occur when an operation needs to lock two resources
|
||||
and two threads have each acquired one of the locks, causing them to wait for
|
||||
each other forever. If you’re interested in deadlocks, try creating a Rust
|
||||
program that has a deadlock; then research deadlock mitigation strategies for
|
||||
mutexes in any language and have a go at implementing them in Rust. The
|
||||
standard library API documentation for `Mutex<T>` and `MutexGuard` offers
|
||||
useful information.
|
||||
|
||||
We’ll round out this chapter by talking about the `Send` and `Sync` traits and
|
||||
how we can use them with custom types.
|
||||
@@ -0,0 +1,87 @@
|
||||
## Extensible Concurrency with the `Sync` and `Send` Traits
|
||||
|
||||
Interestingly, the Rust language has *very* few concurrency features. Almost
|
||||
every concurrency feature we’ve talked about so far in this chapter has been
|
||||
part of the standard library, not the language. Your options for handling
|
||||
concurrency are not limited to the language or the standard library; you can
|
||||
write your own concurrency features or use those written by others.
|
||||
|
||||
However, two concurrency concepts are embedded in the language: the
|
||||
`std::marker` traits `Sync` and `Send`.
|
||||
|
||||
### Allowing Transference of Ownership Between Threads with `Send`
|
||||
|
||||
The `Send` marker trait indicates that ownership of the type implementing
|
||||
`Send` can be transferred between threads. Almost every Rust type is `Send`,
|
||||
but there are some exceptions, including `Rc<T>`: this cannot be `Send` because
|
||||
if you cloned an `Rc<T>` value and tried to transfer ownership of the clone to
|
||||
another thread, both threads might update the reference count at the same time.
|
||||
For this reason, `Rc<T>` is implemented for use in single-threaded situations
|
||||
where you don’t want to pay the thread-safe performance penalty.
|
||||
|
||||
Therefore, Rust’s type system and trait bounds ensure that you can never
|
||||
accidentally send an `Rc<T>` value across threads unsafely. When we tried to do
|
||||
this in Listing 16-14, we got the error `the trait Send is not implemented for
|
||||
Rc<Mutex<i32>>`. When we switched to `Arc<T>`, which is `Send`, the code
|
||||
compiled.
|
||||
|
||||
Any type composed entirely of `Send` types is automatically marked as `Send` as
|
||||
well. Almost all primitive types are `Send`, aside from raw pointers, which
|
||||
we’ll discuss in Chapter 19.
|
||||
|
||||
### Allowing Access from Multiple Threads with `Sync`
|
||||
|
||||
The `Sync` marker trait indicates that it is safe for the type implementing
|
||||
`Sync` to be referenced from multiple threads. In other words, any type `T` is
|
||||
`Sync` if `&T` (a reference to `T`) is `Send`, meaning the reference can be
|
||||
sent safely to another thread. Similar to `Send`, primitive types are `Sync`,
|
||||
and types composed entirely of types that are `Sync` are also `Sync`.
|
||||
|
||||
The smart pointer `Rc<T>` is also not `Sync` for the same reasons that it’s not
|
||||
`Send`. The `RefCell<T>` type (which we talked about in Chapter 15) and the
|
||||
family of related `Cell<T>` types are not `Sync`. The implementation of borrow
|
||||
checking that `RefCell<T>` does at runtime is not thread-safe. The smart
|
||||
pointer `Mutex<T>` is `Sync` and can be used to share access with multiple
|
||||
threads as you saw in the “Sharing a `Mutex<T>` Between Multiple Threads”
|
||||
section.
|
||||
|
||||
### Implementing `Send` and `Sync` Manually Is Unsafe
|
||||
|
||||
Because types that are made up of `Send` and `Sync` traits are automatically
|
||||
also `Send` and `Sync`, we don’t have to implement those traits manually. As
|
||||
marker traits, they don’t even have any methods to implement. They’re just
|
||||
useful for enforcing invariants related to concurrency.
|
||||
|
||||
Manually implementing these traits involves implementing unsafe Rust code.
|
||||
We’ll talk about using unsafe Rust code in Chapter 19; for now, the important
|
||||
information is that building new concurrent types not made up of `Send` and
|
||||
`Sync` parts requires careful thought to uphold the safety guarantees.
|
||||
[The Rustonomicon] has more information about these guarantees and how to
|
||||
uphold them.
|
||||
|
||||
[The Rustonomicon]: https://doc.rust-lang.org/stable/nomicon/
|
||||
|
||||
## Summary
|
||||
|
||||
This isn’t the last you’ll see of concurrency in this book: the project in
|
||||
Chapter 20 will use the concepts in this chapter in a more realistic situation
|
||||
than the smaller examples discussed here.
|
||||
|
||||
As mentioned earlier, because very little of how Rust handles concurrency is
|
||||
part of the language, many concurrency solutions are implemented as crates.
|
||||
These evolve more quickly than the standard library, so be sure to search
|
||||
online for the current, state-of-the-art crates to use in multithreaded
|
||||
situations.
|
||||
|
||||
The Rust standard library provides channels for message passing and smart
|
||||
pointer types, such as `Mutex<T>` and `Arc<T>`, that are safe to use in
|
||||
concurrent contexts. The type system and the borrow checker ensure that the
|
||||
code using these solutions won’t end up with data races or invalid references.
|
||||
Once you get your code to compile, you can rest assured that it will happily
|
||||
run on multiple threads without the kinds of hard-to-track-down bugs common in
|
||||
other languages. Concurrent programming is no longer a concept to be afraid of:
|
||||
go forth and make your programs concurrent, fearlessly!
|
||||
|
||||
Next, we’ll talk about idiomatic ways to model problems and structure solutions
|
||||
as your Rust programs get bigger. In addition, we’ll discuss how Rust’s idioms
|
||||
relate to those you might be familiar with from object-oriented programming.
|
||||
Some files were not shown because too many files have changed in this diff Show More
Reference in New Issue
Block a user