From 656886474bf7c6c212b29c6ebc35c002f15698de Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 1 Oct 2015 16:21:59 -0400 Subject: [PATCH 001/630] initial empty commit From 1b1dcf9c21e9915c0226bca2fb51818fb5395562 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 1 Oct 2015 16:21:59 -0400 Subject: [PATCH 002/630] MXNet.jl generated files. license: MIT authors: Chiyuan Zhang years: 2015 user: pluskid Julia Version 0.4.0-rc2 [fa52609*] --- .gitignore | 3 +++ .travis.yml | 14 ++++++++++++++ LICENSE.md | 22 ++++++++++++++++++++++ README.md | 3 +++ REQUIRE | 1 + appveyor.yml | 34 ++++++++++++++++++++++++++++++++++ src/MXNet.jl | 5 +++++ test/runtests.jl | 5 +++++ 8 files changed, 87 insertions(+) create mode 100644 .gitignore create mode 100644 .travis.yml create mode 100644 LICENSE.md create mode 100644 README.md create mode 100644 REQUIRE create mode 100644 appveyor.yml create mode 100644 src/MXNet.jl create mode 100644 test/runtests.jl diff --git a/.gitignore b/.gitignore new file mode 100644 index 000000000000..8c960ec808d9 --- /dev/null +++ b/.gitignore @@ -0,0 +1,3 @@ +*.jl.cov +*.jl.*.cov +*.jl.mem diff --git a/.travis.yml b/.travis.yml new file mode 100644 index 000000000000..00656a7e0f7d --- /dev/null +++ b/.travis.yml @@ -0,0 +1,14 @@ +# Documentation: http://docs.travis-ci.com/user/languages/julia/ +language: julia +os: + - linux + - osx +julia: + - release + - nightly +notifications: + email: false +# uncomment the following lines to override the default test script +#script: +# - if [[ -a .git/shallow ]]; then git fetch --unshallow; fi +# - julia -e 'Pkg.clone(pwd()); Pkg.build("MXNet"); Pkg.test("MXNet"; coverage=true)' diff --git a/LICENSE.md b/LICENSE.md new file mode 100644 index 000000000000..c578b73f5fdf --- /dev/null +++ b/LICENSE.md @@ -0,0 +1,22 @@ +The MXNet.jl package is licensed under the MIT "Expat" License: + +> Copyright (c) 2015: Chiyuan Zhang. 
+> +> Permission is hereby granted, free of charge, to any person obtaining +> a copy of this software and associated documentation files (the +> "Software"), to deal in the Software without restriction, including +> without limitation the rights to use, copy, modify, merge, publish, +> distribute, sublicense, and/or sell copies of the Software, and to +> permit persons to whom the Software is furnished to do so, subject to +> the following conditions: +> +> The above copyright notice and this permission notice shall be +> included in all copies or substantial portions of the Software. +> +> THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, +> EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF +> MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. +> IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY +> CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, +> TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE +> SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
diff --git a/README.md b/README.md new file mode 100644 index 000000000000..731c12553095 --- /dev/null +++ b/README.md @@ -0,0 +1,3 @@ +# MXNet + +[![Build Status](https://travis-ci.org/pluskid/MXNet.jl.svg?branch=master)](https://travis-ci.org/pluskid/MXNet.jl) diff --git a/REQUIRE b/REQUIRE new file mode 100644 index 000000000000..2c4ef82cb1ab --- /dev/null +++ b/REQUIRE @@ -0,0 +1 @@ +julia 0.3 diff --git a/appveyor.yml b/appveyor.yml new file mode 100644 index 000000000000..8b7699447712 --- /dev/null +++ b/appveyor.yml @@ -0,0 +1,34 @@ +environment: + matrix: + - JULIAVERSION: "julialang/bin/winnt/x86/0.3/julia-0.3-latest-win32.exe" + - JULIAVERSION: "julialang/bin/winnt/x64/0.3/julia-0.3-latest-win64.exe" + - JULIAVERSION: "julianightlies/bin/winnt/x86/julia-latest-win32.exe" + - JULIAVERSION: "julianightlies/bin/winnt/x64/julia-latest-win64.exe" + +branches: + only: + - master + - /release-.*/ + +notifications: + - provider: Email + on_build_success: false + on_build_failure: false + on_build_status_changed: false + +install: +# Download most recent Julia Windows binary + - ps: (new-object net.webclient).DownloadFile( + $("http://s3.amazonaws.com/"+$env:JULIAVERSION), + "C:\projects\julia-binary.exe") +# Run installer silently, output to C:\projects\julia + - C:\projects\julia-binary.exe /S /D=C:\projects\julia + +build_script: +# Need to convert from shallow to complete for Pkg.clone to work + - IF EXIST .git\shallow (git fetch --unshallow) + - C:\projects\julia\bin\julia -e "versioninfo(); + Pkg.clone(pwd(), \"MXNet\"); Pkg.build(\"MXNet\")" + +test_script: + - C:\projects\julia\bin\julia --check-bounds=yes -e "Pkg.test(\"MXNet\")" diff --git a/src/MXNet.jl b/src/MXNet.jl new file mode 100644 index 000000000000..c45f25e4610a --- /dev/null +++ b/src/MXNet.jl @@ -0,0 +1,5 @@ +module MXNet + +# package code goes here + +end # module diff --git a/test/runtests.jl b/test/runtests.jl new file mode 100644 index 000000000000..d6005fcf699d --- /dev/null +++ 
b/test/runtests.jl @@ -0,0 +1,5 @@ +using MXNet +using Base.Test + +# write your own tests here +@test 1 == 1 From 3e0abcef744ec0082e372baa4f81f83fad441e8c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 1 Oct 2015 16:23:07 -0400 Subject: [PATCH 003/630] MXNet.jl regenerated files. license: ASL authors: Chiyuan Zhang years: 2015 user: pluskid Julia Version 0.4.0-rc2 [fa52609*] --- LICENSE.md | 199 +++++++++++++++++++++++++++++++++++++++++++++++------ 1 file changed, 178 insertions(+), 21 deletions(-) diff --git a/LICENSE.md b/LICENSE.md index c578b73f5fdf..a34c4a0f662e 100644 --- a/LICENSE.md +++ b/LICENSE.md @@ -1,22 +1,179 @@ -The MXNet.jl package is licensed under the MIT "Expat" License: +The MXNet.jl package is licensed under version 2.0 of the Apache License: -> Copyright (c) 2015: Chiyuan Zhang. -> -> Permission is hereby granted, free of charge, to any person obtaining -> a copy of this software and associated documentation files (the -> "Software"), to deal in the Software without restriction, including -> without limitation the rights to use, copy, modify, merge, publish, -> distribute, sublicense, and/or sell copies of the Software, and to -> permit persons to whom the Software is furnished to do so, subject to -> the following conditions: -> -> The above copyright notice and this permission notice shall be -> included in all copies or substantial portions of the Software. -> -> THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, -> EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF -> MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. -> IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY -> CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, -> TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE -> SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
+> Copyright (c) 2015: +> * Chiyuan Zhang +> +> Apache License +> Version 2.0, January 2004 +> http://www.apache.org/licenses/ +> +> TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION +> +> 1. Definitions. +> +> "License" shall mean the terms and conditions for use, reproduction, +> and distribution as defined by Sections 1 through 9 of this document. +> +> "Licensor" shall mean the copyright owner or entity authorized by +> the copyright owner that is granting the License. +> +> "Legal Entity" shall mean the union of the acting entity and all +> other entities that control, are controlled by, or are under common +> control with that entity. For the purposes of this definition, +> "control" means (i) the power, direct or indirect, to cause the +> direction or management of such entity, whether by contract or +> otherwise, or (ii) ownership of fifty percent (50%) or more of the +> outstanding shares, or (iii) beneficial ownership of such entity. +> +> "You" (or "Your") shall mean an individual or Legal Entity +> exercising permissions granted by this License. +> +> "Source" form shall mean the preferred form for making modifications, +> including but not limited to software source code, documentation +> source, and configuration files. +> +> "Object" form shall mean any form resulting from mechanical +> transformation or translation of a Source form, including but +> not limited to compiled object code, generated documentation, +> and conversions to other media types. +> +> "Work" shall mean the work of authorship, whether in Source or +> Object form, made available under the License, as indicated by a +> copyright notice that is included in or attached to the work +> (an example is provided in the Appendix below). 
+> +> "Derivative Works" shall mean any work, whether in Source or Object +> form, that is based on (or derived from) the Work and for which the +> editorial revisions, annotations, elaborations, or other modifications +> represent, as a whole, an original work of authorship. For the purposes +> of this License, Derivative Works shall not include works that remain +> separable from, or merely link (or bind by name) to the interfaces of, +> the Work and Derivative Works thereof. +> +> "Contribution" shall mean any work of authorship, including +> the original version of the Work and any modifications or additions +> to that Work or Derivative Works thereof, that is intentionally +> submitted to Licensor for inclusion in the Work by the copyright owner +> or by an individual or Legal Entity authorized to submit on behalf of +> the copyright owner. For the purposes of this definition, "submitted" +> means any form of electronic, verbal, or written communication sent +> to the Licensor or its representatives, including but not limited to +> communication on electronic mailing lists, source code control systems, +> and issue tracking systems that are managed by, or on behalf of, the +> Licensor for the purpose of discussing and improving the Work, but +> excluding communication that is conspicuously marked or otherwise +> designated in writing by the copyright owner as "Not a Contribution." +> +> "Contributor" shall mean Licensor and any individual or Legal Entity +> on behalf of whom a Contribution has been received by Licensor and +> subsequently incorporated within the Work. +> +> 2. Grant of Copyright License. 
Subject to the terms and conditions of +> this License, each Contributor hereby grants to You a perpetual, +> worldwide, non-exclusive, no-charge, royalty-free, irrevocable +> copyright license to reproduce, prepare Derivative Works of, +> publicly display, publicly perform, sublicense, and distribute the +> Work and such Derivative Works in Source or Object form. +> +> 3. Grant of Patent License. Subject to the terms and conditions of +> this License, each Contributor hereby grants to You a perpetual, +> worldwide, non-exclusive, no-charge, royalty-free, irrevocable +> (except as stated in this section) patent license to make, have made, +> use, offer to sell, sell, import, and otherwise transfer the Work, +> where such license applies only to those patent claims licensable +> by such Contributor that are necessarily infringed by their +> Contribution(s) alone or by combination of their Contribution(s) +> with the Work to which such Contribution(s) was submitted. If You +> institute patent litigation against any entity (including a +> cross-claim or counterclaim in a lawsuit) alleging that the Work +> or a Contribution incorporated within the Work constitutes direct +> or contributory patent infringement, then any patent licenses +> granted to You under this License for that Work shall terminate +> as of the date such litigation is filed. +> +> 4. Redistribution. 
You may reproduce and distribute copies of the +> Work or Derivative Works thereof in any medium, with or without +> modifications, and in Source or Object form, provided that You +> meet the following conditions: +> +> (a) You must give any other recipients of the Work or +> Derivative Works a copy of this License; and +> +> (b) You must cause any modified files to carry prominent notices +> stating that You changed the files; and +> +> (c) You must retain, in the Source form of any Derivative Works +> that You distribute, all copyright, patent, trademark, and +> attribution notices from the Source form of the Work, +> excluding those notices that do not pertain to any part of +> the Derivative Works; and +> +> (d) If the Work includes a "NOTICE" text file as part of its +> distribution, then any Derivative Works that You distribute must +> include a readable copy of the attribution notices contained +> within such NOTICE file, excluding those notices that do not +> pertain to any part of the Derivative Works, in at least one +> of the following places: within a NOTICE text file distributed +> as part of the Derivative Works; within the Source form or +> documentation, if provided along with the Derivative Works; or, +> within a display generated by the Derivative Works, if and +> wherever such third-party notices normally appear. The contents +> of the NOTICE file are for informational purposes only and +> do not modify the License. You may add Your own attribution +> notices within Derivative Works that You distribute, alongside +> or as an addendum to the NOTICE text from the Work, provided +> that such additional attribution notices cannot be construed +> as modifying the License. 
+> +> You may add Your own copyright statement to Your modifications and +> may provide additional or different license terms and conditions +> for use, reproduction, or distribution of Your modifications, or +> for any such Derivative Works as a whole, provided Your use, +> reproduction, and distribution of the Work otherwise complies with +> the conditions stated in this License. +> +> 5. Submission of Contributions. Unless You explicitly state otherwise, +> any Contribution intentionally submitted for inclusion in the Work +> by You to the Licensor shall be under the terms and conditions of +> this License, without any additional terms or conditions. +> Notwithstanding the above, nothing herein shall supersede or modify +> the terms of any separate license agreement you may have executed +> with Licensor regarding such Contributions. +> +> 6. Trademarks. This License does not grant permission to use the trade +> names, trademarks, service marks, or product names of the Licensor, +> except as required for reasonable and customary use in describing the +> origin of the Work and reproducing the content of the NOTICE file. +> +> 7. Disclaimer of Warranty. Unless required by applicable law or +> agreed to in writing, Licensor provides the Work (and each +> Contributor provides its Contributions) on an "AS IS" BASIS, +> WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +> implied, including, without limitation, any warranties or conditions +> of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A +> PARTICULAR PURPOSE. You are solely responsible for determining the +> appropriateness of using or redistributing the Work and assume any +> risks associated with Your exercise of permissions under this License. +> +> 8. Limitation of Liability. 
In no event and under no legal theory, +> whether in tort (including negligence), contract, or otherwise, +> unless required by applicable law (such as deliberate and grossly +> negligent acts) or agreed to in writing, shall any Contributor be +> liable to You for damages, including any direct, indirect, special, +> incidental, or consequential damages of any character arising as a +> result of this License or out of the use or inability to use the +> Work (including but not limited to damages for loss of goodwill, +> work stoppage, computer failure or malfunction, or any and all +> other commercial damages or losses), even if such Contributor +> has been advised of the possibility of such damages. +> +> 9. Accepting Warranty or Additional Liability. While redistributing +> the Work or Derivative Works thereof, You may choose to offer, +> and charge a fee for, acceptance of support, warranty, indemnity, +> or other liability obligations and/or rights consistent with this +> License. However, in accepting such obligations, You may act only +> on Your own behalf and on Your sole responsibility, not on behalf +> of any other Contributor, and only if You agree to indemnify, +> defend, and hold each Contributor harmless for any liability +> incurred by, or claims asserted against, such Contributor by reason +> of your accepting any such warranty or additional liability. 
From e25bf7e1c1121b50b7e3a298857825b797f6f60f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 2 Oct 2015 00:01:50 -0400 Subject: [PATCH 004/630] basic API testing, create NDArray --- src/MXNet.jl | 4 +++- src/context.jl | 14 +++++++++++ src/init.jl | 65 ++++++++++++++++++++++++++++++++++++++++++++++++++ src/ndarray.jl | 40 +++++++++++++++++++++++++++++++ 4 files changed, 122 insertions(+), 1 deletion(-) create mode 100644 src/context.jl create mode 100644 src/init.jl create mode 100644 src/ndarray.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index c45f25e4610a..b1fcedb35e16 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -1,5 +1,7 @@ module MXNet -# package code goes here +include("init.jl") +include("context.jl") +include("ndarray.jl") end # module diff --git a/src/context.jl b/src/context.jl new file mode 100644 index 000000000000..af8cfd725a49 --- /dev/null +++ b/src/context.jl @@ -0,0 +1,14 @@ +@enum CONTEXT_TYPE CPU=1 GPU=2 + +type Context + device_type :: CONTEXT_TYPE + device_id :: Cint + + old_ctx :: Nullable{Context} +end +Context(dev_type :: CONTEXT_TYPE, dev_id = 0) = + Context(dev_type, dev_id, Nullable{Context}()) + + +# global default context +DEFAULT_CONTEXT = Context(CPU) diff --git a/src/init.jl b/src/init.jl new file mode 100644 index 000000000000..41fbbbcd3210 --- /dev/null +++ b/src/init.jl @@ -0,0 +1,65 @@ +export MXError + +"Exception thrown when an error occurred calling MXNet API." 
+immutable MXError <: Exception + msg :: AbstractString +end + +################################################################################ +# Common types used in MXNet API +################################################################################ +typealias MX_uint Cuint +typealias MX_float Cfloat + +macro mx_define_handle_t(name) + name = esc(name) + quote + type $name + value :: Ptr{Void} + end + $name() = $name(C_NULL) + function Base.cconvert(::Type{Ptr{Void}}, obj::$name) + obj.value + end + function Base.isnull(obj::$name) obj.value == C_NULL end + function Base.reset(obj::$name) obj.value = C_NULL end + end +end + +@mx_define_handle_t(MX_NDArrayHandle) +@mx_define_handle_t(MX_FunctionHandle) + +################################################################################ +# Initialization and library API entrance +################################################################################ +const MXNET_LIB = Libdl.find_library(["libmxnet.so"], ["/Users/chiyuan/work/mxnet/mxnet/lib"]) + +function __init__() + atexit() do + # notify libmxnet we are shutting down + ccall( ("MXNotifyShutdown", MXNET_LIB), Cint, () ) + end +end + +function mx_get_last_error() + msg = ccall( ("MXGetLastError", MXNET_LIB), Ptr{UInt8}, () ) + if msg == C_NULL + throw(MXError("Failed to get last error message")) + end + return bytestring(msg) +end + +"Utility macro to call MXNet API functions" +macro mxcall(fv, argtypes, args...) + f = eval(fv) + args = map(esc, args) + quote + _mxret = ccall( ($(Meta.quot(f)), $MXNET_LIB), + Cint, $argtypes, $(args...) 
) + if _mxret != 0 + err_msg = mx_get_last_error() + throw(MXError(err_msg)) + end + end +end + diff --git a/src/ndarray.jl b/src/ndarray.jl new file mode 100644 index 000000000000..ea26504559a7 --- /dev/null +++ b/src/ndarray.jl @@ -0,0 +1,40 @@ +export NDArray +export delete + +function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) + h_ref = Ref{Ptr{Void}}(0) + shape = MX_uint[shape...] + @mxcall(:MXNDArrayCreate, (Ptr{MX_uint}, MX_uint, Cint, Cint, Cint, Ref{Ptr{Void}}), + shape, length(shape), ctx.device_type, ctx.device_id, delay_alloc, h_ref) + handle = MX_NDArrayHandle(h_ref[]) + return handle +end + +type NDArray + handle :: MX_NDArrayHandle + writable :: Bool + + function NDArray(handle, writable=true) + obj = new(handle, writable) + + # TODO: there is currently no good way of automatically managing external resources + # using finalizers is said to slow down the GC significantly + finalizer(obj, delete) + obj + end +end + +function delete(obj :: NDArray) + if !isnull(obj.handle) + @mxcall(:MXNDArrayFree, (Ptr{Void},), obj.handle) + reset(obj.handle) + end +end + +function empty{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) + NDArray(_ndarray_alloc(shape, ctx, false)) +end +function empty(shape :: Int...) + empty(shape) +end + From 11029be0876b73f563b556787e5184b2668c35a1 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 2 Oct 2015 00:11:50 -0400 Subject: [PATCH 005/630] a placeholder README --- README.md | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 731c12553095..e9ce3583fcae 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,5 @@ # MXNet -[![Build Status](https://travis-ci.org/pluskid/MXNet.jl.svg?branch=master)](https://travis-ci.org/pluskid/MXNet.jl) +[![Build Status](https://travis-ci.org/dmlc/MXNet.jl.svg?branch=master)](https://travis-ci.org/dmlc/MXNet.jl) + +Julia wrapper of [MXNet](https://github.com/dmlc/mxnet). 
From d7f011c7f499d3076bc3fe43abd7d824bc216247 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 10:20:37 -0400 Subject: [PATCH 006/630] move gc to handle finalizer --- src/MXNet.jl | 9 +++++++- src/init.jl | 59 +++++++++++++++++++++++++++++++++++--------------- src/ndarray.jl | 14 ++++++------ 3 files changed, 56 insertions(+), 26 deletions(-) diff --git a/src/MXNet.jl b/src/MXNet.jl index b1fcedb35e16..efdf1c76c0c9 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -1,7 +1,14 @@ module MXNet +# we put everything in the namespace mx, because there are a lot of +# functions with the same names as built-in utilities like "zeros", etc. +export mx +module mx + include("init.jl") include("context.jl") include("ndarray.jl") -end # module +end # mx + +end # module MXNet diff --git a/src/init.jl b/src/init.jl index 41fbbbcd3210..f062b52f07f5 100644 --- a/src/init.jl +++ b/src/init.jl @@ -11,24 +11,6 @@ end typealias MX_uint Cuint typealias MX_float Cfloat -macro mx_define_handle_t(name) - name = esc(name) - quote - type $name - value :: Ptr{Void} - end - $name() = $name(C_NULL) - function Base.cconvert(::Type{Ptr{Void}}, obj::$name) - obj.value - end - function Base.isnull(obj::$name) obj.value == C_NULL end - function Base.reset(obj::$name) obj.value = C_NULL end - end -end - -@mx_define_handle_t(MX_NDArrayHandle) -@mx_define_handle_t(MX_FunctionHandle) - ################################################################################ # Initialization and library API entrance ################################################################################ @@ -63,3 +45,44 @@ macro mxcall(fv, argtypes, args...) 
end end +################################################################################ +# Handle types +################################################################################ +macro mx_define_handle_t(name, destructor) + name = esc(name) + quote + type $name + value :: Ptr{Void} + + function $name(value = C_NULL) + hdr = new(value) + + $(if destructor != :nop + :(finalizer(hdr, delete!)) + end) + + return hdr + end + end + + $(if destructor != :nop + quote + function delete!(h :: $name) + if h.value != C_NULL + @mxcall($(Meta.quot(destructor)), (Ptr{Void},), h.value) + h.value = C_NULL + end + end + end + end) + + function Base.cconvert(::Type{Ptr{Void}}, obj::$name) + obj.value + end + function Base.isnull(obj::$name) obj.value == C_NULL end + end +end + +@mx_define_handle_t(MX_NDArrayHandle, MXNDArrayFree) +@mx_define_handle_t(MX_FunctionHandle, nop) + diff --git a/src/ndarray.jl b/src/ndarray.jl index ea26504559a7..9cb458a991c9 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -19,17 +19,17 @@ type NDArray # TODO: there is currently no good way of automatically managing external resources # using finalizers is said to slow down the GC significantly - finalizer(obj, delete) + #finalizer(obj, delete) obj end end -function delete(obj :: NDArray) - if !isnull(obj.handle) - @mxcall(:MXNDArrayFree, (Ptr{Void},), obj.handle) - reset(obj.handle) - end -end +#function delete(obj :: NDArray) +# if !isnull(obj.handle) +# @mxcall(:MXNDArrayFree, (Ptr{Void},), obj.handle) +# reset(obj.handle) +# end +#end function empty{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) NDArray(_ndarray_alloc(shape, ctx, false)) From 28531c8679ccd56ba1bed13e159e1260357fd913 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 12:30:55 -0400 Subject: [PATCH 007/630] define binary dn array functions --- src/init.jl | 13 ++++-- src/ndarray.jl | 122 +++++++++++++++++++++++++++++++++++++++++++------ 2 files changed, 116 insertions(+), 19 deletions(-) diff 
--git a/src/init.jl b/src/init.jl index f062b52f07f5..96aa6d7f0d69 100644 --- a/src/init.jl +++ b/src/init.jl @@ -10,6 +10,10 @@ end ################################################################################ typealias MX_uint Cuint typealias MX_float Cfloat +typealias MX_handle Ptr{Void} + +typealias char_p Ptr{UInt8} +typealias char_pp Ptr{char_p} ################################################################################ # Initialization and library API entrance @@ -17,6 +21,7 @@ typealias MX_float Cfloat const MXNET_LIB = Libdl.find_library(["libmxnet.so"], ["/Users/chiyuan/work/mxnet/mxnet/lib"]) function __init__() + _import_ndarray_functions() atexit() do # notify libmxnet we are shutting down ccall( ("MXNotifyShutdown", MXNET_LIB), Cint, () ) @@ -24,7 +29,7 @@ function __init__() end function mx_get_last_error() - msg = ccall( ("MXGetLastError", MXNET_LIB), Ptr{UInt8}, () ) + msg = ccall( ("MXGetLastError", MXNET_LIB), char_p, () ) if msg == C_NULL throw(MXError("Failed to get last error message")) end @@ -52,7 +57,7 @@ macro mx_define_handle_t(name, destructor) name = esc(name) quote type $name - value :: Ptr{Void} + value :: MX_handle function $name(value = C_NULL) hdr = new(value) @@ -69,14 +74,14 @@ macro mx_define_handle_t(name, destructor) quote function delete!(h :: $name) if h.value != C_NULL - @mxcall($(Meta.quot(destructor)), (Ptr{Void},), h.value) + @mxcall($(Meta.quot(destructor)), (MX_handle,), h.value) h.value = C_NULL end end end end) - function Base.cconvert(::Type{Ptr{Void}}, obj::$name) + function Base.convert(::Type{MX_handle}, obj::$name) obj.value end function Base.isnull(obj::$name) obj.value == C_NULL end diff --git a/src/ndarray.jl b/src/ndarray.jl index 9cb458a991c9..0c20a56e6e87 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,36 +1,34 @@ export NDArray export delete +# create a NDArray handle of specific shape function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) - h_ref = 
Ref{Ptr{Void}}(0) + h_ref = Ref{MX_handle}(0) shape = MX_uint[shape...] - @mxcall(:MXNDArrayCreate, (Ptr{MX_uint}, MX_uint, Cint, Cint, Cint, Ref{Ptr{Void}}), + @mxcall(:MXNDArrayCreate, (Ptr{MX_uint}, MX_uint, Cint, Cint, Cint, Ref{MX_handle}), shape, length(shape), ctx.device_type, ctx.device_id, delay_alloc, h_ref) handle = MX_NDArrayHandle(h_ref[]) return handle end +# create a handle to an empty NDArray, this handle can be used to hold +# results returned by libmx API calls +function _ndarray_alloc() + h_ref = Ref{MX_handle}(0) + @mxcall(:MXNDArrayCreateNone, (Ref{MX_handle},), h_ref) + return MX_NDArrayHandle(h_ref[]) +end + + type NDArray handle :: MX_NDArrayHandle writable :: Bool function NDArray(handle, writable=true) - obj = new(handle, writable) - - # TODO: there is currently no good way of automatically managing external resources - # using finalizers is said to slow down the GC significantly - #finalizer(obj, delete) - obj + new(handle, writable) end end -#function delete(obj :: NDArray) -# if !isnull(obj.handle) -# @mxcall(:MXNDArrayFree, (Ptr{Void},), obj.handle) -# reset(obj.handle) -# end -#end - function empty{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) NDArray(_ndarray_alloc(shape, ctx, false)) end @@ -38,3 +36,97 @@ function empty(shape :: Int...) 
empty(shape) end +module _lib +# this module is used to hold functions automatically imported +# from libmxnet +end +function _register_function(lib::Module, name::Symbol, func::Function) + eval(lib, quote + $name = $func + end) +end + +@enum(LIBMX_FUNC_TYPE_MASK, + NDARRAY_ARG_BEFORE_SCALAR = 1, + ACCEPT_EMPTY_MUTATE_TARGET = (1 << 2) +) + +function _import_ndarray_functions() + n_ref = Ref{MX_uint}(0) + h_ref = Ref{Ptr{MX_handle}}(0) + @mxcall(:MXListFunctions, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) + + n_funcs = n_ref[] + h_funcs = pointer_to_array(h_ref[], n_funcs) + + for i = 1:n_funcs + func_handle = h_funcs[i] + + #---------------------------------------- + # get function information (human readable) + ref_name = Ref{char_p}(0) + ref_desc = Ref{char_p}(0) + ref_narg = Ref{MX_uint}(0) + + ref_arg_names = Ref{char_pp}(0) + ref_arg_types = Ref{char_pp}(0) + ref_arg_descs = Ref{char_pp}(0) + + @mxcall(:MXFuncGetInfo, + (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), + func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) + func_name = symbol(bytestring(ref_name[])) + + #---------------------------------------- + # get function specification + ref_n_use_vars = Ref{MX_uint}(0) + ref_n_scalars = Ref{MX_uint}(0) + ref_n_mut_vars = Ref{MX_uint}(0) + ref_type_mask = Ref{Cint}(0) + @mxcall(:MXFuncDescribe, + (MX_handle, Ref{MX_uint}, Ref{MX_uint}, Ref{MX_uint}, Ref{Cint}), + func_handle, ref_n_use_vars, ref_n_scalars, ref_n_mut_vars, ref_type_mask) + + #---------------------------------------- + # prepare function definition + n_used_vars = ref_n_use_vars[] + n_scalars = ref_n_scalars[] + n_mutate_vars = ref_n_mut_vars[] + type_mask = ref_type_mask[] + accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 + if (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 + use_vars_range = 1:n_used_vars + scalar_range = 
n_used_vars+1:n_used_vars+n_scalars + else + scalar_range = 1:n_scalars + use_vars_range = n_scalars+1:n_scalars+n_used_vars + end + + if n_mutate_vars == 1 && n_used_vars == 2 && n_scalars == 0 + println("defining $func_name") + # binary ndarray function + function binary_ndarray_function(lhs::NDArray, rhs::NDArray, out::NDArray) + @assert(out.writable) + use_vars = MX_handle[lhs.handle, rhs.handle] + scalars = MX_float[] + mut_vars = MX_handle[out.handle] + @mxcall(:MXFuncInvoke, + (MX_handle, Ptr{MX_handle}, Ptr{MX_float}, Ptr{MX_handle}), + func_handle, use_vars, scalars, mut_vars) + return out + end + if accept_empty_mutate + function binary_ndarray_function(lhs::NDArray, rhs::NDArray) + out = NDArray(_ndarray_alloc()) + binary_ndarray_function(lhs, rhs, out) + end + end + + # add methods to the module + eval(_lib, quote + $func_name = $binary_ndarray_function + end) + end + end +end + From e426493be0b5abfabb033e8be1bed3fd91e5d9ff Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 12:56:07 -0400 Subject: [PATCH 008/630] copy ndarray to cpu for debugging --- src/init.jl | 5 ++++- src/ndarray.jl | 27 +++++++++++++++++++++++++-- 2 files changed, 29 insertions(+), 3 deletions(-) diff --git a/src/init.jl b/src/init.jl index 96aa6d7f0d69..2a9844b0cd2f 100644 --- a/src/init.jl +++ b/src/init.jl @@ -81,9 +81,12 @@ macro mx_define_handle_t(name, destructor) end end) - function Base.convert(::Type{MX_handle}, obj::$name) + function Base.unsafe_convert(::Type{MX_handle}, obj::$name) obj.value end + Base.convert(t::Type{MX_handle}, obj::$name) = Base.unsafe_convert(t, obj) + Base.cconvert(t::Type{MX_handle}, obj::$name) = Base.unsafe_convert(t, obj) + function Base.isnull(obj::$name) obj.value == C_NULL end end end diff --git a/src/ndarray.jl b/src/ndarray.jl index 0c20a56e6e87..7825b0e2a331 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,5 +1,5 @@ export NDArray -export delete +export empty # create a NDArray handle of specific shape function 
_ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) @@ -19,7 +19,9 @@ function _ndarray_alloc() return MX_NDArrayHandle(h_ref[]) end - +################################################################################ +# NDArray Type +################################################################################ type NDArray handle :: MX_NDArrayHandle writable :: Bool @@ -29,6 +31,9 @@ type NDArray end end +################################################################################ +# NDArray functions exported to the users +################################################################################ function empty{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) NDArray(_ndarray_alloc(shape, ctx, false)) end @@ -36,6 +41,24 @@ function empty(shape :: Int...) empty(shape) end +function Base.size(arr :: NDArray) + ref_ndim = Ref{MX_uint}(0) + ref_shape = Ref{Ptr{MX_uint}}(0) + @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), + arr.handle, ref_ndim, ref_shape) + tuple(map(Int, pointer_to_array(ref_shape[], ref_ndim[]))...) 
+end + +function to_array(arr :: NDArray) + out = Array(MX_float, size(arr)) + @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{MX_float}, Csize_t), + arr.handle, pointer(out), length(out)) + return out +end + +################################################################################ +# NDArray functions dynamically exported from libmx +################################################################################ module _lib # this module is used to hold functions automatically imported # from libmxnet From 0062c9db226b05439c20c7372616bf96f4505251 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 13:29:35 -0400 Subject: [PATCH 009/630] define unary ndarray functions --- src/ndarray.jl | 46 +++++++++++++++++++++++++++++++--------------- 1 file changed, 31 insertions(+), 15 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 7825b0e2a331..80a611a51bfc 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -63,10 +63,10 @@ module _lib # this module is used to hold functions automatically imported # from libmxnet end -function _register_function(lib::Module, name::Symbol, func::Function) - eval(lib, quote - $name = $func - end) +function _invoke_mxfunction(func_handle::MX_handle, use_vars, scalars, mut_vars) + @mxcall(:MXFuncInvoke, + (MX_handle, Ptr{MX_handle}, Ptr{MX_float}, Ptr{MX_handle}), + func_handle, use_vars, scalars, mut_vars) end @enum(LIBMX_FUNC_TYPE_MASK, @@ -126,29 +126,45 @@ function _import_ndarray_functions() end if n_mutate_vars == 1 && n_used_vars == 2 && n_scalars == 0 - println("defining $func_name") + println("defining binary $func_name") # binary ndarray function - function binary_ndarray_function(lhs::NDArray, rhs::NDArray, out::NDArray) + binary_func = (lhs::NDArray, rhs::NDArray, out::NDArray) -> begin @assert(out.writable) use_vars = MX_handle[lhs.handle, rhs.handle] scalars = MX_float[] mut_vars = MX_handle[out.handle] - @mxcall(:MXFuncInvoke, - (MX_handle, Ptr{MX_handle}, Ptr{MX_float}, Ptr{MX_handle}), - 
func_handle, use_vars, scalars, mut_vars) + _invoke_mxfunction(use_vars, scalars, mut_vars) return out end + eval(_lib, :(function $func_name(lhs, rhs, out) $binary_func(lhs, rhs, out) end)) + if accept_empty_mutate - function binary_ndarray_function(lhs::NDArray, rhs::NDArray) + binary_func_2 = (lhs::NDArray, rhs::NDArray) -> begin out = NDArray(_ndarray_alloc()) - binary_ndarray_function(lhs, rhs, out) + binary_func(lhs, rhs, out) end + eval(_lib, :(function $func_name(lhs, rhs) $binary_func_2(lhs, rhs) end)) + end + elseif n_mutate_vars == 1 && n_used_vars == 1 && n_scalars == 0 + println("defining unary $func_name") + # unary ndarray function + unary_func = (src::NDArray, out::NDArray) -> begin + @assert(out.writable) + use_vars = MX_handle[src.handle] + scalars = MX_float[] + mut_vars = MX_handle[out.handle] + _invoke_mxfunction(use_vars, scalars, mut_vars) + return out end + eval(_lib, :(function $func_name(src, out) $unary_func(src, out) end)) - # add methods to the module - eval(_lib, quote - $func_name = $binary_ndarray_function - end) + if accept_empty_mutate + unary_func_2 = (src::NDArray) -> begin + out = NDArray(_ndarray_alloc()) + unary_func(src, out) + end + eval(_lib, :(function $func_name(src) $unary_func_2(src) end)) + end end end end From 0ee41beca36e9f9b6311a2b469eaa34cf2ab2eb4 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 14:44:35 -0400 Subject: [PATCH 010/630] use a prefix instead of submodule for dynamically imported functions --- src/ndarray.jl | 71 +++++++++++++++++++++++++++----------------------- 1 file changed, 38 insertions(+), 33 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 80a611a51bfc..eae969c9d2af 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -59,10 +59,6 @@ end ################################################################################ # NDArray functions dynamically exported from libmx ################################################################################ -module _lib -# 
this module is used to hold functions automatically imported -# from libmxnet -end function _invoke_mxfunction(func_handle::MX_handle, use_vars, scalars, mut_vars) @mxcall(:MXFuncInvoke, (MX_handle, Ptr{MX_handle}, Ptr{MX_float}, Ptr{MX_handle}), @@ -98,7 +94,14 @@ function _import_ndarray_functions() @mxcall(:MXFuncGetInfo, (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) - func_name = symbol(bytestring(ref_name[])) + + # We attach the symbol ℵ (\aleph) to those functions to indicate that they are + # dynamically imported from libmxnet + # + # A first attempt was to collect all those functions in a submodule _lib. But working + # with submodules in Julia is really painful, especially when macros (@mxcall) are + # involved in a function that is to be dynamically generated via eval. + func_name = symbol("ℵ" * bytestring(ref_name[])) #---------------------------------------- # get function specification @@ -128,42 +131,44 @@ function _import_ndarray_functions() if n_mutate_vars == 1 && n_used_vars == 2 && n_scalars == 0 println("defining binary $func_name") # binary ndarray function - binary_func = (lhs::NDArray, rhs::NDArray, out::NDArray) -> begin - @assert(out.writable) - use_vars = MX_handle[lhs.handle, rhs.handle] - scalars = MX_float[] - mut_vars = MX_handle[out.handle] - _invoke_mxfunction(use_vars, scalars, mut_vars) - return out - end - eval(_lib, :(function $func_name(lhs, rhs, out) $binary_func(lhs, rhs, out) end)) + eval(mx, quote + function $func_name(lhs::NDArray, rhs::NDArray, out::NDArray) + @assert(out.writable) + use_vars = MX_handle[lhs.handle, rhs.handle] + scalars = MX_float[] + mut_vars = MX_handle[out.handle] + _invoke_mxfunction($func_handle, use_vars, scalars, mut_vars) + return out + end + end) if accept_empty_mutate - binary_func_2 = (lhs::NDArray, rhs::NDArray) -> begin - out = NDArray(_ndarray_alloc()) - 
binary_func(lhs, rhs, out) - end - eval(_lib, :(function $func_name(lhs, rhs) $binary_func_2(lhs, rhs) end)) + eval(mx, quote + function $func_name(lhs::NDArray, rhs::NDArray) + $func_name(lhs, rhs, NDArray(_ndarray_alloc())) + end + end) end elseif n_mutate_vars == 1 && n_used_vars == 1 && n_scalars == 0 println("defining unary $func_name") # unary ndarray function - unary_func = (src::NDArray, out::NDArray) -> begin - @assert(out.writable) - use_vars = MX_handle[src.handle] - scalars = MX_float[] - mut_vars = MX_handle[out.handle] - _invoke_mxfunction(use_vars, scalars, mut_vars) - return out - end - eval(_lib, :(function $func_name(src, out) $unary_func(src, out) end)) + eval(mx, quote + function $func_name(src::NDArray, out::NDArray) + @assert(out.writable) + use_vars = MX_handle[src.handle] + scalars = MX_float[] + mut_vars = MX_handle[out.handle] + _invoke_mxfunction($func_handle, use_vars, scalars, mut_vars) + return out + end + end) if accept_empty_mutate - unary_func_2 = (src::NDArray) -> begin - out = NDArray(_ndarray_alloc()) - unary_func(src, out) - end - eval(_lib, :(function $func_name(src) $unary_func_2(src) end)) + eval(mx, quote + function $func_name(src::NDArray) + $func_name(NDArray(_ndarray_alloc())) + end + end) end end end From f3184ad031b6496c8d1077471ac1e4a5bc91428f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 15:44:01 -0400 Subject: [PATCH 011/630] a more general way of defining mx imported functions --- src/ndarray.jl | 59 +++++++++++++++++++++++++++++++++++++++++--------- 1 file changed, 49 insertions(+), 10 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index eae969c9d2af..09b47acaf445 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -31,6 +31,12 @@ type NDArray end end +function Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) + Base.unsafe_convert(MX_handle, obj.handle) +end +Base.convert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) +Base.cconvert(t::Type{MX_handle}, 
obj::NDArray) = Base.unsafe_convert(t, obj) + ################################################################################ # NDArray functions exported to the users ################################################################################ @@ -45,14 +51,14 @@ function Base.size(arr :: NDArray) ref_ndim = Ref{MX_uint}(0) ref_shape = Ref{Ptr{MX_uint}}(0) @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), - arr.handle, ref_ndim, ref_shape) + arr, ref_ndim, ref_shape) tuple(map(Int, pointer_to_array(ref_shape[], ref_ndim[]))...) end function to_array(arr :: NDArray) out = Array(MX_float, size(arr)) @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{MX_float}, Csize_t), - arr.handle, pointer(out), length(out)) + arr, pointer(out), length(out)) return out end @@ -131,19 +137,19 @@ function _import_ndarray_functions() if n_mutate_vars == 1 && n_used_vars == 2 && n_scalars == 0 println("defining binary $func_name") # binary ndarray function - eval(mx, quote + eval(quote function $func_name(lhs::NDArray, rhs::NDArray, out::NDArray) @assert(out.writable) - use_vars = MX_handle[lhs.handle, rhs.handle] + use_vars = MX_handle[lhs, rhs] scalars = MX_float[] - mut_vars = MX_handle[out.handle] + mut_vars = MX_handle[out] _invoke_mxfunction($func_handle, use_vars, scalars, mut_vars) return out end end) if accept_empty_mutate - eval(mx, quote + eval(quote function $func_name(lhs::NDArray, rhs::NDArray) $func_name(lhs, rhs, NDArray(_ndarray_alloc())) end @@ -152,24 +158,57 @@ function _import_ndarray_functions() elseif n_mutate_vars == 1 && n_used_vars == 1 && n_scalars == 0 println("defining unary $func_name") # unary ndarray function - eval(mx, quote + eval(quote function $func_name(src::NDArray, out::NDArray) @assert(out.writable) - use_vars = MX_handle[src.handle] + use_vars = MX_handle[src] scalars = MX_float[] - mut_vars = MX_handle[out.handle] + mut_vars = MX_handle[out] _invoke_mxfunction($func_handle, use_vars, scalars, mut_vars) return out end 
end) if accept_empty_mutate - eval(mx, quote + eval(quote function $func_name(src::NDArray) $func_name(NDArray(_ndarray_alloc())) end end) end + else + println("defining generic $func_name") + # general ndarray function + args = vcat([Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], + [Expr(:(::), symbol("sca$i"), AbstractFloat) for i=1:n_scalars], + [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) + _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...) + _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...) + _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...) + stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars) + if n_mutate_vars == 1 + stmt_ret = :(return out1) + else + stmt_ret = Expr(:return, Expr(:tuple, [symbol("out$i") for i=1:n_mutate_vars]...)) + end + + func_body = Expr(:block, stmt_call, stmt_ret) + func_head = Expr(:call, func_name, args...) + + func_def = Expr(:function, func_head, func_body) + eval(func_def) + + if accept_empty_mutate + args0 = args[1:n_used_vars+n_scalars] + func_head0 = Expr(:call, func_name, args0...) + _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] + stmt_call0 = Expr(:call, func_name, args0..., _mut_vars0...) + func_body0 = Expr(:block, stmt_call0) + func_head0 = Expr(:call, func_name, args0...) 
+ + func_def0 = Expr(:function, func_head0, func_body0) + eval(func_def0) + end end end end From e3a41197c9560397c86b2c48262b2ea99f5411ba Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 15:50:27 -0400 Subject: [PATCH 012/630] only the generic way of defining function is enough --- src/ndarray.jl | 115 ++++++++++++++++--------------------------------- 1 file changed, 36 insertions(+), 79 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 09b47acaf445..4ddd7ed6afdf 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -126,89 +126,46 @@ function _import_ndarray_functions() n_mutate_vars = ref_n_mut_vars[] type_mask = ref_type_mask[] accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 - if (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 - use_vars_range = 1:n_used_vars - scalar_range = n_used_vars+1:n_used_vars+n_scalars - else - scalar_range = 1:n_scalars - use_vars_range = n_scalars+1:n_scalars+n_used_vars - end + arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 - if n_mutate_vars == 1 && n_used_vars == 2 && n_scalars == 0 - println("defining binary $func_name") - # binary ndarray function - eval(quote - function $func_name(lhs::NDArray, rhs::NDArray, out::NDArray) - @assert(out.writable) - use_vars = MX_handle[lhs, rhs] - scalars = MX_float[] - mut_vars = MX_handle[out] - _invoke_mxfunction($func_handle, use_vars, scalars, mut_vars) - return out - end - end) - - if accept_empty_mutate - eval(quote - function $func_name(lhs::NDArray, rhs::NDArray) - $func_name(lhs, rhs, NDArray(_ndarray_alloc())) - end - end) - end - elseif n_mutate_vars == 1 && n_used_vars == 1 && n_scalars == 0 - println("defining unary $func_name") - # unary ndarray function - eval(quote - function $func_name(src::NDArray, out::NDArray) - @assert(out.writable) - use_vars = MX_handle[src] - scalars = MX_float[] - mut_vars = MX_handle[out] - _invoke_mxfunction($func_handle, use_vars, scalars, 
mut_vars) - return out - end - end) - - if accept_empty_mutate - eval(quote - function $func_name(src::NDArray) - $func_name(NDArray(_ndarray_alloc())) - end - end) - end - else - println("defining generic $func_name") - # general ndarray function + println("defining generic $func_name") + # general ndarray function + if arg_before_scalar args = vcat([Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], [Expr(:(::), symbol("sca$i"), AbstractFloat) for i=1:n_scalars], [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...) - _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...) - _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...) - stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars) - if n_mutate_vars == 1 - stmt_ret = :(return out1) - else - stmt_ret = Expr(:return, Expr(:tuple, [symbol("out$i") for i=1:n_mutate_vars]...)) - end - - func_body = Expr(:block, stmt_call, stmt_ret) - func_head = Expr(:call, func_name, args...) - - func_def = Expr(:function, func_head, func_body) - eval(func_def) - - if accept_empty_mutate - args0 = args[1:n_used_vars+n_scalars] - func_head0 = Expr(:call, func_name, args0...) - _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] - stmt_call0 = Expr(:call, func_name, args0..., _mut_vars0...) - func_body0 = Expr(:block, stmt_call0) - func_head0 = Expr(:call, func_name, args0...) - - func_def0 = Expr(:function, func_head0, func_body0) - eval(func_def0) - end + else + args = vcat([Expr(:(::), symbol("sca$i"), AbstractFloat) for i=1:n_scalars], + [Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], + [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) + end + + _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...) + _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...) 
+ _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...) + stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars) + if n_mutate_vars == 1 + stmt_ret = :(return out1) + else + stmt_ret = Expr(:return, Expr(:tuple, [symbol("out$i") for i=1:n_mutate_vars]...)) + end + + func_body = Expr(:block, stmt_call, stmt_ret) + func_head = Expr(:call, func_name, args...) + + func_def = Expr(:function, func_head, func_body) + eval(func_def) + + if accept_empty_mutate + args0 = args[1:n_used_vars+n_scalars] + func_head0 = Expr(:call, func_name, args0...) + _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] + stmt_call0 = Expr(:call, func_name, args0..., _mut_vars0...) + func_body0 = Expr(:block, stmt_call0) + func_head0 = Expr(:call, func_name, args0...) + + func_def0 = Expr(:function, func_head0, func_body0) + eval(func_def0) end end end From 5ed258f609c28223a85072a8b8c90b5642743ae0 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 22:39:50 -0400 Subject: [PATCH 013/630] common array-like interface functions --- src/ndarray.jl | 86 ++++++++++++++++++++++++++++++++++++++++++++++---- 1 file changed, 80 insertions(+), 6 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 4ddd7ed6afdf..57fc8f1ee24f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -47,6 +47,9 @@ function empty(shape :: Int...) empty(shape) end +#------------------------------------------------------------ +# Interface functions similar to Julia Arrays +#------------------------------------------------------------ function Base.size(arr :: NDArray) ref_ndim = Ref{MX_uint}(0) ref_shape = Ref{Ptr{MX_uint}}(0) @@ -54,14 +57,85 @@ function Base.size(arr :: NDArray) arr, ref_ndim, ref_shape) tuple(map(Int, pointer_to_array(ref_shape[], ref_ndim[]))...) 
end +function Base.size(arr :: NDArray, dim :: Int) + size(arr)[dim] +end +function Base.length(arr :: NDArray) + prod(size(arr)) +end +function Base.ndims(arr :: NDArray) + length(size(arr)) +end +function Base.eltype(arr :: NDArray) + MX_float +end + +"Create zero-ed NDArray of specific shape" +function zeros{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) + arr = empty(shape, ctx) + arr[:] = 0 + return arr +end +function zeros(shape :: Int...) + zeros(shape) +end + +"Assign all elements of an NDArray to a scalar" +function Base.setindex!(arr :: NDArray, val :: Real, ::Colon) + ℵ_set_value(val, arr) + return arr +end + +#------------------------------------------------------------ +# Copying functions +#------------------------------------------------------------ +"Copy data between NDArrays" +function Base.copy!(dst :: NDArray, src :: NDArray) + if dst.handle == src.handle + warn("Copying an NDArray to itself") + return + end -function to_array(arr :: NDArray) - out = Array(MX_float, size(arr)) + ℵ_copy_to(src, dst) + return dst +end + +"Copy data from NDArray to Julia Array" +function Base.copy!(dst :: Array{MX_float}, src :: NDArray) + @assert size(dst) == size(src) @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{MX_float}, Csize_t), - arr, pointer(out), length(out)) - return out + src, pointer(dst), length(dst)) + return dst +end + +"Copy data from Julia Array to NDArray" +function Base.copy!{T<:Real}(dst :: NDArray, src :: Array{T}) + @assert size(dst) == size(src) + src = convert(Array{MX_float}, src) # this might involve copying + @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t), + dst.handle, pointer(src), length(src)) + return dst +end + +"Create copy: NDArray -> Julia Array" +function Base.copy(arr :: NDArray) + j_arr = Array(MX_float, size(arr)) + Base.copy!(j_arr, arr) end +"Create copy: NDArray -> NDArray in a given context" +function Base.copy(arr :: NDArray, ctx :: Context) + dst = 
NDArray(_ndarray_alloc(size(arr), ctx, true)) + Base.copy!(dst, arr) +end + +"Create copy: Julia Array -> NDArray in a given context" +function Base.copy{T<:Real}(arr :: Array{T}, ctx :: Context) + dst = NDArray(_ndarray_alloc(size(arr), ctx, true)) + Base.copy!(dst, arr) +end + + ################################################################################ # NDArray functions dynamically exported from libmx ################################################################################ @@ -132,10 +206,10 @@ function _import_ndarray_functions() # general ndarray function if arg_before_scalar args = vcat([Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), symbol("sca$i"), AbstractFloat) for i=1:n_scalars], + [Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) else - args = vcat([Expr(:(::), symbol("sca$i"), AbstractFloat) for i=1:n_scalars], + args = vcat([Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], [Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) end From 59dcb7ead324b50206077e48f8ff6f6da71c7ac3 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 3 Oct 2015 23:43:57 -0400 Subject: [PATCH 014/630] inplace operator for + --- src/context.jl | 4 ++-- src/ndarray.jl | 57 +++++++++++++++++++++++++++++++++++++++++++++++++- 2 files changed, 58 insertions(+), 3 deletions(-) diff --git a/src/context.jl b/src/context.jl index af8cfd725a49..3dbf7e6e482a 100644 --- a/src/context.jl +++ b/src/context.jl @@ -6,8 +6,8 @@ type Context old_ctx :: Nullable{Context} end -Context(dev_type :: CONTEXT_TYPE, dev_id = 0) = - Context(dev_type, dev_id, Nullable{Context}()) +Context(dev_type :: Union{CONTEXT_TYPE, Integer}, dev_id :: Integer = 0) = + Context(convert(CONTEXT_TYPE, dev_type), convert(Cint, dev_id), Nullable{Context}()) # global default context diff --git a/src/ndarray.jl b/src/ndarray.jl index 
57fc8f1ee24f..1a05aabc9e69 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -40,6 +40,14 @@ Base.cconvert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) ################################################################################ # NDArray functions exported to the users ################################################################################ +function context(arr :: NDArray) + ref_typeid = Ref{Cint}(0) + ref_devid = Ref{Cint}(0) + @mxcall(:MXNDArrayGetContext, (MX_handle, Ref{Cint}, Ref{Cint}), + arr, ref_typeid, ref_devid) + return Context(ref_typeid[], ref_devid[]) +end + function empty{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) NDArray(_ndarray_alloc(shape, ctx, false)) end @@ -96,7 +104,7 @@ function Base.copy!(dst :: NDArray, src :: NDArray) return end - ℵ_copy_to(src, dst) + ℵ_copyto(src, dst) return dst end @@ -136,6 +144,53 @@ function Base.copy{T<:Real}(arr :: Array{T}, ctx :: Context) end +#------------------------------------------------------------ +# Basic arithmetics +#------------------------------------------------------------ +""" +Julia does not support re-definiton of += operator (like __iadd__ in python), +When one write a += b, it gets translated to a = a+b. a+b will allocate new +memory for the results, and the newly allocated NDArray object is then assigned +back to a, while the original contents in a is discarded. This is very inefficient +when we want to do inplace update. + +This macro is a simple utility to implement this behavior. Write + + @mx.inplace a += b + +will translate into + + mx.add!(a, b) + +which will do inplace adding of the contents of b into a. +""" +macro inplace(stmt) + if stmt.head == :+= + Expr(:call, :add!, esc(stmt.args[1]), esc(stmt.args[2])) + else + error("unsupported inplace translation for $stmt") + end +end + +function add!(dst :: NDArray, args :: Union{Real, NDArray}...) 
+ for arg in args + if isa(arg, Real) + ℵ_plus_scalar(dst, arg, dst) + else + ℵ_plus(dst, arg, dst) + end + end + return dst +end + +# We fix the first arg to be NDArray to avoid ambiguity +import Base.+ +function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) + ret = copy(arg0, context(arg0)) + add!(ret, args...) +end + + ################################################################################ # NDArray functions dynamically exported from libmx ################################################################################ From 678f6f2541c3468da4ab3b0e8553873b8553527e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 5 Oct 2015 01:53:14 -0400 Subject: [PATCH 015/630] basic test for ndarray --- src/ndarray.jl | 52 +++++++++++++++++++--------------------- test/runtests.jl | 3 +-- test/unittest/ndarray.jl | 37 ++++++++++++++++++++++++++++ 3 files changed, 62 insertions(+), 30 deletions(-) create mode 100644 test/unittest/ndarray.jl diff --git a/src/ndarray.jl b/src/ndarray.jl index 1a05aabc9e69..e582b949375f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -58,23 +58,24 @@ end #------------------------------------------------------------ # Interface functions similar to Julia Arrays #------------------------------------------------------------ -function Base.size(arr :: NDArray) +import Base: size, length, ndims, eltype +function size(arr :: NDArray) ref_ndim = Ref{MX_uint}(0) ref_shape = Ref{Ptr{MX_uint}}(0) @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), arr, ref_ndim, ref_shape) tuple(map(Int, pointer_to_array(ref_shape[], ref_ndim[]))...) 
end -function Base.size(arr :: NDArray, dim :: Int) +function size(arr :: NDArray, dim :: Int) size(arr)[dim] end -function Base.length(arr :: NDArray) +function length(arr :: NDArray) prod(size(arr)) end -function Base.ndims(arr :: NDArray) +function ndims(arr :: NDArray) length(size(arr)) end -function Base.eltype(arr :: NDArray) +function eltype(arr :: NDArray) MX_float end @@ -88,28 +89,30 @@ function zeros(shape :: Int...) zeros(shape) end +import Base: setindex! "Assign all elements of an NDArray to a scalar" -function Base.setindex!(arr :: NDArray, val :: Real, ::Colon) - ℵ_set_value(val, arr) +function setindex!(arr :: NDArray, val :: Real, ::Colon) + _set_value(val, arr) return arr end #------------------------------------------------------------ # Copying functions #------------------------------------------------------------ +import Base: copy!, copy "Copy data between NDArrays" -function Base.copy!(dst :: NDArray, src :: NDArray) +function copy!(dst :: NDArray, src :: NDArray) if dst.handle == src.handle warn("Copying an NDArray to itself") return end - ℵ_copyto(src, dst) + _copyto(src, dst) return dst end "Copy data from NDArray to Julia Array" -function Base.copy!(dst :: Array{MX_float}, src :: NDArray) +function copy!(dst :: Array{MX_float}, src :: NDArray) @assert size(dst) == size(src) @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{MX_float}, Csize_t), src, pointer(dst), length(dst)) @@ -117,7 +120,7 @@ function Base.copy!(dst :: Array{MX_float}, src :: NDArray) end "Copy data from Julia Array to NDArray" -function Base.copy!{T<:Real}(dst :: NDArray, src :: Array{T}) +function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) @assert size(dst) == size(src) src = convert(Array{MX_float}, src) # this might involve copying @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t), @@ -126,21 +129,21 @@ function Base.copy!{T<:Real}(dst :: NDArray, src :: Array{T}) end "Create copy: NDArray -> Julia Array" -function Base.copy(arr :: 
NDArray) +function copy(arr :: NDArray) j_arr = Array(MX_float, size(arr)) - Base.copy!(j_arr, arr) + copy!(j_arr, arr) end "Create copy: NDArray -> NDArray in a given context" -function Base.copy(arr :: NDArray, ctx :: Context) +function copy(arr :: NDArray, ctx :: Context) dst = NDArray(_ndarray_alloc(size(arr), ctx, true)) - Base.copy!(dst, arr) + copy!(dst, arr) end "Create copy: Julia Array -> NDArray in a given context" -function Base.copy{T<:Real}(arr :: Array{T}, ctx :: Context) - dst = NDArray(_ndarray_alloc(size(arr), ctx, true)) - Base.copy!(dst, arr) +function copy{T<:Real}(arr :: Array{T}, ctx :: Context) + dst = NDArray(_ndarray_alloc(size(arr), ctx, false)) + copy!(dst, arr) end @@ -175,9 +178,9 @@ end function add!(dst :: NDArray, args :: Union{Real, NDArray}...) for arg in args if isa(arg, Real) - ℵ_plus_scalar(dst, arg, dst) + _plus_scalar(dst, arg, dst) else - ℵ_plus(dst, arg, dst) + _plus(dst, arg, dst) end end return dst @@ -230,13 +233,7 @@ function _import_ndarray_functions() (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) - # We attach the symbol ℵ (\aleph) to those functions to indicate that they are - # dynamically imported from libmxnet - # - # A first attempt was to collect all those functions in a submodule _lib. But working - # with submodules in Julia is really painful, especially when macros (@mxcall) are - # involved in a function that is to be dynamically generated via eval. 
- func_name = symbol("ℵ" * bytestring(ref_name[])) + func_name = symbol(bytestring(ref_name[])) #---------------------------------------- # get function specification @@ -257,7 +254,6 @@ function _import_ndarray_functions() accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 - println("defining generic $func_name") # general ndarray function if arg_before_scalar args = vcat([Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], diff --git a/test/runtests.jl b/test/runtests.jl index d6005fcf699d..d1aa01edbc29 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -1,5 +1,4 @@ using MXNet using Base.Test -# write your own tests here -@test 1 == 1 +include("unittest/ndarray.jl") diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl new file mode 100644 index 000000000000..7ead256fcb66 --- /dev/null +++ b/test/unittest/ndarray.jl @@ -0,0 +1,37 @@ +module TestNDArray +using MXNet +using Base.Test + +################################################################################ +# Test Implementations +################################################################################ +function reldiff(a, b) + diff = sum(abs(a - b)) + norm = sum(abs(a)) + return diff / norm +end + +function test_copy() + dims = tuple(rand(1:10, rand(1:6))...) 
+ tensor = rand(mx.MX_float, dims) + + info("NDArray::copy::dims = $dims") + + # copy to NDArray and back + array = copy(tensor, mx.DEFAULT_CONTEXT) + tensor2 = copy(array) + @test reldiff(tensor, tensor2) < 1e-6 + + # copy between NDArray + array2 = copy(array, mx.DEFAULT_CONTEXT) + tensor2 = copy(array2) + @test reldiff(tensor, tensor2) < 1e-6 +end + + +################################################################################ +# Run tests +################################################################################ +test_copy() + +end From 525c5b246bbad97629deaed96b0bbb60bf43571d Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 5 Oct 2015 01:55:39 -0400 Subject: [PATCH 016/630] comment out release testing until v0.4 is released --- .travis.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.travis.yml b/.travis.yml index 00656a7e0f7d..90bb9e569aea 100644 --- a/.travis.yml +++ b/.travis.yml @@ -4,7 +4,7 @@ os: - linux - osx julia: - - release + #- release - nightly notifications: email: false From e0a0bbe17191503414fcbeb762f2bc0b57ef3bfd Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 5 Oct 2015 10:55:05 -0400 Subject: [PATCH 017/630] fix copy from and to CPU --- src/ndarray.jl | 2 +- test/runtests.jl | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index e582b949375f..13ddf983050a 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -142,7 +142,7 @@ end "Create copy: Julia Array -> NDArray in a given context" function copy{T<:Real}(arr :: Array{T}, ctx :: Context) - dst = NDArray(_ndarray_alloc(size(arr), ctx, false)) + dst = empty(size(arr), ctx) copy!(dst, arr) end diff --git a/test/runtests.jl b/test/runtests.jl index d1aa01edbc29..73cc6eae494d 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -2,3 +2,4 @@ using MXNet using Base.Test include("unittest/ndarray.jl") + From 6294c93623d20619e0a75e1860ca289ed71a6e98 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: 
Tue, 6 Oct 2015 00:15:48 -0400 Subject: [PATCH 018/630] ndarray plus and minus unit-tests --- src/ndarray.jl | 27 ++++++++++++++-- test/unittest/ndarray.jl | 67 +++++++++++++++++++++++++++++++++++++++- 2 files changed, 91 insertions(+), 3 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 13ddf983050a..32ae66e1cf80 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -168,8 +168,10 @@ will translate into which will do inplace adding of the contents of b into a. """ macro inplace(stmt) - if stmt.head == :+= + if stmt.head == :+= || stmt.head == :.+= Expr(:call, :add!, esc(stmt.args[1]), esc(stmt.args[2])) + elseif stmt.head == :-= || stmt.head == :.-= + Expr(:call, :sub!, esc(stmt.args[1]), esc(stmt.args[2])) else error("unsupported inplace translation for $stmt") end @@ -187,12 +189,33 @@ function add!(dst :: NDArray, args :: Union{Real, NDArray}...) end # We fix the first arg to be NDArray to avoid ambiguity -import Base.+ +import Base: +, .+ function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) ret = copy(arg0, context(arg0)) add!(ret, args...) end +function .+(arg0 :: NDArray, args :: Union{Real, NDArray}...) + +(arg0, args...) 
+end +function sub!(dst :: NDArray, arg :: Union{Real, NDArray}) + if isa(arg, Real) + _minus_scalar(dst, arg, dst) + else + _minus(dst, arg, dst) + end +end +import Base: -, .- +function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) + ret = copy(arg0, context(arg0)) + sub!(ret, arg1) +end +function .-(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) + -(arg0, arg1) +end +function -(arg0 :: NDArray) + _mul_scalar(arg0, -1.0) +end ################################################################################ # NDArray functions dynamically exported from libmx diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 7ead256fcb66..c066745f79ca 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -11,8 +11,17 @@ function reldiff(a, b) return diff / norm end +function rand_dims() + tuple(rand(1:10, rand(1:6))...) +end +function rand_tensors{N}(dims::NTuple{N, Int}) + tensor = rand(mx.MX_float, dims) + array = copy(tensor, mx.DEFAULT_CONTEXT) + return (tensor, array) +end + function test_copy() - dims = tuple(rand(1:10, rand(1:6))...) 
+ dims = rand_dims() tensor = rand(mx.MX_float, dims) info("NDArray::copy::dims = $dims") @@ -28,10 +37,66 @@ function test_copy() @test reldiff(tensor, tensor2) < 1e-6 end +function test_plus() + dims = rand_dims() + t1, a1 = rand_tensors(dims) + t2, a2 = rand_tensors(dims) + t3, a3 = rand_tensors(dims) + + info("NDArray::plus::dims = $dims") + + @test reldiff(t1+t2, copy(a1+a2)) < 1e-6 + @test reldiff(t1.+t2, copy(a1.+a2)) < 1e-6 + + @test reldiff(t1+t2+t3, copy(a1+a2+a3)) < 1e-6 + + # test inplace += operation + a0 = a1 # keep a reference to a1 + @mx.inplace a1 += a2 # perform inplace += + @test a0 == a1 # make sure they are still the same object + @test reldiff(copy(a0), copy(a1)) < 1e-6 + @test reldiff(copy(a1), t1+t2) < 1e-6 + + # test scalar + scalar = rand() + @test reldiff(t3 + scalar, copy(a3 + scalar)) < 1e-6 + @test reldiff(t2+scalar+t3, copy(a2+scalar+a3)) < 1e-6 +end + +function test_minus() + dims = rand_dims() + t1, a1 = rand_tensors(dims) + t2, a2 = rand_tensors(dims) + + info("NDArray::minus::dims = $dims") + + @test reldiff(t1-t2, copy(a1-a2)) < 1e-6 + @test reldiff(t1.-t2, copy(a1.-a2)) < 1e-6 + + @test reldiff(-t1, copy(-a1)) < 1e-6 + + # make sure the negation is not in-place, so a1 is not changed after previous + # statement is executed + @test reldiff(t1, copy(a1)) < 1e-6 + + # test inplace -= operation + a0 = a1 # keep a reference to a1 + @mx.inplace a1 -= a2 # perform inplace -= + @test a0 == a1 # make sure they are still the same object + @test reldiff(copy(a0), copy(a1)) < 1e-6 + @test reldiff(copy(a1), t1-t2) < 1e-6 + + # test scalar + scalar = rand() + @test reldiff(t2 - scalar, copy(a2 - scalar)) < 1e-6 +end + ################################################################################ # Run tests ################################################################################ test_copy() +test_plus() +test_minus() end From d6a13671ae6db393b7dfbca97729b6e653bfc059 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 
09:09:14 -0400 Subject: [PATCH 019/630] use more meaningful name for sub! and add! --- src/ndarray.jl | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 32ae66e1cf80..482adcb4f154 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -163,21 +163,21 @@ This macro is a simple utility to implement this behavior. Write will translate into - mx.add!(a, b) + mx.add_to!(a, b) which will do inplace adding of the contents of b into a. """ macro inplace(stmt) if stmt.head == :+= || stmt.head == :.+= - Expr(:call, :add!, esc(stmt.args[1]), esc(stmt.args[2])) + Expr(:call, :add_to!, esc(stmt.args[1]), esc(stmt.args[2])) elseif stmt.head == :-= || stmt.head == :.-= - Expr(:call, :sub!, esc(stmt.args[1]), esc(stmt.args[2])) + Expr(:call, :sub_from!, esc(stmt.args[1]), esc(stmt.args[2])) else error("unsupported inplace translation for $stmt") end end -function add!(dst :: NDArray, args :: Union{Real, NDArray}...) +function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) for arg in args if isa(arg, Real) _plus_scalar(dst, arg, dst) @@ -192,13 +192,13 @@ end import Base: +, .+ function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) ret = copy(arg0, context(arg0)) - add!(ret, args...) + add_to!(ret, args...) end function .+(arg0 :: NDArray, args :: Union{Real, NDArray}...) +(arg0, args...) 
end -function sub!(dst :: NDArray, arg :: Union{Real, NDArray}) +function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) if isa(arg, Real) _minus_scalar(dst, arg, dst) else @@ -208,7 +208,7 @@ end import Base: -, .- function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) - sub!(ret, arg1) + sub_from!(ret, arg1) end function .-(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) -(arg0, arg1) From d33dff8c214696924a78a2bdcbf981206224f717 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 09:16:23 -0400 Subject: [PATCH 020/630] assignment operator for NDArray --- src/ndarray.jl | 6 ++++++ test/unittest/ndarray.jl | 27 ++++++++++++++++++++++++++- 2 files changed, 32 insertions(+), 1 deletion(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 482adcb4f154..b1d9e2790204 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -95,6 +95,12 @@ function setindex!(arr :: NDArray, val :: Real, ::Colon) _set_value(val, arr) return arr end +function setindex!{T<:Real}(arr :: NDArray, val :: Array{T}, ::Colon) + copy!(arr, val) +end +function setindex!(arr :: NDArray, val :: NDArray, ::Colon) + copy!(arr, val) +end #------------------------------------------------------------ # Copying functions diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index c066745f79ca..084545bd3514 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -8,7 +8,7 @@ using Base.Test function reldiff(a, b) diff = sum(abs(a - b)) norm = sum(abs(a)) - return diff / norm + return diff / (norm + 1e-10) end function rand_dims() @@ -37,6 +37,30 @@ function test_copy() @test reldiff(tensor, tensor2) < 1e-6 end +function test_assign() + dims = rand_dims() + tensor = rand(mx.MX_float, dims) + + info("NDArray::assign::dims = $dims") + + # Julia Array -> NDArray assignment + array = mx.empty(size(tensor)) + array[:]= tensor + @test reldiff(tensor, copy(array)) < 1e-6 + + array2 = mx.zeros(size(tensor)) + @test 
reldiff(zeros(size(tensor)), copy(array2)) < 1e-6 + + # scalar -> NDArray assignment + scalar = rand() + array2[:] = scalar + @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < 1e-6 + + # NDArray -> NDArray assignment + array[:] = array2 + @test reldiff(zeros(size(tensor))+scalar, copy(array)) < 1e-6 +end + function test_plus() dims = rand_dims() t1, a1 = rand_tensors(dims) @@ -96,6 +120,7 @@ end # Run tests ################################################################################ test_copy() +test_assign() test_plus() test_minus() From b2acdc719fb0b0ac1c8264b29b8ccbd53cd5d1cf Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 09:31:38 -0400 Subject: [PATCH 021/630] test ndarray elem-wise mul --- src/ndarray.jl | 31 +++++++++++++++++++++++++++++++ test/unittest/ndarray.jl | 22 ++++++++++++++++++++++ 2 files changed, 53 insertions(+) diff --git a/src/ndarray.jl b/src/ndarray.jl index b1d9e2790204..48385cd31d26 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -178,6 +178,10 @@ macro inplace(stmt) Expr(:call, :add_to!, esc(stmt.args[1]), esc(stmt.args[2])) elseif stmt.head == :-= || stmt.head == :.-= Expr(:call, :sub_from!, esc(stmt.args[1]), esc(stmt.args[2])) + elseif stmt.head == :.*= + Expr(:call, :mul_to!, esc(stmt.args[1]), esc(stmt.args[2])) + elseif stmt.head == :./= + Expr(:call, :div_from!, esc(stmt.args[1]), esc(stmt.args[2])) else error("unsupported inplace translation for $stmt") end @@ -223,6 +227,33 @@ function -(arg0 :: NDArray) _mul_scalar(arg0, -1.0) end +function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) + if isa(arg, Real) + _mul_scalar(dst, arg, dst) + else + _mul(dst, arg, dst) + end + return dst +end +import Base: .*, * +function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) + ret = copy(arg0, context(arg0)) + mul_to!(ret, arg) +end + +function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) + if isa(arg, Real) + _div_scalar(dst, arg, dst) + else + _div(dst, arg, dst) + end +end +import Base: 
./ +function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) + ret = copy(arg0, context(arg0)) + div_from!(ret, arg) +end + ################################################################################ # NDArray functions dynamically exported from libmx ################################################################################ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 084545bd3514..ddf2084e1ed3 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -115,6 +115,27 @@ function test_minus() @test reldiff(t2 - scalar, copy(a2 - scalar)) < 1e-6 end +function test_mul() + dims = rand_dims() + t1, a1 = rand_tensors(dims) + t2, a2 = rand_tensors(dims) + t3, a3 = rand_tensors(dims) + + info("NDArray::mul::dims = $dims") + + @test reldiff(t1.*t2, copy(a1.*a2)) < 1e-6 + + # test inplace .*= operation + a0 = a1 # keep a reference to a1 + @mx.inplace a1 .*= a2 # perform inplace .*= + @test reldiff(copy(a0), copy(a1)) < 1e-6 + @test reldiff(copy(a1), t1.*t2) < 1e-6 + + # test scalar + scalar = rand() + @test reldiff(t3 * scalar, copy(a3 .* scalar)) < 1e-6 +end + ################################################################################ # Run tests @@ -123,5 +144,6 @@ test_copy() test_assign() test_plus() test_minus() +test_mul() end From 46675836e9cf0b600e8aca0582f1d72a20005172 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 09:36:38 -0400 Subject: [PATCH 022/630] unittest ndarray div --- test/unittest/ndarray.jl | 25 +++++++++++++++++++++++++ 1 file changed, 25 insertions(+) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index ddf2084e1ed3..15a3fea334ed 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -128,6 +128,7 @@ function test_mul() # test inplace .*= operation a0 = a1 # keep a reference to a1 @mx.inplace a1 .*= a2 # perform inplace .*= + @test a0 == a1 # make sure they are still the same object @test reldiff(copy(a0), copy(a1)) < 1e-6 @test 
reldiff(copy(a1), t1.*t2) < 1e-6 @@ -136,6 +137,29 @@ function test_mul() @test reldiff(t3 * scalar, copy(a3 .* scalar)) < 1e-6 end +function test_div() + dims = rand_dims() + t1, a1 = rand_tensors(dims) + t2, a2 = rand_tensors(dims) + + info("NDArray::div::dims = $dims") + t2 .+= 2 # avoid numerical instability + @mx.inplace a2 .+= 2 + + @test reldiff(t1 ./ t2, copy(a1 ./ a2)) < 1e-6 + + # test inplace -= operation + a0 = a1 # keep a reference to a2 + @mx.inplace a1 ./= a2 # perform inplace ./= + @test a0 == a1 # make sure they are still the same object + @test reldiff(copy(a0), copy(a1)) < 1e-6 + @test reldiff(copy(a1), t1 ./ t2) < 1e-6 + + # test scalar + scalar = rand() + 2 + @test reldiff(t2./scalar, copy(a2./scalar)) < 1e-6 +end + ################################################################################ # Run tests @@ -145,5 +169,6 @@ test_assign() test_plus() test_minus() test_mul() +test_div() end From 12ca85a6161fabc85a7941f654a1dad5b51d98e2 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 10:09:47 -0400 Subject: [PATCH 023/630] require julia v0.4 to run --- REQUIRE | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/REQUIRE b/REQUIRE index 2c4ef82cb1ab..d5d646713dcf 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1 +1 @@ -julia 0.3 +julia 0.4 From 65cc788a9c161c0626a0508043b264373b12551f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 10:39:57 -0400 Subject: [PATCH 024/630] basic symbol type --- src/MXNet.jl | 1 + src/init.jl | 1 + src/ndarray.jl | 3 +-- src/symbol.jl | 19 +++++++++++++++++++ 4 files changed, 22 insertions(+), 2 deletions(-) create mode 100644 src/symbol.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index efdf1c76c0c9..63748b278d15 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -8,6 +8,7 @@ module mx include("init.jl") include("context.jl") include("ndarray.jl") +include("symbol.jl") end # mx diff --git a/src/init.jl b/src/init.jl index 2a9844b0cd2f..6baa894cdd4f 100644 --- a/src/init.jl +++ 
b/src/init.jl @@ -93,4 +93,5 @@ end @mx_define_handle_t(MX_NDArrayHandle, MXNDArrayFree) @mx_define_handle_t(MX_FunctionHandle, nop) +@mx_define_handle_t(MX_SymbolHandle, MXSymbolFree) diff --git a/src/ndarray.jl b/src/ndarray.jl index 48385cd31d26..9845edd7eedd 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,5 +1,4 @@ export NDArray -export empty # create a NDArray handle of specific shape function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) @@ -255,7 +254,7 @@ function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) end ################################################################################ -# NDArray functions dynamically exported from libmx +# NDArray functions dynamically imported from libmxnet ################################################################################ function _invoke_mxfunction(func_handle::MX_handle, use_vars, scalars, mut_vars) @mxcall(:MXFuncInvoke, diff --git a/src/symbol.jl b/src/symbol.jl new file mode 100644 index 000000000000..e15d69859a72 --- /dev/null +++ b/src/symbol.jl @@ -0,0 +1,19 @@ +export Symbol + + +################################################################################ +# Symbol Type +################################################################################ +type Symbol + handle :: MX_SymbolHandle +end + +function variable(name :: Union{Base.Symbol, AbstractString}) + hdr_ref = Ref{MX_handle} + @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) + Symbol(MX_SymbolHandle(hdr_ref[])) +end + +################################################################################ +# Atomic Symbol functions dynamically exported from libmxnet +################################################################################ From 4170e376119534f52b4c851aeba637579a5c171b Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 11:06:25 -0400 Subject: [PATCH 025/630] possibility to add dynamic doc string to imported functions --- 
src/ndarray.jl | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) diff --git a/src/ndarray.jl b/src/ndarray.jl index 9845edd7eedd..4d6bd5407eaa 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -267,6 +267,25 @@ end ACCEPT_EMPTY_MUTATE_TARGET = (1 << 2) ) +""" +Import dynamic functions for NDArrays. The arguments to the functions are typically ordered +as + + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) + +unless NDARRAY_ARG_BEFORE_SCALAR is not set. In this case, the scalars are put before the input arguments: + + func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) + +If ACCEPT_EMPTY_MUTATE_TARGET is set. An overloaded function without the output arguments will also be defined: + + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) + +Upon calling, the output arguments will be automatically initialized with empty NDArrays. + +Those functions always return the output arguments. If there is only one output (the typical situation), that +object (NDArray) is returned. Otherwise, a tuple containing all the outputs will be returned. 
+""" function _import_ndarray_functions() n_ref = Ref{MX_uint}(0) h_ref = Ref{Ptr{MX_handle}}(0) @@ -351,6 +370,9 @@ function _import_ndarray_functions() func_def0 = Expr(:function, func_head0, func_body0) eval(func_def0) end + + # TODO: add doc string + # eval(:(@doc($doc_str, $func_name))) end end From 6490928f4ee776e6527b070baacde3b4453acbc4 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 12:20:36 -0400 Subject: [PATCH 026/630] try setting up travis CI --- .travis.yml | 25 ++++++++++++++++++++++++- src/init.jl | 2 +- test/travis/build_mxnet.sh | 12 ++++++++++++ test/travis/setup_env.sh | 1 + 4 files changed, 38 insertions(+), 2 deletions(-) create mode 100755 test/travis/build_mxnet.sh create mode 100755 test/travis/setup_env.sh diff --git a/.travis.yml b/.travis.yml index 90bb9e569aea..687835d65a97 100644 --- a/.travis.yml +++ b/.travis.yml @@ -2,10 +2,33 @@ language: julia os: - linux - - osx + #- osx julia: #- release - nightly + +# dependent apt packages +addons: + apt: + sources: + - ubuntu-toolchain-r-test + packages: + - doxygen + - wget + - git + - libcurl4-openssl-dev + - unzip + - libatlas-dev + - libopencv-dev + - gcc-4.8 + - g++-4.8 + - clang + +before_install: + - export TRAVIS=tests/travis + - source $TRAVIS/setup_env.sh + - source $TRAVIS/build_mxnet.sh + notifications: email: false # uncomment the following lines to override the default test script diff --git a/src/init.jl b/src/init.jl index 6baa894cdd4f..cef8e54c03e0 100644 --- a/src/init.jl +++ b/src/init.jl @@ -18,7 +18,7 @@ typealias char_pp Ptr{char_p} ################################################################################ # Initialization and library API entrance ################################################################################ -const MXNET_LIB = Libdl.find_library(["libmxnet.so"], ["/Users/chiyuan/work/mxnet/mxnet/lib"]) +const MXNET_LIB = Libdl.find_library(["libmxnet.so"], ["$(get(ENV,"MXNET_HOME",""))/lib"]) function __init__() 
_import_ndarray_functions() diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh new file mode 100755 index 000000000000..e6ff20221a39 --- /dev/null +++ b/test/travis/build_mxnet.sh @@ -0,0 +1,12 @@ +#!/bin/bash + +git clone --recursive https://github.com/dmlc/mxnet +cd mxnet + +if [ ! -f config.mk ]; then + echo "Use the default config.m" + cp make/config.mk config.mk +fi + +make -j4 +export MXNET_HOME=$PWD diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh new file mode 100755 index 000000000000..a9bf588e2f88 --- /dev/null +++ b/test/travis/setup_env.sh @@ -0,0 +1 @@ +#!/bin/bash From 573eedd2129da5ad3167328badaa09531139bd1b Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 12:23:00 -0400 Subject: [PATCH 027/630] fix travis script --- .travis.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.travis.yml b/.travis.yml index 687835d65a97..8bbbd4101b76 100644 --- a/.travis.yml +++ b/.travis.yml @@ -1,4 +1,5 @@ # Documentation: http://docs.travis-ci.com/user/languages/julia/ +sudo: false language: julia os: - linux @@ -25,7 +26,7 @@ addons: - clang before_install: - - export TRAVIS=tests/travis + - export TRAVIS=test/travis - source $TRAVIS/setup_env.sh - source $TRAVIS/build_mxnet.sh From b1ca0625d9244ca286acd02bce9f632d20d746cf Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 12:30:25 -0400 Subject: [PATCH 028/630] more fix for travis script --- .travis.yml | 8 +++----- src/symbol.jl | 3 ++- test/travis/build_mxnet.sh | 7 ++++--- test/travis/run_test.sh | 4 ++++ test/travis/setup_env.sh | 5 +++++ 5 files changed, 18 insertions(+), 9 deletions(-) create mode 100755 test/travis/run_test.sh diff --git a/.travis.yml b/.travis.yml index 8bbbd4101b76..dc09f6b4252d 100644 --- a/.travis.yml +++ b/.travis.yml @@ -23,7 +23,6 @@ addons: - libopencv-dev - gcc-4.8 - g++-4.8 - - clang before_install: - export TRAVIS=test/travis @@ -32,7 +31,6 @@ before_install: notifications: email: false -# 
uncomment the following lines to override the default test script -#script: -# - if [[ -a .git/shallow ]]; then git fetch --unshallow; fi -# - julia -e 'Pkg.clone(pwd()); Pkg.build("MXNet"); Pkg.test("MXNet"; coverage=true)' + +script: + - source $TRAVIS/run_test.sh diff --git a/src/symbol.jl b/src/symbol.jl index e15d69859a72..9ff835703091 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -14,6 +14,7 @@ function variable(name :: Union{Base.Symbol, AbstractString}) Symbol(MX_SymbolHandle(hdr_ref[])) end + ################################################################################ -# Atomic Symbol functions dynamically exported from libmxnet +# Atomic Symbol functions dynamically imported from libmxnet ################################################################################ diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index e6ff20221a39..4e95ad32590d 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -1,12 +1,13 @@ #!/bin/bash -git clone --recursive https://github.com/dmlc/mxnet -cd mxnet +git clone --recursive https://github.com/dmlc/mxnet __mxnet_build +cd __mxnet_build if [ ! 
-f config.mk ]; then echo "Use the default config.m" cp make/config.mk config.mk fi -make -j4 +make -j4 || exit 1 + export MXNET_HOME=$PWD diff --git a/test/travis/run_test.sh b/test/travis/run_test.sh new file mode 100755 index 000000000000..a576c69f6979 --- /dev/null +++ b/test/travis/run_test.sh @@ -0,0 +1,4 @@ +#!/bin/bash + +if [[ -a .git/shallow ]]; then git fetch --unshallow; fi +julia -e 'Pkg.clone(pwd()); Pkg.build("MXNet"); Pkg.test("MXNet"; coverage=true)' diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh index a9bf588e2f88..73d3b52acc55 100755 --- a/test/travis/setup_env.sh +++ b/test/travis/setup_env.sh @@ -1 +1,6 @@ #!/bin/bash + +if [ ${TRAVIS_OS_NAME} == "linux" ]; then + export CXX="g++-4.8" + export CC="gcc-4.8" +fi From 7a66ef4a723ddad0a24da2dcb201d1b38ce92389 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 12:35:23 -0400 Subject: [PATCH 029/630] enable osx build on travis --- .travis.yml | 2 +- test/travis/setup_env.sh | 15 +++++++++++++-- 2 files changed, 14 insertions(+), 3 deletions(-) diff --git a/.travis.yml b/.travis.yml index dc09f6b4252d..cae2bfbb7a22 100644 --- a/.travis.yml +++ b/.travis.yml @@ -3,7 +3,7 @@ sudo: false language: julia os: - linux - #- osx + - osx julia: #- release - nightly diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh index 73d3b52acc55..b71b30761359 100755 --- a/test/travis/setup_env.sh +++ b/test/travis/setup_env.sh @@ -1,6 +1,17 @@ #!/bin/bash +echo "##########################" +echo $TRAVIS_OS_NAME + if [ ${TRAVIS_OS_NAME} == "linux" ]; then - export CXX="g++-4.8" - export CC="gcc-4.8" + alias g++="g++-4.8" + alias gcc="gcc-4.8" +fi + +if [ ${TRAVIS_OS_NAME} == "osx" ]; then + brew update + brew tap homebrew/science + brew info opencv + brew install graphviz + brew install opencv fi From b22c83f62eec779cf055cea46cfafa94ae52e3e4 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 12:42:07 -0400 Subject: [PATCH 030/630] fix build script --- 
test/travis/build_mxnet.sh | 14 ++++++++++++++ test/travis/setup_env.sh | 5 ----- 2 files changed, 14 insertions(+), 5 deletions(-) diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index 4e95ad32590d..549afb66e37e 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -6,6 +6,20 @@ cd __mxnet_build if [ ! -f config.mk ]; then echo "Use the default config.m" cp make/config.mk config.mk + + if [ ${TRAVIS_OS_NAME} == "linux" ]; then + sed -i 's/export CC = gcc/export CC = gcc-4.8/g' config.mk + sed -i 's/export CXX = g++/export CXX = g++4.8/g' config.mk + echo "==============================" + gcc --version + gcc-4.8 --version + fi + + if [ ${TRAVIS_OS_NAME} == "osx" ]; then + sed -i 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk + fi + + cat config.mk fi make -j4 || exit 1 diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh index b71b30761359..c654b1d95533 100755 --- a/test/travis/setup_env.sh +++ b/test/travis/setup_env.sh @@ -3,11 +3,6 @@ echo "##########################" echo $TRAVIS_OS_NAME -if [ ${TRAVIS_OS_NAME} == "linux" ]; then - alias g++="g++-4.8" - alias gcc="gcc-4.8" -fi - if [ ${TRAVIS_OS_NAME} == "osx" ]; then brew update brew tap homebrew/science From f9b88b0b81de116d2e1152b07dce8b815351e6eb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 12:44:49 -0400 Subject: [PATCH 031/630] fix typo --- test/travis/build_mxnet.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index 549afb66e37e..6d58db9a7461 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -9,7 +9,7 @@ if [ ! 
-f config.mk ]; then if [ ${TRAVIS_OS_NAME} == "linux" ]; then sed -i 's/export CC = gcc/export CC = gcc-4.8/g' config.mk - sed -i 's/export CXX = g++/export CXX = g++4.8/g' config.mk + sed -i 's/export CXX = g++/export CXX = g++-4.8/g' config.mk echo "==============================" gcc --version gcc-4.8 --version From bdd798ae0857b45f4fc922264c77f365c1a903d6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 12:48:32 -0400 Subject: [PATCH 032/630] properly switch directory --- test/travis/build_mxnet.sh | 1 + test/travis/setup_env.sh | 2 +- 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index 6d58db9a7461..35a064a8528b 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -25,3 +25,4 @@ fi make -j4 || exit 1 export MXNET_HOME=$PWD +cd .. diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh index c654b1d95533..242e034120b2 100755 --- a/test/travis/setup_env.sh +++ b/test/travis/setup_env.sh @@ -4,7 +4,7 @@ echo "##########################" echo $TRAVIS_OS_NAME if [ ${TRAVIS_OS_NAME} == "osx" ]; then - brew update + brew update >/dev/null 2>&1 brew tap homebrew/science brew info opencv brew install graphviz From 7713589761802ca5d22f5154b2ae286013fe346e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 12:50:05 -0400 Subject: [PATCH 033/630] fix sed option --- test/travis/build_mxnet.sh | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index 35a064a8528b..28073f0b05a5 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -10,13 +10,10 @@ if [ ! 
-f config.mk ]; then if [ ${TRAVIS_OS_NAME} == "linux" ]; then sed -i 's/export CC = gcc/export CC = gcc-4.8/g' config.mk sed -i 's/export CXX = g++/export CXX = g++-4.8/g' config.mk - echo "==============================" - gcc --version - gcc-4.8 --version fi if [ ${TRAVIS_OS_NAME} == "osx" ]; then - sed -i 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk + sed -i -s 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk fi cat config.mk From 8950df511562a57b1225899b24bb9d3a8fc0528e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 14:37:24 -0400 Subject: [PATCH 034/630] disable openmp for osx build --- test/travis/build_mxnet.sh | 3 +++ 1 file changed, 3 insertions(+) diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index 28073f0b05a5..5c2baf6da17e 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -13,7 +13,10 @@ if [ ! 
-f config.mk ]; then fi if [ ${TRAVIS_OS_NAME} == "osx" ]; then + # add built-in blas header file to path sed -i -s 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk + # disable openmp + sed -i -s 's%USE_OPENMP = 1%USE_OPENMP = 0%g' config.mk fi cat config.mk From 694f0bb4dce82afdfa2c244da01753dbd515378c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Oct 2015 15:21:53 -0400 Subject: [PATCH 035/630] add badges --- README.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/README.md b/README.md index e9ce3583fcae..85cd8cc114e8 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,8 @@ # MXNet [![Build Status](https://travis-ci.org/dmlc/MXNet.jl.svg?branch=master)](https://travis-ci.org/dmlc/MXNet.jl) +[![Coverage Status](https://img.shields.io/coveralls/dmlc/MXNet.jl.svg?style=flat)](https://coveralls.io/r/dmlc/MXNet.jl?branch=master) +[![License](https://img.shields.io/github/license/dmlc/MXNet.jl.svg?style=flat)](LICENSE.md) + Julia wrapper of [MXNet](https://github.com/dmlc/mxnet). From efb0b90739611b3ea05299a8baa806dfc3ae8657 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 8 Oct 2015 00:22:24 -0400 Subject: [PATCH 036/630] clean up built script --- test/travis/build_mxnet.sh | 26 ++++++++++++-------------- 1 file changed, 12 insertions(+), 14 deletions(-) diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index 5c2baf6da17e..7b7f421d3cdb 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -4,22 +4,20 @@ git clone --recursive https://github.com/dmlc/mxnet __mxnet_build cd __mxnet_build if [ ! 
-f config.mk ]; then - echo "Use the default config.m" - cp make/config.mk config.mk + echo "Use the default config.m" + cp make/config.mk config.mk - if [ ${TRAVIS_OS_NAME} == "linux" ]; then - sed -i 's/export CC = gcc/export CC = gcc-4.8/g' config.mk - sed -i 's/export CXX = g++/export CXX = g++-4.8/g' config.mk - fi + if [ ${TRAVIS_OS_NAME} == "linux" ]; then + sed -i 's/export CC = gcc/export CC = gcc-4.8/g' config.mk + sed -i 's/export CXX = g++/export CXX = g++-4.8/g' config.mk + fi - if [ ${TRAVIS_OS_NAME} == "osx" ]; then - # add built-in blas header file to path - sed -i -s 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk - # disable openmp - sed -i -s 's%USE_OPENMP = 1%USE_OPENMP = 0%g' config.mk - fi - - cat config.mk + if [ ${TRAVIS_OS_NAME} == "osx" ]; then + # add built-in blas header file to path + sed -i -s 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk + # disable openmp + sed -i -s 's%USE_OPENMP = 1%USE_OPENMP = 0%g' config.mk + fi fi make -j4 || exit 1 From 7626fe7e3168359fee11e2c21733efe8ad2dfadd Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 8 Oct 2015 00:57:24 -0400 Subject: [PATCH 037/630] list symbol creator functions --- src/init.jl | 2 ++ src/symbol.jl | 33 ++++++++++++++++++++++++++++++++- 2 files changed, 34 insertions(+), 1 deletion(-) diff --git a/src/init.jl b/src/init.jl index cef8e54c03e0..31ab5436c6cc 100644 --- a/src/init.jl +++ b/src/init.jl @@ -22,6 +22,8 @@ const MXNET_LIB = Libdl.find_library(["libmxnet.so"], ["$(get(ENV,"MXNET_HOME"," function __init__() _import_ndarray_functions() + _import_atomic_symbol_creators() + atexit() do # notify libmxnet we are shutting down ccall( ("MXNotifyShutdown", MXNET_LIB), Cint, () ) diff --git a/src/symbol.jl b/src/symbol.jl index 9ff835703091..0f14ce346007 
100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -1,6 +1,5 @@ export Symbol - ################################################################################ # Symbol Type ################################################################################ @@ -18,3 +17,35 @@ end ################################################################################ # Atomic Symbol functions dynamically imported from libmxnet ################################################################################ +function _define_atomic_symbol_creator(hdr :: MX_handle) + ref_name = Ref{char_p}(0) + ref_desc = Ref{char_p}(0) + ref_kv_nargs = Ref{char_p}(0) + ref_nargs = Ref{MX_uint}(0) + ref_arg_names = Ref{char_pp}(0) + ref_arg_types = Ref{char_pp}(0) + ref_arg_descs = Ref{char_pp}(0) + + @mxcall(:MXSymbolGetAtomicSymbolInfo, + (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, + Ref{char_pp}, Ref{char_p}), + hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, ref_kv_nargs) + + func_name = symbol(bytestring(ref_name[])) + kv_nargs = symbol(bytestring(ref_kv_nargs[])) + info("defining $func_name, kv_nargs = ($kv_nargs)") +end + +function _import_atomic_symbol_creators() + n_ref = Ref{MX_uint}(0) + h_ref = Ref{Ptr{MX_handle}}(0) + @mxcall(:MXSymbolListAtomicSymbolCreators, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) + + n_creators = n_ref[] + h_creators = pointer_to_array(h_ref[], n_creators) + + for i = 1:n_creators + creator_hdr = h_creators[i] + _define_atomic_symbol_creator(creator_hdr) + end +end From 627a8e5d571fc299391a2cf134e72f25e5d1f6db Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 8 Oct 2015 09:54:58 -0400 Subject: [PATCH 038/630] name manager --- src/MXNet.jl | 2 ++ src/name.jl | 46 +++++++++++++++++++++++++++++++++++++++++++ test/runtests.jl | 1 + test/unittest/name.jl | 31 +++++++++++++++++++++++++++++ 4 files changed, 80 insertions(+) create mode 100644 src/name.jl create mode 100644 
test/unittest/name.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index 63748b278d15..02cda42fbd25 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -7,7 +7,9 @@ module mx include("init.jl") include("context.jl") + include("ndarray.jl") +include("name.jl") include("symbol.jl") end # mx diff --git a/src/name.jl b/src/name.jl new file mode 100644 index 000000000000..5644809c79f9 --- /dev/null +++ b/src/name.jl @@ -0,0 +1,46 @@ +abstract AbstractNameManager +typealias NameType Union{Base.Symbol, AbstractString} +typealias NameCounter Dict{Base.Symbol, Int} + +import Base: get! + +"""Default implementation for generating a name for a symbol. + +When a name is specified by the user, it will be used. Otherwise, a name +is automatically generated based on the hint string. +""" +function _default_get_name!(counter :: NameCounter, name :: NameType, hint :: NameType) + if isa(name, Base.Symbol) || !isempty(name) + return symbol(name) + end + + hint = symbol(hint) + if !haskey(counter, hint) + counter[hint] = 0 + end + name = symbol("$hint$(counter[hint])") + counter[hint] += 1 + return name +end + +type BasicNameManager <: AbstractNameManager + counter :: NameCounter +end +BasicNameManager() = BasicNameManager(NameCounter()) + +function get!(manager :: BasicNameManager, name :: NameType, hint :: NameType) + _default_get_name!(manager.counter, name, hint) +end + +type PrefixNameManager <: AbstractNameManager + prefix :: Base.Symbol + counter :: NameCounter +end +PrefixNameManager(prefix :: NameType) = PrefixNameManager(symbol(prefix), NameCounter()) + +function get!(manager :: PrefixNameManager, name :: NameType, hint :: NameType) + name = _default_get_name!(manager.counter, name, hint) + return symbol("$(manager.prefix)$name") +end + +DEFAULT_NAME_MANAGER = BasicNameManager() diff --git a/test/runtests.jl b/test/runtests.jl index 73cc6eae494d..6b9e4e82384d 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -2,4 +2,5 @@ using MXNet using Base.Test 
include("unittest/ndarray.jl") +include("unittest/name.jl") diff --git a/test/unittest/name.jl b/test/unittest/name.jl new file mode 100644 index 000000000000..a7dd6f7bfc35 --- /dev/null +++ b/test/unittest/name.jl @@ -0,0 +1,31 @@ +module TestNameManager +using MXNet +using Base.Test + +function test_default() + info("NameManager::default") + + name = :_____aaaaa_____ + @test get!(mx.DEFAULT_NAME_MANAGER, name, "") == name + @test get!(mx.DEFAULT_NAME_MANAGER, string(name), "") == name + + hint = name + @test get!(mx.DEFAULT_NAME_MANAGER, "", hint) == symbol("$(hint)0") + @test get!(mx.DEFAULT_NAME_MANAGER, "", string(hint)) == symbol("$(hint)1") +end + +function test_prefix() + info("NameManager::prefix") + + name = :_____bbbbb_____ + prefix = :_____foobar_____ + + prefix_manager = mx.PrefixNameManager(prefix) + @test get!(prefix_manager, name, "") == symbol("$prefix$name") + @test get!(prefix_manager, "", name) == symbol("$prefix$(name)0") +end + +test_default() +test_prefix() + +end From 5fea0040a1a6001355f3b985a82fb904de0af1ab Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 8 Oct 2015 13:00:17 -0400 Subject: [PATCH 039/630] symbol constructor --- src/symbol.jl | 57 +++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 57 insertions(+) diff --git a/src/symbol.jl b/src/symbol.jl index 0f14ce346007..2fef2055a5dd 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -34,6 +34,63 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) func_name = symbol(bytestring(ref_name[])) kv_nargs = symbol(bytestring(ref_kv_nargs[])) info("defining $func_name, kv_nargs = ($kv_nargs)") + + # function $func_name(args...; kwargs...) 
+ func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) + func_body = quote + idx = findfirst(x -> x[1] == :name, kwargs) + if idx > 0 + name = kwargs[idx][2] + else + name = "" + end + + param_keys = AbstractString[] + param_vals = AbstractString[] + symbol_kws = Dict{Base.Symbol, Symbol}() + + if $kv_nargs != symbol("") && !in($kv_nargs, param_keys) + push!(param_keys, string($kv_nargs)) + push!(param_vals, string(length(args))) + end + + for (k,v) in kwargs + if k == :name; continue; end + if isa(v, Symbol) + symbol_kws[k] = v + else + push!(param_keys, string(k)) + push!(param_vals, string(v)) + end + end + + if length(args) != 0 && length(symbol_kws) != 0 + @assert(false, "$func_name only accepts Symbols either as positional or keyword arguments, not both.") + end + if $kv_nargs != symbol("") && length(symbol_kws) + @assert(false, "$func_name takes variable number of Symbol arguments, please pass input Symbols " * + "via positional arguments, instead of keyword arguments.") + end + + # create the symbol + ref_sym_hdr = Ref{MX_handle}() + @mxcall(:MXSymbolCreateAtomicSymbol, + (MX_handle, MX_unit, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}), + hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr) + sym_hdr = ref_sym_hdr[] + + sym = Symbol(MX_SymbolHandle(sym_hdr)) + hint = lowercase(string($func_name)) + name = get!(DEFAULT_NAME_MANAGER, name, hint) + + return sym + end + + func_def = Expr(:function, func_head, Expr(:block, func_body)) + eval(func_def) + + # TODO: add doc string + # eval(:(@doc($doc_str, $func_name))) end function _import_atomic_symbol_creators() From ce68e59351be81bb8d8beae3efe54cdcd3649f0c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 8 Oct 2015 19:40:03 -0400 Subject: [PATCH 040/630] symbol basic test --- src/symbol.jl | 116 ++++++++++++++++++++++++++++++++++++++++++----- test/runtests.jl | 3 ++ 2 files changed, 107 insertions(+), 12 deletions(-) diff --git a/src/symbol.jl 
b/src/symbol.jl index 2fef2055a5dd..ee3b773bc031 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -6,13 +6,96 @@ export Symbol type Symbol handle :: MX_SymbolHandle end +function Base.unsafe_convert(::Type{MX_handle}, obj::Symbol) + Base.unsafe_convert(MX_handle, obj.handle) +end +Base.convert(t::Type{MX_handle}, obj::Symbol) = Base.unsafe_convert(t, obj) +Base.cconvert(t::Type{MX_handle}, obj::Symbol) = Base.unsafe_convert(t, obj) + +function Base.deepcopy(self :: Symbol) + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXSymbolCopy, (MX_handle, Ref{MX_handle}), self, ref_hdr) + return Symbol(MX_SymbolHandle(ref_hdr[])) +end +function Base.copy(self :: Symbol) + Base.deepcopy(self) +end + +function Base.call(self :: Symbol, args :: Symbol...) + s = deepcopy(self) + _compose!(s, args...) +end +function Base.call(self :: Symbol; kwargs...) + s = deepcopy(self) + _compose!(s; kwargs...) +end + +macro _list_symbol_info(self, func_name) + quote + ref_sz = Ref{MX_uint}(0) + ref_names = Ref{char_pp}(0) + @mxcall($func_name, (MX_handle, Ref{MX_uint}, Ref{char_pp}), + $self, ref_sz, ref_names) + narg = ref_sz[] + names = pointer_to_array(ref_names[], narg) + names = [symbol(bytestring(x)) for x in names] + return names + end +end +function list_arguments(self :: Symbol) + @_list_symbol_info(self, :MXSymbolListArguments) +end +function list_outputs(self :: Symbol) + @_list_symbol_info(self, :MXSymbolListOutputs) +end +"""List all auxiliary states in the symbool. + +Auxiliary states are special states of symbols that do not corresponds to an argument, +and do not have gradient. But still be useful for the specific operations. +A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. +Most operators do not have Auxiliary states. 
+""" +function list_auxiliary_states(self :: Symbol) + @_list_symbol_info(self, :MXSymbolListAuxiliaryStates) +end function variable(name :: Union{Base.Symbol, AbstractString}) - hdr_ref = Ref{MX_handle} + hdr_ref = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) Symbol(MX_SymbolHandle(hdr_ref[])) end +"Compose symbol on inputs" +function _compose!(sym :: Symbol; kwargs...) + name = char_p(0) + arg_keys = AbstractString[] + arg_vals = MX_handle[] + + for (k,v) in kwargs + if k == :name + name = string(v) + else + @assert(isa(v, Symbol), "Compose expect `Symbol` as arguments") + push!(arg_keys, string(k)) + push!(arg_vals, v) + end + end + + @mxcall(:MXSymbolCompose, + (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}), + sym, name, length(arg_keys), arg_keys, arg_vals) + return sym +end +function _compose!(sym :: Symbol, args::Symbol...) + name = char_p(0) + arg_keys = Ptr{char_p}(0) + arg_vals = MX_handle[args...] + + @mxcall(:MXSymbolCompose, + (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}), + sym, name, length(arg_keys), arg_keys, arg_vals) + return sym +end ################################################################################ # Atomic Symbol functions dynamically imported from libmxnet @@ -33,7 +116,6 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) func_name = symbol(bytestring(ref_name[])) kv_nargs = symbol(bytestring(ref_kv_nargs[])) - info("defining $func_name, kv_nargs = ($kv_nargs)") # function $func_name(args...; kwargs...) 
func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) @@ -49,10 +131,14 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) param_vals = AbstractString[] symbol_kws = Dict{Base.Symbol, Symbol}() - if $kv_nargs != symbol("") && !in($kv_nargs, param_keys) - push!(param_keys, string($kv_nargs)) - push!(param_vals, string(length(args))) - end + $(if kv_nargs != symbol("") + quote + if !in("$kv_narg", param_keys) + push!(param_keys, string("$kv_nargs")) + push!(param_vals, string(length(args))) + end + end + end) for (k,v) in kwargs if k == :name; continue; end @@ -67,22 +153,28 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) if length(args) != 0 && length(symbol_kws) != 0 @assert(false, "$func_name only accepts Symbols either as positional or keyword arguments, not both.") end - if $kv_nargs != symbol("") && length(symbol_kws) - @assert(false, "$func_name takes variable number of Symbol arguments, please pass input Symbols " * - "via positional arguments, instead of keyword arguments.") - end + $(if kv_nargs != symbol("") + quote + if length(symbol_kws) > 0 + @assert(false, "$func_name takes variable number of Symbol arguments, please pass input Symbols " * + "via positional arguments, instead of keyword arguments.") + end + end + end) # create the symbol ref_sym_hdr = Ref{MX_handle}() @mxcall(:MXSymbolCreateAtomicSymbol, - (MX_handle, MX_unit, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}), - hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr) + (MX_handle, MX_uint, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}), + $hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr) sym_hdr = ref_sym_hdr[] sym = Symbol(MX_SymbolHandle(sym_hdr)) hint = lowercase(string($func_name)) name = get!(DEFAULT_NAME_MANAGER, name, hint) + _compose!(sym; name=name, symbol_kws...) 
+ return sym end diff --git a/test/runtests.jl b/test/runtests.jl index 6b9e4e82384d..d3c8684cbee8 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -1,6 +1,9 @@ using MXNet using Base.Test +include("unittest/common.jl") + include("unittest/ndarray.jl") include("unittest/name.jl") +include("unittest/symbol.jl") From 8701e0ae02c208711600bff62abe7f1ecd14caac Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 8 Oct 2015 20:01:52 -0400 Subject: [PATCH 041/630] symbol test_internal --- src/symbol.jl | 21 +++++++++++++++++++++ test/unittest/common.jl | 10 ++++++++++ test/unittest/symbol.jl | 39 +++++++++++++++++++++++++++++++++++++++ 3 files changed, 70 insertions(+) create mode 100644 test/unittest/common.jl create mode 100644 test/unittest/symbol.jl diff --git a/src/symbol.jl b/src/symbol.jl index ee3b773bc031..191398d9de25 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -59,12 +59,33 @@ function list_auxiliary_states(self :: Symbol) @_list_symbol_info(self, :MXSymbolListAuxiliaryStates) end +"Get a new grouped symbol whose output contains all the internal outputs of this symbol." 
+function get_internals(self :: Symbol) + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXSymbolGetInternals, (MX_handle, Ref{MX_handle}), self, ref_hdr) + return Symbol(MX_SymbolHandle(ref_hdr[])) +end + function variable(name :: Union{Base.Symbol, AbstractString}) hdr_ref = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) Symbol(MX_SymbolHandle(hdr_ref[])) end +function Base.getindex(self :: Symbol, idx :: Union{Base.Symbol, AbstractString}) + idx = symbol(idx) + i_idx = find(idx .== list_outputs(self)) + @assert(length(i_idx) > 0, "Cannot find output with name '$idx'") + @assert(length(i_idx) < 2, "Found duplicated output with name '$idx'") + Base.getindex(self, i_idx[1]) +end +function Base.getindex(self :: Symbol, idx :: Int) + ref_hdr = Ref{MX_handle}(0) + # note Julia is 1-based, while MXNet is 0-based + @mxcall(:MXSymbolGetOutput, (MX_handle, MX_uint, Ref{MX_handle}), self, idx-1, ref_hdr) + return Symbol(MX_SymbolHandle(ref_hdr[])) +end + "Compose symbol on inputs" function _compose!(sym :: Symbol; kwargs...) 
name = char_p(0) diff --git a/test/unittest/common.jl b/test/unittest/common.jl new file mode 100644 index 000000000000..6c6d8fdb1fd7 --- /dev/null +++ b/test/unittest/common.jl @@ -0,0 +1,10 @@ +################################################################################ +# Common models used in testing +################################################################################ +function mlp2() + data = mx.variable(:data) + out = mx.FullyConnected(data=data, name=:fc1, num_hidden=1000) + out = mx.Activation(data=out, act_type=:relu) + out = mx.FullyConnected(data=out, name=:fc2, num_hidden=10) + return out +end diff --git a/test/unittest/symbol.jl b/test/unittest/symbol.jl new file mode 100644 index 000000000000..5ea8ae7e766b --- /dev/null +++ b/test/unittest/symbol.jl @@ -0,0 +1,39 @@ +module TestSymbol +using MXNet +using Base.Test + +using ..Main: mlp2 + +################################################################################ +# Test Implementations +################################################################################ +function test_basic() + info("Symbol::basic") + + model = mlp2() + @test mx.list_arguments(model) == [:data,:fc1_weight,:fc1_bias,:fc2_weight,:fc2_bias] + @test mx.list_outputs(model) == [:fc2_output] + @test mx.list_auxiliary_states(model) == Symbol[] +end + +function test_internal() + info("Symbol::internal") + + data = mx.variable(:data) + oldfc = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) + net1 = mx.FullyConnected(data=oldfc, name=:fc2, num_hidden=100) + + @test mx.list_arguments(net1) == [:data,:fc1_weight,:fc1_bias,:fc2_weight,:fc2_bias] + + internal = mx.get_internals(net1) + fc1 = internal[:fc1_output] + @test mx.list_arguments(fc1) == mx.list_arguments(oldfc) +end + +################################################################################ +# Run tests +################################################################################ +test_basic() +test_internal() + +end From 
320706fe7a86c8303c3dafc21eadad0d16abe513 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 8 Oct 2015 20:10:37 -0400 Subject: [PATCH 042/630] symbol test_compose --- src/symbol.jl | 10 ++++++++++ test/unittest/symbol.jl | 17 +++++++++++++++++ 2 files changed, 27 insertions(+) diff --git a/src/symbol.jl b/src/symbol.jl index 191398d9de25..878c472f7ff5 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -66,12 +66,22 @@ function get_internals(self :: Symbol) return Symbol(MX_SymbolHandle(ref_hdr[])) end +"Create a symbolic variable with the given name" function variable(name :: Union{Base.Symbol, AbstractString}) hdr_ref = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) Symbol(MX_SymbolHandle(hdr_ref[])) end +"Create a symbol that groups symbols together" +function group(symbols :: Symbol...) + handles = MX_handle[symbols...] + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXSymbolCreateGroup, (MX_uint, Ptr{MX_handle}, Ref{MX_handle}), + length(handles), handles, ref_hdr) + Symbol(MX_SymbolHandle(ref_hdr[])) +end + function Base.getindex(self :: Symbol, idx :: Union{Base.Symbol, AbstractString}) idx = symbol(idx) i_idx = find(idx .== list_outputs(self)) diff --git a/test/unittest/symbol.jl b/test/unittest/symbol.jl index 5ea8ae7e766b..9506b559a170 100644 --- a/test/unittest/symbol.jl +++ b/test/unittest/symbol.jl @@ -30,10 +30,27 @@ function test_internal() @test mx.list_arguments(fc1) == mx.list_arguments(oldfc) end +function test_compose() + info("Symbol::compose") + + data = mx.variable(:data) + net1 = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) + net1 = mx.FullyConnected(data=net1, name=:fc2, num_hidden=100) + + net2 = mx.FullyConnected(name=:fc3, num_hidden=10) + net2 = mx.Activation(data=net2, act_type=:relu) + net2 = mx.FullyConnected(data=net2, name=:fc4, num_hidden=20) + + composed = net2(fc3_data=net1, name=:composed) + multi_out = mx.group(composed, net1) + @test mx.list_outputs(multi_out) == 
[:composed_output, :fc2_output] +end + ################################################################################ # Run tests ################################################################################ test_basic() test_internal() +test_compose() end From 631a965167982ecfd833834567c1b09340943080 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 9 Oct 2015 00:31:27 -0400 Subject: [PATCH 043/630] test infer shape --- src/symbol.jl | 64 +++++++++++++++++++++++++++++++++++++++++ test/unittest/symbol.jl | 13 +++++++++ 2 files changed, 77 insertions(+) diff --git a/src/symbol.jl b/src/symbol.jl index 878c472f7ff5..e11754e2eeaa 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -82,6 +82,70 @@ function group(symbols :: Symbol...) Symbol(MX_SymbolHandle(ref_hdr[])) end +macro _infer_shape(self, keys, indptr, sdata) + quote + ref_arg_shape_size = Ref{MX_uint}(0) + ref_arg_shape_ndim = Ref{Ptr{MX_uint}}(0) + ref_arg_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) + ref_out_shape_size = Ref{MX_uint}(0) + ref_out_shape_ndim = Ref{Ptr{MX_uint}}(0) + ref_out_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) + ref_aux_shape_size = Ref{MX_uint}(0) + ref_aux_shape_ndim = Ref{Ptr{MX_uint}}(0) + ref_aux_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) + ref_complete = Ref{Cint}(0) + @mxcall(:MXSymbolInferShape, + (MX_handle, MX_uint, char_pp, Ptr{MX_uint}, Ptr{MX_uint}, + Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, + Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, + Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, + Ref{Cint}), + self, length(indptr)-1, keys, indptr, sdata, + ref_arg_shape_size, ref_arg_shape_ndim, ref_arg_shape_data, + ref_out_shape_size, ref_out_shape_ndim, ref_out_shape_data, + ref_aux_shape_size, ref_aux_shape_ndim, ref_aux_shape_data, + ref_complete) + if ref_complete[] == 0 + return (nothing, nothing, nothing) + else + function build_shapes(shape_size::MX_uint, shape_ndim::Ptr{MX_uint}, shape_data::Ptr{Ptr{MX_uint}}) + shape_ndim = 
pointer_to_array(shape_ndim, shape_size) + shape_data = pointer_to_array(shape_data, shape_size) + map(1:shape_size) do i + my_shape = pointer_to_array(shape_data[i], shape_ndim[i]) + tuple(Int[my_shape...]...) + end + end + return ( + build_shapes(ref_arg_shape_size[], ref_arg_shape_ndim[], ref_arg_shape_data[]), + build_shapes(ref_out_shape_size[], ref_out_shape_ndim[], ref_out_shape_data[]), + build_shapes(ref_aux_shape_size[], ref_aux_shape_ndim[], ref_aux_shape_data[]) + ) + end + end +end +function infer_shape(self :: Symbol; kwargs...) + sdata = MX_uint[] + indptr = MX_uint[0] + for (k,v) in kwargs + append!(sdata, [v...]) + push!(indptr, length(sdata)) + end + keys = AbstractString[string(x[1]) for x in kwargs] + @_infer_shape(self, keys, indptr, sdata) +end +function infer_shape(self :: Symbol, args :: Union{Tuple, Void}...) + sdata = MX_uint[] + indptr = MX_uint[0] + for arg in args + if isa(arg, Void); continue; end + append!(sdata, [arg...]) + push!(indptr, length(sdata)) + end + keys = Ptr{char_p}(0) + @_infer_shape(self, keys, indptr, sdata) +end + function Base.getindex(self :: Symbol, idx :: Union{Base.Symbol, AbstractString}) idx = symbol(idx) i_idx = find(idx .== list_outputs(self)) diff --git a/test/unittest/symbol.jl b/test/unittest/symbol.jl index 9506b559a170..cd6cdad1b10a 100644 --- a/test/unittest/symbol.jl +++ b/test/unittest/symbol.jl @@ -46,11 +46,24 @@ function test_compose() @test mx.list_outputs(multi_out) == [:composed_output, :fc2_output] end +function test_infer_shape() + info("Symbol::infer_shape::mlp2") + + model = mlp2() + data_shape = (100, 100) + arg_shapes, out_shapes, aux_shapes = mx.infer_shape(model, data=data_shape) + arg_shape_dict = Dict{Symbol,Tuple}(zip(mx.list_arguments(model), arg_shapes)) + @test arg_shape_dict == Dict{Symbol,Tuple}(:fc2_bias => (10,),:fc2_weight => (10,1000), + :fc1_bias => (1000,), :fc1_weight => (1000,100), + :data => data_shape) +end + 
################################################################################ # Run tests ################################################################################ test_basic() test_internal() test_compose() +test_infer_shape() end From fca478978b59feba681c86c2d1e634b589b624d7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 9 Oct 2015 00:46:12 -0400 Subject: [PATCH 044/630] test infer_shape with error --- test/unittest/symbol.jl | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/test/unittest/symbol.jl b/test/unittest/symbol.jl index cd6cdad1b10a..aa5a18be099f 100644 --- a/test/unittest/symbol.jl +++ b/test/unittest/symbol.jl @@ -56,8 +56,20 @@ function test_infer_shape() @test arg_shape_dict == Dict{Symbol,Tuple}(:fc2_bias => (10,),:fc2_weight => (10,1000), :fc1_bias => (1000,), :fc1_weight => (1000,100), :data => data_shape) + @test length(out_shapes) == 1 + @test out_shapes[1] == (100, 10) end +function test_infer_shape_error() + info("Symbol::infer_shape::error") + + model = mlp2() + weight_shape = (1, 100) + data_shape = (100, 100) + @test_throws mx.MXError mx.infer_shape(model, data=data_shape, fc1_weight=weight_shape) +end + + ################################################################################ # Run tests ################################################################################ @@ -65,5 +77,6 @@ test_basic() test_internal() test_compose() test_infer_shape() +test_infer_shape_error() end From c05e6a5d3c1b2782b2ee531260e184b2c1d36b01 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 9 Oct 2015 09:09:19 -0400 Subject: [PATCH 045/630] try out julia v0.4 precompilation --- src/MXNet.jl | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/MXNet.jl b/src/MXNet.jl index 02cda42fbd25..b516908b56f3 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -1,3 +1,5 @@ +__precompile__() + module MXNet # we put everything in the namespace mx, because there are a lot of From dd1922d2b8a20c0155d4d361725e8314c8e5649a Mon 
Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 9 Oct 2015 14:26:58 -0400 Subject: [PATCH 046/630] executor --- src/MXNet.jl | 1 + src/executor.jl | 86 +++++++++++++++++++++++++++++++++++++++++++++++++ src/init.jl | 1 + 3 files changed, 88 insertions(+) create mode 100644 src/executor.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index b516908b56f3..22c3623dd166 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -13,6 +13,7 @@ include("context.jl") include("ndarray.jl") include("name.jl") include("symbol.jl") +include("executor.jl") end # mx diff --git a/src/executor.jl b/src/executor.jl new file mode 100644 index 000000000000..aa515c53e694 --- /dev/null +++ b/src/executor.jl @@ -0,0 +1,86 @@ +type Executor + handle :: MX_ExecutorHandle + symbol :: Symbol + arg_arrays :: Vector{NDArray} + grad_arrays :: Vector{Union{Void,NDArray}} + aux_arrays :: Vector{NDArray} + out_arrays :: Vector{NDArray} +end +function Executor(hdr :: MX_ExecutorHandle, symbol :: Symbol, + arg_arrays :: Vector{NDArray}, grad_arrays :: Vector{Union{Void,NDArray}}, + aux_arrays :: Vector{NDArray}) + # get output arrays + ref_size = Ref{MX_uint} + ref_hdrs = Ref{Ptr{MX_handle}} + @mxcall(:MXExecutorOutputs, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_handle}}), + hdr, ref_size, ref_hdrs) + out_hdrs = pointer_to_array(ref_hdrs[], ref_size[]) + out_arrays = [NDArray(MX_NDArrayHandle(x)) for x in out_hdrs] + + Executor(hdr, symbol, arg_arrays, grad_arrays, aux_arrays, out_arrays) +end + +function Base.unsafe_convert(::Type{MX_handle}, obj::Executor) + Base.unsafe_convert(MX_handle, obj.handle) +end +Base.convert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) +Base.cconvert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) + +@enum GRAD_REQ GRAD_NULL=0 GRAD_WRITE=1 GRAD_ADD=3 +function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; + args_grad :: Union{Void,Vector{NDArray},Dict{Base.Symbol,NDArray}} = nothing, + aux_states :: 
Union{Void,Vector{NDArray},Dict{Base.Symbol,NDArray}} = nothing, + grad_req :: Union{GRAD_REQ,Vector{GRAD_REQ},Dict{Base.Symbol,GRAD_REQ}} = GRAD_WRITE) + + function get_ndarray_inputs(arg_key::String, args::Vector{NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) + @assert(length(args) == length(arg_names), "Length of $arg_key does not match number of arguments") + return (MX_handle[args...], args) + end + function get_ndarray_inputs(arg_key::String, args::Dict{Base.Symbol,NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) + args_vec = map(arg_names) do name + arr = get(args, name, nothing) + if !allow_missing + @assert(!isa(arr, Void), "Must specify all arguments in $arg_key ($name is missing)") + end + arr + end + args_hdr = MX_handle[(isa(x,Void) ? MX_handle(0) : x) for x in args_vec] + return (args_hdr, args_vec) + end + + arg_names = list_arguments(self) + + args_hdr, args = get_ndarray_inputs("args", args, arg_names, false) + if isa(args_grad, Void) + args_grad_hdr = MX_handle[Ptr{Void}(0) for i=1:length(args)] + else + args_grad_hdr, args_grad = get_ndarray_inputs("args_grad", args_grad, arg_names, true) + end + + if isa(aux_states, Void); aux_states = NDArray[]; end + aux_args_hdr, aux_states = get_ndarray_inputs("aux_states", aux_states, list_auxiliary_states(self), false) + + if isa(grad_req, GRAD_REQ) + reqs = MX_uint[grad_req for i=1:length(args)] + elseif isa(grad_req, Vector{GRAD_REQ}) + @assert(length(grad_req) == length(args)) + reqs = MX_uint[grad_req...] 
+ elseif isa(grad_req, Dict{Base.Symbol, GRAD_REQ}) + reqs = MX_uint[get(grad_req, name, GRAD_NULL) for name in arg_names] + end + + ref_hdr = Ref{MX_handle} + @mxcall(:MXExecutorBind, + (MX_handle, Cint, Cint, MX_uint, Ptr{MX_handle}, Ptr{MX_handle}, Ptr{MX_uint}, + MX_uint, Ptr{MX_handle}, Ref{MX_handle}), + self, ctx.device_type, ctx.device_id, length(args), args_hdr, + args_grad_hdr, reqs, length(aux_states), uax_args_hdr, ref_hdr) + executor = Executor(MX_ExecutorHandle(ref_hdr[]), self, + args, args_grad, aux_states) +end + + +function forward(self :: Executor; is_train::Bool=false, kwargs...) + # TODO: kwargs + @mxcall(:MXExecutorForward, (MX_handle, Cint), self, is_train) +end diff --git a/src/init.jl b/src/init.jl index 31ab5436c6cc..3385e8dc403f 100644 --- a/src/init.jl +++ b/src/init.jl @@ -96,4 +96,5 @@ end @mx_define_handle_t(MX_NDArrayHandle, MXNDArrayFree) @mx_define_handle_t(MX_FunctionHandle, nop) @mx_define_handle_t(MX_SymbolHandle, MXSymbolFree) +@mx_define_handle_t(MX_ExecutorHandle, MXExecutorFree) From 0a04f25bdb8a7446c51368ddf96de9c5f905b6a3 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 9 Oct 2015 23:11:46 -0400 Subject: [PATCH 047/630] executor bind forward --- src/executor.jl | 69 +++++++++++++++++++++++++--------------- src/ndarray.jl | 4 +++ src/symbol.jl | 53 ++++++++++++++++++++++++++++-- test/runtests.jl | 1 + test/unittest/common.jl | 11 +++++++ test/unittest/ndarray.jl | 11 ++----- 6 files changed, 111 insertions(+), 38 deletions(-) diff --git a/src/executor.jl b/src/executor.jl index aa515c53e694..8a42309e74a5 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -4,20 +4,30 @@ type Executor arg_arrays :: Vector{NDArray} grad_arrays :: Vector{Union{Void,NDArray}} aux_arrays :: Vector{NDArray} - out_arrays :: Vector{NDArray} + outputs :: Vector{NDArray} + arg_dict :: Dict{Base.Symbol, NDArray} + aux_dict :: Dict{Base.Symbol, NDArray} end function Executor(hdr :: MX_ExecutorHandle, symbol :: Symbol, arg_arrays :: 
Vector{NDArray}, grad_arrays :: Vector{Union{Void,NDArray}}, aux_arrays :: Vector{NDArray}) # get output arrays - ref_size = Ref{MX_uint} - ref_hdrs = Ref{Ptr{MX_handle}} + ref_size = Ref{MX_uint}(0) + ref_hdrs = Ref{Ptr{MX_handle}}(0) @mxcall(:MXExecutorOutputs, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_handle}}), hdr, ref_size, ref_hdrs) out_hdrs = pointer_to_array(ref_hdrs[], ref_size[]) out_arrays = [NDArray(MX_NDArrayHandle(x)) for x in out_hdrs] - Executor(hdr, symbol, arg_arrays, grad_arrays, aux_arrays, out_arrays) + arg_names = list_arguments(symbol) + @assert(length(arg_names) == length(unique(arg_names)), "Duplicated names in arguments: $arg_names") + arg_dict = Dict{Base.Symbol,NDArray}(zip(arg_names, arg_arrays)) + + aux_names = list_auxiliary_states(symbol) + @assert(length(aux_names) == length(unique(aux_names)), "Duplicated names in auxiliary states: $aux_names") + aux_dict = Dict{Base.Symbol,NDArray}(zip(aux_names, aux_arrays)) + + Executor(hdr, symbol, arg_arrays, grad_arrays, aux_arrays, out_arrays, arg_dict, aux_dict) end function Base.unsafe_convert(::Type{MX_handle}, obj::Executor) @@ -26,39 +36,40 @@ end Base.convert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) Base.cconvert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) +function _get_ndarray_inputs(arg_key::AbstractString, args::Vector{NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) + @assert(length(args) == length(arg_names), "Length of $arg_key does not match number of arguments") + return (MX_handle[args...], args) +end +function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) + args_vec = map(arg_names) do name + arr = get(args, name, nothing) + if !allow_missing + @assert(!isa(arr, Void), "Must specify all arguments in $arg_key ($name is missing)") + end + arr + end + args_hdr = MX_handle[(isa(x,Void) ? 
MX_handle(0) : x) for x in args_vec] + return (args_hdr, args_vec) +end + @enum GRAD_REQ GRAD_NULL=0 GRAD_WRITE=1 GRAD_ADD=3 function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; args_grad :: Union{Void,Vector{NDArray},Dict{Base.Symbol,NDArray}} = nothing, aux_states :: Union{Void,Vector{NDArray},Dict{Base.Symbol,NDArray}} = nothing, grad_req :: Union{GRAD_REQ,Vector{GRAD_REQ},Dict{Base.Symbol,GRAD_REQ}} = GRAD_WRITE) - function get_ndarray_inputs(arg_key::String, args::Vector{NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) - @assert(length(args) == length(arg_names), "Length of $arg_key does not match number of arguments") - return (MX_handle[args...], args) - end - function get_ndarray_inputs(arg_key::String, args::Dict{Base.Symbol,NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) - args_vec = map(arg_names) do name - arr = get(args, name, nothing) - if !allow_missing - @assert(!isa(arr, Void), "Must specify all arguments in $arg_key ($name is missing)") - end - arr - end - args_hdr = MX_handle[(isa(x,Void) ? 
MX_handle(0) : x) for x in args_vec] - return (args_hdr, args_vec) - end - arg_names = list_arguments(self) - args_hdr, args = get_ndarray_inputs("args", args, arg_names, false) + args_hdr, args = _get_ndarray_inputs("args", args, arg_names, false) if isa(args_grad, Void) + args_grad = [nothing for i=1:length(args)] args_grad_hdr = MX_handle[Ptr{Void}(0) for i=1:length(args)] else - args_grad_hdr, args_grad = get_ndarray_inputs("args_grad", args_grad, arg_names, true) + args_grad_hdr, args_grad = _get_ndarray_inputs("args_grad", args_grad, arg_names, true) end if isa(aux_states, Void); aux_states = NDArray[]; end - aux_args_hdr, aux_states = get_ndarray_inputs("aux_states", aux_states, list_auxiliary_states(self), false) + aux_args_hdr, aux_states = _get_ndarray_inputs("aux_states", aux_states, list_auxiliary_states(self), false) if isa(grad_req, GRAD_REQ) reqs = MX_uint[grad_req for i=1:length(args)] @@ -69,18 +80,24 @@ function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict reqs = MX_uint[get(grad_req, name, GRAD_NULL) for name in arg_names] end - ref_hdr = Ref{MX_handle} + ref_hdr = Ref{MX_handle}(0) @mxcall(:MXExecutorBind, (MX_handle, Cint, Cint, MX_uint, Ptr{MX_handle}, Ptr{MX_handle}, Ptr{MX_uint}, MX_uint, Ptr{MX_handle}, Ref{MX_handle}), self, ctx.device_type, ctx.device_id, length(args), args_hdr, - args_grad_hdr, reqs, length(aux_states), uax_args_hdr, ref_hdr) + args_grad_hdr, reqs, length(aux_states), aux_args_hdr, ref_hdr) + args_grad = convert(Vector{Union{Void,NDArray}}, args_grad) executor = Executor(MX_ExecutorHandle(ref_hdr[]), self, args, args_grad, aux_states) end function forward(self :: Executor; is_train::Bool=false, kwargs...) 
- # TODO: kwargs + for (k,v) in kwargs + @assert(k ∈ self.arg_dict, "Unknown argument $k") + @assert(isa(v, NDArray), "Keyword argument $k must be an NDArray") + copy!(self.arg_dict[k], v) + end + @mxcall(:MXExecutorForward, (MX_handle, Cint), self, is_train) end diff --git a/src/ndarray.jl b/src/ndarray.jl index 4d6bd5407eaa..035f465fa230 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -30,6 +30,10 @@ type NDArray end end +function NDArray{T<:Real}(data :: Array{T}) + copy(data, mx.DEFAULT_CONTEXT) +end + function Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) Base.unsafe_convert(MX_handle, obj.handle) end diff --git a/src/symbol.jl b/src/symbol.jl index e11754e2eeaa..d8f45cb1f9eb 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -160,6 +160,40 @@ function Base.getindex(self :: Symbol, idx :: Int) return Symbol(MX_SymbolHandle(ref_hdr[])) end +import Base: +, .+ +function +(self :: Symbol, args :: Symbol...) + ret = self + for arg in args + ret = _Plus(ret, arg) + end + ret +end +function .+(self :: Symbol, args :: Symbol...) + +(self, args...) +end + +import Base: -, .- +function -(self :: Symbol, arg :: Symbol) + _Minus(self, arg) +end +function .-(self :: Symbol, arg :: Symbol) + -(self, arg) +end + +import Base: .* +function .*(self :: Symbol, args :: Symbol...) + ret = self + for arg in args + ret = _Mul(ret, arg) + end + ret +end + +import Base: ./ +function ./(self :: Symbol, arg :: Symbol) + _Div(self, arg) +end + "Compose symbol on inputs" function _compose!(sym :: Symbol; kwargs...) name = char_p(0) @@ -182,16 +216,25 @@ function _compose!(sym :: Symbol; kwargs...) return sym end function _compose!(sym :: Symbol, args::Symbol...) - name = char_p(0) + _compose!(sym, char_p(0), args...) +end +function _compose!(sym :: Symbol, name :: Union{Base.Symbol, char_p}, args::Symbol...) + if isa(name, Base.Symbol); name = string(name); end arg_keys = Ptr{char_p}(0) arg_vals = MX_handle[args...] 
@mxcall(:MXSymbolCompose, (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}), - sym, name, length(arg_keys), arg_keys, arg_vals) + sym, name, length(arg_vals), arg_keys, arg_vals) return sym end +function to_json(self :: Symbol) + ref_json = Ref{char_p}(0) + @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json) + return bytestring(ref_json[]) +end + ################################################################################ # Atomic Symbol functions dynamically imported from libmxnet ################################################################################ @@ -268,7 +311,11 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) hint = lowercase(string($func_name)) name = get!(DEFAULT_NAME_MANAGER, name, hint) - _compose!(sym; name=name, symbol_kws...) + if length(args) != 0 + _compose!(sym, name, args...) + else + _compose!(sym; name=name, symbol_kws...) + end return sym end diff --git a/test/runtests.jl b/test/runtests.jl index d3c8684cbee8..b328f2c8f565 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -6,4 +6,5 @@ include("unittest/common.jl") include("unittest/ndarray.jl") include("unittest/name.jl") include("unittest/symbol.jl") +include("unittest/bind.jl") diff --git a/test/unittest/common.jl b/test/unittest/common.jl index 6c6d8fdb1fd7..51dc1ed43ec4 100644 --- a/test/unittest/common.jl +++ b/test/unittest/common.jl @@ -1,6 +1,16 @@ ################################################################################ # Common models used in testing ################################################################################ +function reldiff(a, b) + diff = sum(abs(a - b)) + norm = sum(abs(a)) + return diff / (norm + 1e-10) +end + +function rand_dims(max_ndim=6) + tuple(rand(1:10, rand(1:max_ndim))...) 
+end + function mlp2() data = mx.variable(:data) out = mx.FullyConnected(data=data, name=:fc1, num_hidden=1000) @@ -8,3 +18,4 @@ function mlp2() out = mx.FullyConnected(data=out, name=:fc2, num_hidden=10) return out end + diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 15a3fea334ed..0d8b3aed0b3c 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -2,18 +2,11 @@ module TestNDArray using MXNet using Base.Test +using ..Main: rand_dims, reldiff + ################################################################################ # Test Implementations ################################################################################ -function reldiff(a, b) - diff = sum(abs(a - b)) - norm = sum(abs(a)) - return diff / (norm + 1e-10) -end - -function rand_dims() - tuple(rand(1:10, rand(1:6))...) -end function rand_tensors{N}(dims::NTuple{N, Int}) tensor = rand(mx.MX_float, dims) array = copy(tensor, mx.DEFAULT_CONTEXT) From 2074d12c776ad2d8277225b175c49c2892cb4db7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 9 Oct 2015 23:20:05 -0400 Subject: [PATCH 048/630] executor backward --- src/executor.jl | 11 +++++++ test/unittest/bind.jl | 70 +++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 81 insertions(+) create mode 100644 test/unittest/bind.jl diff --git a/src/executor.jl b/src/executor.jl index 8a42309e74a5..249a5684d16e 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -101,3 +101,14 @@ function forward(self :: Executor; is_train::Bool=false, kwargs...) @mxcall(:MXExecutorForward, (MX_handle, Cint), self, is_train) end + +function backward(self :: Executor) + backward(self, NDArray[]) +end +function backward(self :: Executor, out_grad :: NDArray) + backward(self, [out_grad]) +end +function backward(self :: Executor, out_grads :: Vector{NDArray}) + out_grads = MX_handle[out_grads...] 
+ @mxcall(:MXExecutorBackward, (MX_handle, MX_uint, Ptr{MX_handle}), self, length(out_grads), out_grads) +end diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl new file mode 100644 index 000000000000..9f480f3f20f3 --- /dev/null +++ b/test/unittest/bind.jl @@ -0,0 +1,70 @@ +module TestBind +using MXNet +using Base.Test + +using ..Main: rand_dims, reldiff + +################################################################################ +# Test Implementations +################################################################################ +function test_arithmetic(uf, gf) + shape = rand_dims() + info("Bind::arithmetic::$uf::dims = $shape") + + lhs = mx.variable(:lhs) + rhs = mx.variable(:rhs) + ret = uf(lhs, rhs) + @test mx.list_arguments(ret) == [:lhs, :rhs] + + lhs_arr = mx.NDArray(rand(shape)) + rhs_arr = mx.NDArray(rand(shape)) + lhs_grad = mx.empty(shape) + rhs_grad = mx.empty(shape) + + exec2 = mx.bind(ret, mx.Context(mx.CPU), [lhs_arr, rhs_arr], args_grad=[lhs_grad, rhs_grad]) + exec3 = mx.bind(ret, mx.Context(mx.CPU), [lhs_arr, rhs_arr]) + exec4 = mx.bind(ret, mx.Context(mx.CPU), Dict(:lhs=>lhs_arr, :rhs=>rhs_arr), + args_grad=Dict(:rhs=>rhs_grad, :lhs=>lhs_grad)) + + mx.forward(exec2) + mx.forward(exec3) + mx.forward(exec4) + + out1 = uf(copy(lhs_arr), copy(rhs_arr)) + out2 = copy(exec2.outputs[1]) + out3 = copy(exec3.outputs[1]) + out4 = copy(exec4.outputs[1]) + @test reldiff(out1, out2) < 1e-6 + @test reldiff(out1, out3) < 1e-6 + @test reldiff(out1, out4) < 1e-6 + + # test gradients + out_grad = mx.NDArray(ones(shape)) + lhs_grad2, rhs_grad2 = gf(copy(out_grad), copy(lhs_arr), copy(rhs_arr)) + mx.backward(exec2, out_grad) + @test reldiff(copy(lhs_grad), lhs_grad2) < 1e-6 + @test reldiff(copy(rhs_grad), rhs_grad2) < 1e-6 + + # reset grads + lhs_grad[:] = 0 + rhs_grad[:] = 0 + # compute using another binding + mx.backward(exec4, out_grad) + @test reldiff(copy(lhs_grad), lhs_grad2) < 1e-6 + @test reldiff(copy(rhs_grad), rhs_grad2) < 1e-6 +end + 
+function test_arithmetic() + test_arithmetic(.+, (g,x,y) -> (g,g)) + test_arithmetic(.-, (g,x,y) -> (g,-g)) + test_arithmetic(.*, (g,x,y) -> (y.*g, x.*g)) + test_arithmetic(./, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) +end + +################################################################################ +# Run tests +################################################################################ +test_arithmetic() + +end + From 6dc48bbf13f97c71d157f44534ea30626cfb2338 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 11 Oct 2015 19:49:17 -0400 Subject: [PATCH 049/630] simple_bind --- src/executor.jl | 25 +++++++++++++++++++++++-- test/unittest/symbol.jl | 2 +- 2 files changed, 24 insertions(+), 3 deletions(-) diff --git a/src/executor.jl b/src/executor.jl index 249a5684d16e..96c379a1bd25 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -52,7 +52,7 @@ function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDA return (args_hdr, args_vec) end -@enum GRAD_REQ GRAD_NULL=0 GRAD_WRITE=1 GRAD_ADD=3 +@enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; args_grad :: Union{Void,Vector{NDArray},Dict{Base.Symbol,NDArray}} = nothing, aux_states :: Union{Void,Vector{NDArray},Dict{Base.Symbol,NDArray}} = nothing, @@ -77,7 +77,7 @@ function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict @assert(length(grad_req) == length(args)) reqs = MX_uint[grad_req...] elseif isa(grad_req, Dict{Base.Symbol, GRAD_REQ}) - reqs = MX_uint[get(grad_req, name, GRAD_NULL) for name in arg_names] + reqs = MX_uint[get(grad_req, name, GRAD_NOP) for name in arg_names] end ref_hdr = Ref{MX_handle}(0) @@ -91,6 +91,27 @@ function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict args, args_grad, aux_states) end +function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) 
+ arg_shapes, grad_shapes, aux_shapes = infer_shape(self; kwargs...) + @assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") + + arg_arrays = NDArray[zeros(shape, ctx) for shape in arg_shapes] + if grad_req == GRAD_NOP + grad_arrays = nothing + else + grad_arrays = Dict{Base.Symbol, NDArray} + for (name, shape) in zip(list_arguments(self), grad_shapes) + # TODO: use a better way to identify data + if !(endswith(string(name), "data") || endswith(string(name), "label")) + grad_arrays[name] = zeros(shape, ctx) + end + end + end + + aux_arrays = [zeros(shape, ctx) for shape in aux_shapes] + return bind(self, ctx, arg_ndarrays, grad_arrays, grad_req, aux_arrays) +end + function forward(self :: Executor; is_train::Bool=false, kwargs...) for (k,v) in kwargs diff --git a/test/unittest/symbol.jl b/test/unittest/symbol.jl index aa5a18be099f..9fa11789701f 100644 --- a/test/unittest/symbol.jl +++ b/test/unittest/symbol.jl @@ -61,7 +61,7 @@ function test_infer_shape() end function test_infer_shape_error() - info("Symbol::infer_shape::error") + info("Symbol::infer_shape::throws") model = mlp2() weight_shape = (1, 100) From 9dd26e5ef5d10933bd4a7b440db740fc0dba6cb7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 11 Oct 2015 21:07:40 -0400 Subject: [PATCH 050/630] random module --- src/MXNet.jl | 2 ++ src/random.jl | 19 ++++++++++++++++++ test/runtests.jl | 2 ++ test/unittest/random.jl | 43 +++++++++++++++++++++++++++++++++++++++++ 4 files changed, 66 insertions(+) create mode 100644 src/random.jl create mode 100644 test/unittest/random.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index 22c3623dd166..195ebfd52cb9 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -11,6 +11,8 @@ include("init.jl") include("context.jl") include("ndarray.jl") +include("random.jl") + include("name.jl") include("symbol.jl") include("executor.jl") diff --git a/src/random.jl b/src/random.jl new file mode 100644 index 000000000000..82b0aea97582 --- /dev/null +++ 
b/src/random.jl @@ -0,0 +1,19 @@ +function rand!(low::Real, high::Real, out::NDArray) + _random_uniform(low, high, out) +end +function rand(low::Real, high::Real, shape::Tuple, ctx::Context=DEFAULT_CONTEXT) + out = empty(shape, ctx) + rand!(low, high, out) +end + +function randn!(mean::Real, stdvar::Real, out::NDArray) + _random_gaussian(mean, stdvar, out) +end +function randn(mean::Real, stdvar::Real, shape::Tuple, ctx::Context=DEFAULT_CONTEXT) + out = empty(shape, ctx) + randn!(mean, stdvar, out) +end + +function srand!(seed_state::Int) + @mxcall(:MXRandomSeed, (Cint,), seed_state) +end diff --git a/test/runtests.jl b/test/runtests.jl index b328f2c8f565..ebed98227084 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -4,6 +4,8 @@ using Base.Test include("unittest/common.jl") include("unittest/ndarray.jl") +include("unittest/random.jl") + include("unittest/name.jl") include("unittest/symbol.jl") include("unittest/bind.jl") diff --git a/test/unittest/random.jl b/test/unittest/random.jl new file mode 100644 index 000000000000..5328aff26906 --- /dev/null +++ b/test/unittest/random.jl @@ -0,0 +1,43 @@ +module TestRandom +using MXNet +using Base.Test + +function test_uniform() + dims = (100, 100, 2) + info("random::uniform::dims = $dims") + + low = -10; high = 10 + seed = 123 + mx.srand!(seed) + ret1 = mx.rand(low, high, dims) + + mx.srand!(seed) + ret2 = mx.empty(dims) + mx.rand!(low, high, ret2) + + @test copy(ret1) == copy(ret2) + @test abs(mean(copy(ret1)) - (high+low)/2) < 0.1 +end + +function test_gaussian() + dims = (80, 80, 4) + info("random::gaussian::dims = $dims") + + μ = 10; σ = 2 + seed = 456 + mx.srand!(seed) + ret1 = mx.randn(μ, σ, dims) + + mx.srand!(seed) + ret2 = mx.empty(dims) + mx.randn!(μ, σ, ret2) + + @test copy(ret1) == copy(ret2) + @test abs(mean(copy(ret1)) - μ) < 0.1 + @test abs(std(copy(ret1)) - σ) < 0.1 +end + +test_uniform() +test_gaussian() + +end From 357a105cdff45c9b58bcbd9b8fdb146bfe67198e Mon Sep 17 00:00:00 2001 From: Chiyuan 
Zhang Date: Sun, 11 Oct 2015 21:14:14 -0400 Subject: [PATCH 051/630] default initializers --- src/initializer.jl | 62 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 62 insertions(+) create mode 100644 src/initializer.jl diff --git a/src/initializer.jl b/src/initializer.jl new file mode 100644 index 000000000000..fcc353502b1b --- /dev/null +++ b/src/initializer.jl @@ -0,0 +1,62 @@ +abstract AbstractInitializer + +function call(self :: AbstractInitializer, name :: Symbol, array :: NDArray) + name = string(name) + if endswith(name, "bias") + _init_bias(self, name, array) + elseif endswith(name, "gamma") + _init_gamma(self, name, array) + elseif endswith(name, "beta") + _init_beta(self, name, array) + elseif endswith(name, "weight") + _init_weight(self, name, array) + elseif endswith(name, "moving_mean") + _init_zero(self, name, array) + elseif endswith(name, "moving_var") + _init_zero(self, name, array) + else + _init_default(self, name, array) + end +end + +function _init_bias(self :: AbstractInitializer, name :: Symbol, array :: NDArray) + array[:] = 0 +end +function _init_gamma(self :: AbstractInitializer, name :: Symbol, array :: NDArray) + array[:] = 1 +end +function _init_beta(self :: AbstractInitializer, name :: Symbol, array :: NDArray) + array[:] = 0 +end +function _init_zero(self :: AbstractInitializer, name :: Symbol, array :: NDArray) + array[:] = 0 +end + +immutable UniformInitializer <: AbstractInitializer + scale :: AbstractFloat +end +UniformInitializer() = UniformInitializer(0.07) + +function _init_weight(self :: UniformInitializer, name :: Symbol, array :: NDArray) + rand!(-self.scale, self.scale, array) +end + +immutable NormalInitializer <: AbstractInitializer + μ :: AbstractFloat + σ :: AbstractFloat +end +NormalInitializer(; μ=0, σ=0.01) = NormalInitializer(μ, σ) + +function _init_weight(self :: NormalInitializer, name :: Symbol, array :: NDArray) + randn!(self.μ, self.σ, array) +end + +immutable XaiverInitializer <: 
AbstractInitializer +end +function _init_weight(self :: NormalInitializer, name :: Symbol, array :: NDArray) + dims = size(array) + fan_in = prod(dims[2:end]) + fan_out = dims[1] + scale = sqrt(3 / (fan_in + fan_out)) + rand!(-scale, scale, array) +end From f3e4e95321cebdcfff4d12ce39ea066723953a89 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 12 Oct 2015 22:19:18 -0400 Subject: [PATCH 052/630] non-unicode name for initializer parameters --- src/initializer.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/initializer.jl b/src/initializer.jl index fcc353502b1b..5a3dc5ef005c 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -45,7 +45,7 @@ immutable NormalInitializer <: AbstractInitializer μ :: AbstractFloat σ :: AbstractFloat end -NormalInitializer(; μ=0, σ=0.01) = NormalInitializer(μ, σ) +NormalInitializer(; mu=0, sigma=0.01) = NormalInitializer(mu, sigma) function _init_weight(self :: NormalInitializer, name :: Symbol, array :: NDArray) randn!(self.μ, self.σ, array) From 7f35875377033bdc21a7f84f87fa118002e36401 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 13 Oct 2015 21:16:24 -0400 Subject: [PATCH 053/630] make clear the meaning of row-major vs. 
column-major in array conversion --- src/MXNet.jl | 2 ++ src/init.jl | 3 ++- src/ndarray.jl | 38 ++++++++++++++++++++++++++++++++++++-- test/unittest/ndarray.jl | 8 ++++++++ 4 files changed, 48 insertions(+), 3 deletions(-) diff --git a/src/MXNet.jl b/src/MXNet.jl index 195ebfd52cb9..dee95f9f6115 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -17,6 +17,8 @@ include("name.jl") include("symbol.jl") include("executor.jl") +include("io.jl") + end # mx end # module MXNet diff --git a/src/init.jl b/src/init.jl index 3385e8dc403f..894edbf83bd8 100644 --- a/src/init.jl +++ b/src/init.jl @@ -23,6 +23,7 @@ const MXNET_LIB = Libdl.find_library(["libmxnet.so"], ["$(get(ENV,"MXNET_HOME"," function __init__() _import_ndarray_functions() _import_atomic_symbol_creators() + _import_io_iterators() atexit() do # notify libmxnet we are shutting down @@ -97,4 +98,4 @@ end @mx_define_handle_t(MX_FunctionHandle, nop) @mx_define_handle_t(MX_SymbolHandle, MXSymbolFree) @mx_define_handle_t(MX_ExecutorHandle, MXExecutorFree) - +@mx_define_handle_t(MX_DataIterHandle, MXDataIterFree) diff --git a/src/ndarray.jl b/src/ndarray.jl index 035f465fa230..527d53f21ac3 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -3,7 +3,7 @@ export NDArray # create a NDArray handle of specific shape function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) h_ref = Ref{MX_handle}(0) - shape = MX_uint[shape...] + shape = flipdim(MX_uint[shape...],1) @mxcall(:MXNDArrayCreate, (Ptr{MX_uint}, MX_uint, Cint, Cint, Cint, Ref{MX_handle}), shape, length(shape), ctx.device_type, ctx.device_id, delay_alloc, h_ref) handle = MX_NDArrayHandle(h_ref[]) @@ -21,6 +21,16 @@ end ################################################################################ # NDArray Type ################################################################################ +"""Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block + of tensor-based computation. 
+ + **Note** since C/C++ use row-major ordering for arrays while Julia follows a + column-major ordering. To keep things consistent, we keep the underlying data + in their original layout, but use *language-native* convention when we talk + about shapes. For example, a mini-batch of 100 MNIST images is a tensor of + C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory + have shape (28,28,1,100). +""" type NDArray handle :: MX_NDArrayHandle writable :: Bool @@ -62,12 +72,16 @@ end # Interface functions similar to Julia Arrays #------------------------------------------------------------ import Base: size, length, ndims, eltype +"""Get the shape of an `NDArray`. Note the shape is converted to Julia convention. + So the same piece of memory, in Julia (column-major), with shape (K, M, N), will be of the + shape (N, M, K) in the Python (row-major) binding. +""" function size(arr :: NDArray) ref_ndim = Ref{MX_uint}(0) ref_shape = Ref{Ptr{MX_uint}}(0) @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), arr, ref_ndim, ref_shape) - tuple(map(Int, pointer_to_array(ref_shape[], ref_ndim[]))...) + tuple(map(Int, flipdim(pointer_to_array(ref_shape[], ref_ndim[]),1))...) end function size(arr :: NDArray, dim :: Int) size(arr)[dim] @@ -92,6 +106,23 @@ function zeros(shape :: Int...) zeros(shape) end +import Base: sub +function sub(arr :: NDArray, ::Colon) + arr +end +function sub(arr :: NDArray, slice::UnitRange{Int}) + dim1 = size(arr)[end] + @assert(1 <= slice.start <= slice.stop <= dim1) + + hdr_ref = Ref{MX_handle}(0) + # note Julia is 1-based, inclusive-inclusive indexing, while C++ is + # 0-based, inclusive-exclusive indexing. So 1:3 in Julia should + # translates into 0:3 in C++. + @mxcall(:MXNDArraySlice, (MX_handle, MX_uint, MX_uint, Ref{MX_handle}), + arr, slice.start-1, slice.stop, hdr_ref) + return NDArray(MX_NDArrayHandle(hdr_ref[]), arr.writable) +end + import Base: setindex! 
"Assign all elements of an NDArray to a scalar" function setindex!(arr :: NDArray, val :: Real, ::Colon) @@ -104,6 +135,9 @@ end function setindex!(arr :: NDArray, val :: NDArray, ::Colon) copy!(arr, val) end +function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, slice::UnitRange{Int}) + copy!(sub(arr, slice), val) +end #------------------------------------------------------------ # Copying functions diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 0d8b3aed0b3c..b070f6edfa93 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -54,6 +54,13 @@ function test_assign() @test reldiff(zeros(size(tensor))+scalar, copy(array)) < 1e-6 end +function test_slice() + array = mx.zeros((2,4)) + array[2:3] = ones(2,2) + @test copy(array) == [0 1 1 0; 0 1 1 0] + @test copy(sub(array, 2:3)) == [1 1; 1 1] +end + function test_plus() dims = rand_dims() t1, a1 = rand_tensors(dims) @@ -159,6 +166,7 @@ end ################################################################################ test_copy() test_assign() +test_slice() test_plus() test_minus() test_mul() From 23c14fcd13f3ee45863bf7ff077077fac8dbb65c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 13 Oct 2015 21:35:50 -0400 Subject: [PATCH 054/630] check writable bit in NDArrays --- src/ndarray.jl | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/src/ndarray.jl b/src/ndarray.jl index 527d53f21ac3..f94b64d1c7d7 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -126,6 +126,7 @@ end import Base: setindex! 
"Assign all elements of an NDArray to a scalar" function setindex!(arr :: NDArray, val :: Real, ::Colon) + @assert(arr.writable) _set_value(val, arr) return arr end @@ -145,6 +146,7 @@ end import Base: copy!, copy "Copy data between NDArrays" function copy!(dst :: NDArray, src :: NDArray) + @assert(dst.writable) if dst.handle == src.handle warn("Copying an NDArray to itself") return @@ -164,6 +166,7 @@ end "Copy data from Julia Array to NDArray" function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) + @assert dst.writable @assert size(dst) == size(src) src = convert(Array{MX_float}, src) # this might involve copying @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t), @@ -225,6 +228,7 @@ macro inplace(stmt) end function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) + @assert dst.writable for arg in args if isa(arg, Real) _plus_scalar(dst, arg, dst) @@ -246,6 +250,7 @@ function .+(arg0 :: NDArray, args :: Union{Real, NDArray}...) end function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) + @assert dst.writable if isa(arg, Real) _minus_scalar(dst, arg, dst) else @@ -265,6 +270,7 @@ function -(arg0 :: NDArray) end function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) + @assert dst.writable if isa(arg, Real) _mul_scalar(dst, arg, dst) else @@ -279,6 +285,7 @@ function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) end function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) + @assert dst.writable if isa(arg, Real) _div_scalar(dst, arg, dst) else From 7481dab25b1d2444a94ba4921f6b72fb53c2bc26 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 13 Oct 2015 21:56:02 -0400 Subject: [PATCH 055/630] untested io.jl --- src/io.jl | 203 +++++++++++++++++++++++++++++++++++++++ src/ndarray.jl | 12 ++- test/unittest/ndarray.jl | 2 +- 3 files changed, 213 insertions(+), 4 deletions(-) create mode 100644 src/io.jl diff --git a/src/io.jl b/src/io.jl new file mode 100644 index 000000000000..6ea020ec4163 --- /dev/null +++ 
b/src/io.jl @@ -0,0 +1,203 @@ +"""Root type for data provider + + A data provider provides interface to iterate over a dataset. It should implement the following functions: + + provides(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} + + Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, + `[(:data, (100,1,28,28)), (:softmax_label, (100,1))]`. + + A data provider should implement the standard Julia iteration interface, including `Base.start`, + `Base.next`, `Base.done` and `Base.eltype`. It could safely assume that the interface functions will + always be called like + + for batch in provider + # ... + load_data!(batch, targets) + end + + which translates into + + state = Base.start(provider) + while !done(provider, state) + (batch, state) = next(provider, state) + # ... + load_data!(batch, targets) + end + + In other words, it could safely assume that `Base.next` is always called after `Base.done`. And neither + of those function will be called twice consequtively. The detailed interfaces are list below: + + Base.start(provider :: AbstractDataProvider) => AbstractDataProviderState + + Initialize or reset the data iteration. + + Base.next(provider :: AbstractDataProvider, state :: AbstractDataProviderState) + => (AbstractDataBatch, AbstractDataProviderState) + + Return one batch of data. Actual data can be retrieved from the batch by interface functions described + in the document of type `AbstractDataBatch`. + + Base.done(provider :: AbstractDataProvider, state :: AbstractDataProviderState) => Bool + + Return `false` if there is more batch to get. + + Base.eltype(::Type{MyDataProvider}) => MyDataProviderState + + Return the type of the data provider state. +""" +abstract AbstractDataProvider + +"""Root type for states of data provider""" +abstract AbstractDataProviderState + +"""A list of (slice, NDArray) pairs. 
Usually each NDArray resides on a different device, and each + slice describe which part of a larger piece of data should goto that device. +""" +typealias SlicedNDArray Vector{Tuple{UnitRange{Int},NDArray}} + +"""Root type for data batch + + A data batch must implement the following interface function to actually provide the data. The interface + is designed to make it easy to generate data on the fly. + + load_data!(batch :: AbstractDataBatch, targets :: Dict{Base.Symbol, SlicedNDArray}) + + Load data into targets. The target is a dictionary mapping name to actual `SlicedNDArray` the data should be + copied into. Note `targets` might not contain names of all the data we could *provide*, simply because + some the data we provie is not needed. + + The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. +""" +abstract AbstractDataBatch + + +################################################################################ +# MXDataProvider +################################################################################ + +"""Wrapper of built-in `libmxnet` data iterators. 
+""" +type MXDataProvider <: AbstractDataProvider + handle :: MX_DataIterHandle + provides :: Vector{Tuple{Base.Symbol, Tuple}} +end + +function _reset_data_iter(handle :: MX_DataIterHandle) + @mxcall(:MXDataIterBeforeFirst, (MX_handle,), handle) +end +function _iter_next(handle :: MX_DataIterHandle) + ref_ret = Ref{Cint}(0) + @mxcall(:MXDataIterNext, (MX_handle, Ref{Cint}), handle, ref_ret) + return Bool(ref_ret[]) +end +function _get_data(handle :: MX_DataIterHandle) + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXDataIterGetData, (MX_handle, Ref{MX_handle}), handle, ref_hdr) + return NDArray(MX_NDArrayHandle(ref_hdr[]), false) +end +function _get_label(handle :: MX_DataIterHandle) + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXDataIterGetLabel, (MX_handle, Ref{MX_handle}), handle, ref_hdr) + return NDArray(MX_NDArrayHandle(ref_hdr[]), false) +end + +function MXDataProvider(handle :: MX_DataIterHandle; + data_name :: Union{Base.Symbol,Void}=:data, + label_name :: Union{Base.Symbol,Void}=:softmax_label, + kwargs...) 
# for convenience, we ignore the rest keyword arguments + # init iterator, load the first batch and get shapes + _reset_data_iter(handle) + @assert(_iter_next(handle), "Failed to load the first batch in MXDataProvider") + provides = [(data_name, size(_get_data(handle)))] + if !isa(label_name, Void) + push!(provides, (label_name::Base.Symbol, size(_get_label(handle)))) + end + + MXDataProvider(handle, provides) +end + +type MXDataProviderState <: AbstractDataProviderState + has_next :: Bool +end +type MXDataBatch <: AbstractDataBatch + provider :: MXDataProvider +end + +function Base.eltype(provider :: MXDataProvider) + MXDataBatch +end +function Base.start(provider :: MXDataProvider) + _reset_data_iter(provider.handle) + return MXDataProviderState(true) +end +function Base.done(provider :: MXDataProvider, state :: MXDataProviderState) + state.has_next = _iter_next(provider.handle) + return !state.has_next +end +function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) + return (MXDataBatch(provider.handle), state) +end + +function load_data!(batch :: MXDataBatch, targets :: Dict{Base.Symbol, SlicedNDArray}) + for (k,v) in targets + if k == batch.provider.provides[1][1] + # data + src = _get_data(batch.provider.handle) + elseif k == batch.provider.provides[2][1] + # label + src = _get_label(batch.provider.handle) + else + @assert(false, "Unknown data $k, we only provide $(batch.provider.provides)") + end + + for (idx, target) in v + copy!(target, slice(src, idx)) + end + end +end + + +function _define_data_iter_creator(hdr :: MX_handle) + ref_name = Ref{char_p}(0) + ref_desc = Ref{char_p}(0) + ref_narg = Ref{MX_uint}(0) + ref_arg_names = Ref{char_pp}(0) + ref_arg_types = Ref{char_pp}(0) + ref_arg_descs = Ref{char_pp}(0) + + @mxcall(:MXDataIterGetIterInfo, + (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), + hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) + + iter_name = 
symbol(bytestring(ref_name[])) + println("defining iterator $iter_name") + defun = quote + function $iter_name(; kwargs...) + arg_keys = AbstractString[string(k) for (k,v) in kwargs] + arg_vals = AbstractString[string(v) for (k,v) in kwargs] + ref_hdr = Ref{MX_handle} + + @mxcall(:MXDataIterCreateIter, (MX_handle, MX_uint, char_pp, char_pp, Ref{MX_handle}), + $hdr, length(arg_keys), arg_keys, arg_vals, ref_hdr) + + return MXDataProvider(MX_DataIterHandle(ref_hdr[]); kwargs...) + end + end + eval(defun) + # TODO: add docstring +end + +function _import_io_iterators() + n_ref = Ref{MX_uint}(0) + h_ref = Ref{Ptr{MX_handle}}(0) + @mxcall(:MXListDataIters, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) + + n_creators = n_ref[] + h_creators = pointer_to_array(h_ref[], n_creators) + + for i = 1:n_creators + creator_hdr = h_creators[i] + _define_data_iter_creator(creator_hdr) + end +end diff --git a/src/ndarray.jl b/src/ndarray.jl index f94b64d1c7d7..bc2438de266f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -106,11 +106,17 @@ function zeros(shape :: Int...) zeros(shape) end -import Base: sub -function sub(arr :: NDArray, ::Colon) +import Base: slice +"""`slice` create a view into a sub-slice of an `NDArray`. Note only slicing at the slowest + changing dimension is supported. In Julia's column-major perspective, this is the last + dimension. For example, given an `NDArray` of shape (2,3,4), `sub(array, 2:3)` will create + a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is + used in data parallelization to split mini-batch into sub-batches for different devices. 
+""" +function slice(arr :: NDArray, ::Colon) arr end -function sub(arr :: NDArray, slice::UnitRange{Int}) +function slice(arr :: NDArray, slice::UnitRange{Int}) dim1 = size(arr)[end] @assert(1 <= slice.start <= slice.stop <= dim1) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index b070f6edfa93..04fc3a632204 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -58,7 +58,7 @@ function test_slice() array = mx.zeros((2,4)) array[2:3] = ones(2,2) @test copy(array) == [0 1 1 0; 0 1 1 0] - @test copy(sub(array, 2:3)) == [1 1; 1 1] + @test copy(slice(array, 2:3)) == [1 1; 1 1] end function test_plus() From 956a2209a8af700821bb18c96838a6a5620d0b90 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 13 Oct 2015 23:25:05 -0400 Subject: [PATCH 056/630] unittest MNIST data provider --- .gitignore | 1 + src/MXNet.jl | 2 ++ src/io.jl | 33 +++++++++++++++++++++++---- src/ndarray.jl | 4 ++-- src/util.jl | 23 +++++++++++++++++++ test/{unittest => }/common.jl | 0 test/runtests.jl | 18 +++++++++------ test/unittest/io.jl | 43 +++++++++++++++++++++++++++++++++++ 8 files changed, 111 insertions(+), 13 deletions(-) create mode 100644 src/util.jl rename test/{unittest => }/common.jl (100%) create mode 100644 test/unittest/io.jl diff --git a/.gitignore b/.gitignore index 8c960ec808d9..2ff5c4a3d770 100644 --- a/.gitignore +++ b/.gitignore @@ -1,3 +1,4 @@ *.jl.cov *.jl.*.cov *.jl.mem +data diff --git a/src/MXNet.jl b/src/MXNet.jl index dee95f9f6115..a5ee9bbae104 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -19,6 +19,8 @@ include("executor.jl") include("io.jl") +include("util.jl") + end # mx end # module MXNet diff --git a/src/io.jl b/src/io.jl index 6ea020ec4163..df7db7375d50 100644 --- a/src/io.jl +++ b/src/io.jl @@ -68,6 +68,17 @@ typealias SlicedNDArray Vector{Tuple{UnitRange{Int},NDArray}} some the data we provie is not needed. The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. 
+ + The following function should also be implemented to handle the case when the mini-batch size does not + divide the size of the whole dataset. So in the last mini-batch, the actual data copied might be fewer + than the mini-batch size. This is usually not an issue during the training as the remaining space may + contain the data and label copied during the previous mini-batch are still valid data. However, during + testing, especially when doing feature extraction, we need to be precise about the number of samples + processed. + + get_pad(batch :: AbstractDataBatch) + + Return the number of *dummy samples* in this mini-batch. """ abstract AbstractDataBatch @@ -109,14 +120,17 @@ function MXDataProvider(handle :: MX_DataIterHandle; # init iterator, load the first batch and get shapes _reset_data_iter(handle) @assert(_iter_next(handle), "Failed to load the first batch in MXDataProvider") - provides = [(data_name, size(_get_data(handle)))] + provides = Tuple{Base.Symbol, Tuple}[(data_name, size(_get_data(handle)))] if !isa(label_name, Void) push!(provides, (label_name::Base.Symbol, size(_get_label(handle)))) end + _reset_data_iter(handle) MXDataProvider(handle, provides) end +provides(provider::MXDataProvider) = provider.provides + type MXDataProviderState <: AbstractDataProviderState has_next :: Bool end @@ -136,7 +150,7 @@ function Base.done(provider :: MXDataProvider, state :: MXDataProviderState) return !state.has_next end function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) - return (MXDataBatch(provider.handle), state) + return (MXDataBatch(provider), state) end function load_data!(batch :: MXDataBatch, targets :: Dict{Base.Symbol, SlicedNDArray}) @@ -157,6 +171,12 @@ function load_data!(batch :: MXDataBatch, targets :: Dict{Base.Symbol, SlicedNDA end end +function get_pad(batch :: MXDataBatch) + ref_pad = Ref{Cint}(0) + @mxcall(:MXDataIterGetPadNum, (MX_handle, Ref{Cint}), batch.provider.handle, ref_pad) + return Int(ref_pad[]) +end + 
function _define_data_iter_creator(hdr :: MX_handle) ref_name = Ref{char_p}(0) @@ -171,12 +191,11 @@ function _define_data_iter_creator(hdr :: MX_handle) hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) iter_name = symbol(bytestring(ref_name[])) - println("defining iterator $iter_name") defun = quote function $iter_name(; kwargs...) arg_keys = AbstractString[string(k) for (k,v) in kwargs] arg_vals = AbstractString[string(v) for (k,v) in kwargs] - ref_hdr = Ref{MX_handle} + ref_hdr = Ref{MX_handle}(0) @mxcall(:MXDataIterCreateIter, (MX_handle, MX_uint, char_pp, char_pp, Ref{MX_handle}), $hdr, length(arg_keys), arg_keys, arg_vals, ref_hdr) @@ -186,6 +205,12 @@ function _define_data_iter_creator(hdr :: MX_handle) end eval(defun) # TODO: add docstring + + # add an alias XXXProvider => XXXIter + if endswith(string(iter_name), "Iter") + alias_name = symbol(string(iter_name)[1:end-4] * "Provider") + eval(:($alias_name = $iter_name)) + end end function _import_io_iterators() diff --git a/src/ndarray.jl b/src/ndarray.jl index bc2438de266f..5e1e29fa7eb6 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -142,8 +142,8 @@ end function setindex!(arr :: NDArray, val :: NDArray, ::Colon) copy!(arr, val) end -function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, slice::UnitRange{Int}) - copy!(sub(arr, slice), val) +function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, idx::UnitRange{Int}) + copy!(slice(arr, idx), val) end #------------------------------------------------------------ diff --git a/src/util.jl b/src/util.jl new file mode 100644 index 000000000000..48a55348049e --- /dev/null +++ b/src/util.jl @@ -0,0 +1,23 @@ +function get_data_dir() + data_dir = joinpath(Pkg.dir("MXNet"), "data") + mkpath(data_dir) + data_dir +end + +function get_mnist_ubyte() + data_dir = get_data_dir() + mnist_dir = joinpath(data_dir, "mnist") + mkpath(mnist_dir) + filenames = Dict(:train_data => 
"train-images-idx3-ubyte", + :train_label => "train-labels-idx1-ubyte", + :test_data => "t10k-images-idx3-ubyte", + :test_label => "t10k-labels-idx1-ubyte") + filenames = [k => joinpath(mnist_dir, v) for (k,v) in filenames] + if !all(isfile, values(filenames)) + cd(mnist_dir) do + run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip`) + run(`unzip -u mnist.zip`) + end + end + return filenames +end diff --git a/test/unittest/common.jl b/test/common.jl similarity index 100% rename from test/unittest/common.jl rename to test/common.jl diff --git a/test/runtests.jl b/test/runtests.jl index ebed98227084..1d5f49b4d1f1 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -1,12 +1,16 @@ using MXNet using Base.Test -include("unittest/common.jl") +# run test in the whole directory, latest modified files +# are run first, this makes waiting time shorter when writing +# or modifying unit-tests +function test_dir(dir) + jl_files = sort(filter(x -> ismatch(r".*\.jl$", x), readdir(dir)), by = fn -> stat(joinpath(dir,fn)).mtime) + map(reverse(jl_files)) do file + include("$dir/$file") + end +end -include("unittest/ndarray.jl") -include("unittest/random.jl") - -include("unittest/name.jl") -include("unittest/symbol.jl") -include("unittest/bind.jl") +include("common.jl") +test_dir("unittest") diff --git a/test/unittest/io.jl b/test/unittest/io.jl new file mode 100644 index 000000000000..1ac65ae78464 --- /dev/null +++ b/test/unittest/io.jl @@ -0,0 +1,43 @@ +module TestIO +using MXNet +using Base.Test + +function test_mnist() + info("IO::MNIST") + filenames = mx.get_mnist_ubyte() + + batch_size = 10 + mnist_provider = mx.MNISTProvider(image=filenames[:train_data], + label=filenames[:train_label], + batch_size=batch_size, silent=true, shuffle=false) + spec = mx.provides(mnist_provider) + spec = Dict(spec) + @test haskey(spec, :data) + @test haskey(spec, :softmax_label) + @test spec[:data] == (28,28,1,batch_size) + @test spec[:softmax_label] == (batch_size,) + + n_batch = 0 + 
for batch in mnist_provider + if n_batch == 0 + data_array = mx.empty(28,28,1,batch_size) + label_array = mx.empty(batch_size) + targets = Dict(:data => [(1:batch_size, data_array)], + :softmax_label => [(1:batch_size, label_array)]) + + mx.load_data!(batch, targets) + + true_labels = [5,0,4,1,9,2,1,3,1,4] # the first 10 labels in MNIST train + got_labels = Int[copy(label_array)...] + @test true_labels == got_labels + end + + n_batch += 1 + end + + @test n_batch == 60000 / batch_size +end + +test_mnist() + +end From 31132563f77e359d5ce7acadb47626414bc0cd65 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 14 Oct 2015 18:07:15 -0400 Subject: [PATCH 057/630] kvstore init / push / pull --- src/MXNet.jl | 1 + src/init.jl | 1 + src/kvstore.jl | 80 ++++++++++++++++++++++++++++++++++++++++ src/ndarray.jl | 10 +++++ test/unittest/kvstore.jl | 31 ++++++++++++++++ 5 files changed, 123 insertions(+) create mode 100644 src/kvstore.jl create mode 100644 test/unittest/kvstore.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index a5ee9bbae104..964b467dcb37 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -18,6 +18,7 @@ include("symbol.jl") include("executor.jl") include("io.jl") +include("kvstore.jl") include("util.jl") diff --git a/src/init.jl b/src/init.jl index 894edbf83bd8..f23d9f3b2207 100644 --- a/src/init.jl +++ b/src/init.jl @@ -99,3 +99,4 @@ end @mx_define_handle_t(MX_SymbolHandle, MXSymbolFree) @mx_define_handle_t(MX_ExecutorHandle, MXExecutorFree) @mx_define_handle_t(MX_DataIterHandle, MXDataIterFree) +@mx_define_handle_t(MX_KVStoreHandle, MXKVStoreFree) diff --git a/src/kvstore.jl b/src/kvstore.jl new file mode 100644 index 000000000000..6c5f58ff20a7 --- /dev/null +++ b/src/kvstore.jl @@ -0,0 +1,80 @@ +type KVStore + handle :: MX_KVStoreHandle +end + +function KVStore(kv_type::Base.Symbol = :local) + @assert(kv_type ∈ [:local]) # TODO: update with allowed types + + ref_hdr = Ref{MX_handle}(0) + kv_type = string(kv_type) + @mxcall(:MXKVStoreCreate, (char_p, 
Ref{MX_handle}), kv_type, ref_hdr) + return KVStore(MX_KVStoreHandle(ref_hdr[])) +end +function Base.unsafe_convert(::Type{MX_handle}, obj::KVStore) + Base.unsafe_convert(MX_handle, obj.handle) +end +Base.convert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) +Base.cconvert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) + +function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) + @assert length(keys) == length(vals) + Keys_flt = Int[] + vals_flt = NDArray[] + for (k,v) in zip(keys, vals) + append!(keys_flt, ones(Int, length(v))*k) + append!(vals_flt, v) + end + return (keys_flt, vals_flt) +end + +function init!(self :: KVStore, key :: Int, val :: NDArray) + init!(self, [key], [val]) +end +function init!(self :: KVStore, key :: Int, vals :: Vector{NDArray}) + init!(self, ones(Int, length(vals))*key, vals) +end +function init!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) + init!(self, _flatten_kvlist(keys, vals)...) +end +function init!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{NDArray}) + @assert length(keys) == length(vals) + keys = Cint[keys...] + vals = MX_handle[vals...] + @mxcall(:MXKVStoreInit, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}), + self, length(keys), keys, vals) +end + +import Base.push! +function push!(self :: KVStore, key :: Int, val :: NDArray; priority :: Int = 0) + push!(self, [key], [val]; priority = priority) +end +function push!(self :: KVStore, key :: Int, vals :: Vector{NDArray}; priority :: Int = 0) + push!(self, ones(Int, length(vals))*key, vals; priority = priority) +end +function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}; priority::Int=0) + push!(self, _flatten_kvlist(keys, vals)...; priority = priority) +end +function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{NDArray}; priority::Int=0) + @assert length(keys) == length(vals) + keys = Cint[keys...] + vals = MX_handle[vals...] 
+ @mxcall(:MXKVStorePush, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), + self, length(keys), keys, vals, priority) +end + +function pull!(self :: KVStore, key :: Int, out :: NDArray; priority :: Int = 0) + pull!(self, [key], [out]) +end +function pull!(self :: KVStore, key :: Int, outs :: Vector{NDArray}; priority :: Int = 0) + pull!(self, ones(Int, length(outs))*key, outs; priority = priority) +end +function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{Vector{NDArray}}; priority::Int=0) + pull!(self, _flatten_kvlist(keys, outs)...; priority = priority) +end +function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{NDArray}; priority::Int=0) + @assert length(keys) == length(outs) + keys = Cint[keys...] + outs = MX_handle[outs...] + @mxcall(:MXKVStorePull, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), + self, length(keys), keys, outs, priority) +end diff --git a/src/ndarray.jl b/src/ndarray.jl index 5e1e29fa7eb6..3aaf9946814b 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -106,6 +106,16 @@ function zeros(shape :: Int...) zeros(shape) end +"Create NDArray and initialize with 1" +function ones{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) + arr = empty(shape, ctx) + arr[:] = 1 + return arr +end +function ones(shape :: Int...) + ones(shape) +end + import Base: slice """`slice` create a view into a sub-slice of an `NDArray`. Note only slicing at the slowest changing dimension is supported. 
In Julia's column-major perspective, this is the last diff --git a/test/unittest/kvstore.jl b/test/unittest/kvstore.jl new file mode 100644 index 000000000000..1e3060ff42e7 --- /dev/null +++ b/test/unittest/kvstore.jl @@ -0,0 +1,31 @@ +module TestKVStore +using MXNet +using Base.Test + +using ..Main: rand_dims + +SHAPE = rand_dims() +KEYS = [5,7,11] + +function init_kv() + kv = mx.KVStore() + mx.init!(kv, 3, mx.zeros(SHAPE)) + + vals = [mx.zeros(SHAPE) for k in KEYS] + mx.init!(kv, KEYS, vals) + return kv +end + +function test_single_kv_pair() + info("KVStore::single") + + kv = init_kv() + mx.push!(kv, 3, mx.ones(SHAPE)) + val = mx.empty(SHAPE) + mx.pull!(kv, 3, val) + @test maximum(abs(copy(val) - 1)) == 0 +end + +test_single_kv_pair() + +end From 8e4102f0bf687d2e941f7904e763f1b1d4c56dea Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 14 Oct 2015 18:24:49 -0400 Subject: [PATCH 058/630] kvstore test aggregration --- src/kvstore.jl | 10 +++++----- src/ndarray.jl | 6 ++++++ test/unittest/kvstore.jl | 28 ++++++++++++++++++++++++++++ 3 files changed, 39 insertions(+), 5 deletions(-) diff --git a/src/kvstore.jl b/src/kvstore.jl index 6c5f58ff20a7..d553a65dbd42 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -18,10 +18,10 @@ Base.cconvert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) @assert length(keys) == length(vals) - Keys_flt = Int[] + keys_flt = Int[] vals_flt = NDArray[] for (k,v) in zip(keys, vals) - append!(keys_flt, ones(Int, length(v))*k) + append!(keys_flt, Base.ones(Int, length(v))*k) append!(vals_flt, v) end return (keys_flt, vals_flt) @@ -31,7 +31,7 @@ function init!(self :: KVStore, key :: Int, val :: NDArray) init!(self, [key], [val]) end function init!(self :: KVStore, key :: Int, vals :: Vector{NDArray}) - init!(self, ones(Int, length(vals))*key, vals) + init!(self, Base.ones(Int, length(vals))*key, vals) end function init!(self :: KVStore, keys 
:: Vector{Int}, vals :: Vector{Vector{NDArray}}) init!(self, _flatten_kvlist(keys, vals)...) @@ -49,7 +49,7 @@ function push!(self :: KVStore, key :: Int, val :: NDArray; priority :: Int = 0) push!(self, [key], [val]; priority = priority) end function push!(self :: KVStore, key :: Int, vals :: Vector{NDArray}; priority :: Int = 0) - push!(self, ones(Int, length(vals))*key, vals; priority = priority) + push!(self, Base.ones(Int, length(vals))*key, vals; priority = priority) end function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}; priority::Int=0) push!(self, _flatten_kvlist(keys, vals)...; priority = priority) @@ -66,7 +66,7 @@ function pull!(self :: KVStore, key :: Int, out :: NDArray; priority :: Int = 0) pull!(self, [key], [out]) end function pull!(self :: KVStore, key :: Int, outs :: Vector{NDArray}; priority :: Int = 0) - pull!(self, ones(Int, length(outs))*key, outs; priority = priority) + pull!(self, Base.ones(Int, length(outs))*key, outs; priority = priority) end function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{Vector{NDArray}}; priority::Int=0) pull!(self, _flatten_kvlist(keys, outs)...; priority = priority) diff --git a/src/ndarray.jl b/src/ndarray.jl index 3aaf9946814b..95757917bd29 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -299,6 +299,12 @@ function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) mul_to!(ret, arg) end +# unlike *, we only allow type Real in arguments, because array-array * operator +# means matrix multiplication in Julia +function *(arg0 :: NDArray, arg :: Real) + ret = copy(arg0, context(arg0)) + mul_to!(ret, arg) +end function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable diff --git a/test/unittest/kvstore.jl b/test/unittest/kvstore.jl index 1e3060ff42e7..bca77a556922 100644 --- a/test/unittest/kvstore.jl +++ b/test/unittest/kvstore.jl @@ -26,6 +26,34 @@ function test_single_kv_pair() @test maximum(abs(copy(val) 
- 1)) == 0 end +function test_aggregator() + info("KVStore::aggregator") + + kv = init_kv() + + num_devs = 4 + devs = [mx.Context(mx.CPU, i) for i=0:num_devs-1] + vals = [mx.ones(SHAPE, dev) for dev in devs] + + mx.push!(kv, 3, vals) + mx.pull!(kv, 3, vals) + for v in vals + @test maximum(abs(copy(v)) - num_devs) == 0 + end + + # list + vals = [mx.NDArray[mx.ones(SHAPE, dev)*2 for dev in devs] for k in KEYS] + mx.push!(kv, KEYS, vals) + mx.pull!(kv, KEYS, vals) + + for vv in vals + for v in vv + @test maximum(abs(copy(v)) - 2num_devs) == 0 + end + end +end + test_single_kv_pair() +test_aggregator() end From 48a2b208ee8369e8d845b2b3613dfc8515f9a606 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 16 Oct 2015 00:02:02 -0400 Subject: [PATCH 059/630] eval metric --- src/MXNet.jl | 2 ++ src/metric.jl | 30 ++++++++++++++++++++++++++++++ 2 files changed, 32 insertions(+) create mode 100644 src/metric.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index 964b467dcb37..4f703d5e6d18 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -20,6 +20,8 @@ include("executor.jl") include("io.jl") include("kvstore.jl") +include("metric.jl") + include("util.jl") end # mx diff --git a/src/metric.jl b/src/metric.jl new file mode 100644 index 000000000000..94dd97a9b911 --- /dev/null +++ b/src/metric.jl @@ -0,0 +1,30 @@ +abstract AbstractEvalMetric + +type Accuracy <: AbstractEvalMetric + acc_sum :: Float64 + n_sample :: Int + + Accuracy() = new(0.0, 0) +end + +function update!(metric :: Accuracy, label :: NDArray, pred :: NDArray) + label = copy(label) + pred = copy(pred) + + n_sample = size(pred)[end] + metric.n_sample += n_sample + for i = 1:n_sample + klass = indmax(sub(pred,:,i)) + metric.acc_sum += (klass-1) == label[i] + end +end + +import Base: get +function get(metric :: Accuracy) + metric.acc_sum / metric.n_sample +end + +function reset!(metric :: Accuracy) + metric.acc_sum = 0.0 + metric.n_sample = 0 +end From dd02638fb9e3250829094eaa1cdbaee45d18b8d0 Mon Sep 17 00:00:00 2001 
From: Chiyuan Zhang Date: Fri, 16 Oct 2015 00:14:40 -0400 Subject: [PATCH 060/630] shape should be translated between Julia<->C in infer_shape --- src/symbol.jl | 6 +++--- test/unittest/symbol.jl | 8 ++++---- 2 files changed, 7 insertions(+), 7 deletions(-) diff --git a/src/symbol.jl b/src/symbol.jl index d8f45cb1f9eb..a352173b7a43 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -113,7 +113,7 @@ macro _infer_shape(self, keys, indptr, sdata) shape_data = pointer_to_array(shape_data, shape_size) map(1:shape_size) do i my_shape = pointer_to_array(shape_data[i], shape_ndim[i]) - tuple(Int[my_shape...]...) + tuple(flipdim(Int[my_shape...],1)...) end end return ( @@ -128,7 +128,7 @@ function infer_shape(self :: Symbol; kwargs...) sdata = MX_uint[] indptr = MX_uint[0] for (k,v) in kwargs - append!(sdata, [v...]) + append!(sdata, flipdim([v...],1)) push!(indptr, length(sdata)) end keys = AbstractString[string(x[1]) for x in kwargs] @@ -139,7 +139,7 @@ function infer_shape(self :: Symbol, args :: Union{Tuple, Void}...) 
indptr = MX_uint[0] for arg in args if isa(arg, Void); continue; end - append!(sdata, [arg...]) + append!(sdata, flipdim([arg...],1)) push!(indptr, length(sdata)) end keys = Ptr{char_p}(0) diff --git a/test/unittest/symbol.jl b/test/unittest/symbol.jl index 9fa11789701f..b62496d20fbc 100644 --- a/test/unittest/symbol.jl +++ b/test/unittest/symbol.jl @@ -53,18 +53,18 @@ function test_infer_shape() data_shape = (100, 100) arg_shapes, out_shapes, aux_shapes = mx.infer_shape(model, data=data_shape) arg_shape_dict = Dict{Symbol,Tuple}(zip(mx.list_arguments(model), arg_shapes)) - @test arg_shape_dict == Dict{Symbol,Tuple}(:fc2_bias => (10,),:fc2_weight => (10,1000), - :fc1_bias => (1000,), :fc1_weight => (1000,100), + @test arg_shape_dict == Dict{Symbol,Tuple}(:fc2_bias => (10,),:fc2_weight => (1000,10), + :fc1_bias => (1000,), :fc1_weight => (100, 1000), :data => data_shape) @test length(out_shapes) == 1 - @test out_shapes[1] == (100, 10) + @test out_shapes[1] == (10, 100) end function test_infer_shape_error() info("Symbol::infer_shape::throws") model = mlp2() - weight_shape = (1, 100) + weight_shape = (100, 1) data_shape = (100, 100) @test_throws mx.MXError mx.infer_shape(model, data=data_shape, fc1_weight=weight_shape) end From d061a180579281f213f3d4cd09f8838aec4471dc Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 17 Oct 2015 13:43:38 -0400 Subject: [PATCH 061/630] optimizer and estimator --- REQUIRE | 1 + src/MXNet.jl | 6 +- src/estimator.jl | 264 ++++++++++++++++++++++++++++++++++++++++++++ src/executor.jl | 27 ++++- src/io.jl | 67 ++++++----- src/kvstore.jl | 47 +++++++- src/metric.jl | 11 +- src/ndarray.jl | 3 + src/optimizer.jl | 76 +++++++++++++ src/symbol.jl | 3 +- test/unittest/io.jl | 19 ++-- 11 files changed, 479 insertions(+), 45 deletions(-) create mode 100644 src/estimator.jl create mode 100644 src/optimizer.jl diff --git a/REQUIRE b/REQUIRE index d5d646713dcf..76fa30ce5f54 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1 +1,2 @@ julia 0.4 +Formatting 
diff --git a/src/MXNet.jl b/src/MXNet.jl index 4f703d5e6d18..cd96b3573af5 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -6,6 +6,7 @@ module MXNet # functions with the same names as built-in utilities like "zeros", etc. export mx module mx +using Formatting include("init.jl") include("context.jl") @@ -17,10 +18,13 @@ include("name.jl") include("symbol.jl") include("executor.jl") +include("metric.jl") +include("optimizer.jl") + include("io.jl") include("kvstore.jl") -include("metric.jl") +include("estimator.jl") include("util.jl") diff --git a/src/estimator.jl b/src/estimator.jl new file mode 100644 index 000000000000..b3bd67e19bf4 --- /dev/null +++ b/src/estimator.jl @@ -0,0 +1,264 @@ +abstract AbstractEstimator + +type FeedForward <: AbstractEstimator + arch :: Symbol + ctx :: Vector{Context} + + arg_params :: Dict{Base.Symbol, NDArray} + aux_params :: Dict{Base.Symbol, NDArray} + + # leave the rest fields undefined + FeedForward(arch :: Symbol, ctx :: Vector{Context}) = new(arch, ctx) +end + +function _check_arguments(symbol :: Symbol) + arg_names = list_arguments(symbol) + @assert(length(unique(arg_names)) == length(arg_names), "Duplicated names in arguments $arg_names") +end + +"""Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector + of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that + piece. +""" +function _split_inputs(batch_size :: Int, n_split :: Int) + @assert(batch_size >= n_split) + per_split = floor(Int, batch_size / n_split) + counts = zeros(Int, n_split)+per_split + extra = batch_size - sum(counts) + counts[1:extra] += 1 + + cum = [0, cumsum(counts)...] 
+ idx = [cum[i-1]+1:cum[i] for i = 2:length(cum)] + return idx +end + +function FeedForward(arch :: Symbol; context :: Union{Context, Vector{Context}, Void} = nothing) + if isa(context, Void) + context = [Context(CPU)] + elseif isa(context, Context) + context = [context] + end + FeedForward(arch, context) +end + +function _init_params(self :: FeedForward, data :: AbstractDataProvider) + # all arg names, including data, label, and parameters + arg_names = list_arguments(self.arch) + + data_shapes = provide_data(data) + label_shapes = provide_label(data) + data_names = [x[1] for x in data_shapes] + label_names = [x[1] for x in label_shapes] + + param_names = setdiff(arg_names, data_names ∪ label_names) + aux_names = list_auxiliary_states(self.arch) + + arg_shapes, grad_shapes, aux_shapes = infer_shape(self.arch; data_shapes...) + if !isdefined(self, :arg_params) + param_name_shapes = filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) + self.arg_params = Dict([name => empty(shape) for (name,shape) in param_name_shapes]) + end + if !isdefined(self, :aux_params) + self.aux_params = Dict([name => empty(shape) for (name,shape) in zip(aux_names,aux_shapes)]) + end + + # initialize the contents of the parameters + for (k,v) in self.arg_params + self.initializer(k, v) + end + for (k,v) in self.aux_params + self.initializer(k, v) + end + + return (param_names, aux_names) +end + +function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) + if num_device == 1 && !ismatch(r"dist", string(kv_type)) + kv = nothing + else + if kv_type == :local + max_size = maximum([prod(size(param)) for (k,param) in arg_params]) + if max_size < 1024 * 1024 * 16 + kv_type = :loca_update_cpu + else + kv_type = :local_allreduce_cpu + end + info("Auto-select kvstore type = $kv_type") + end + kv = KVStore(kv_type) + end + + update_on_kvstore = true + if isa(kv, Void) || ismatch(r"local_allreduce", string(get_type(kv))) + update_on_kvstore = 
false + end + + return (kv, update_on_kvstore) +end + +function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; + epoch_stop :: Int = 10, epoch_start :: Int = 1, + eval_data :: Union{Void, AbstractDataProvider} = nothing, + eval_metric :: AbstractEvalMetric = Accuracy(), + kvstore :: Union{Base.Symbol, KVStore} = :local) + + info("Start training on $(self.ctx)") + + batch_size = get_batch_size(data) + num_dev = length(self.ctx) + slices = _split_inputs(batch_size, num_dev) + + # initialize parameters + info("Initializing parameters...") + param_names, aux_names = _init_params(self, param_names, aux_names) + + # setup kvstore + if isa(kvstore, Base.Symbol) + info("Creating KVStore...") + kvstore, update_on_kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params) + end + + train_execs = Array(Executor, num_dev) + for i = 1:num_dev + data_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)] + train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=GRAD_WRITE, data_shapes...) 
+ end + + # set up input data structures + data_names = [x[1] for x in provide_data(data)] + label_names = [x[1] for x in provide_label(data)] + + data_arrays = Vector{NDArray}[[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] + for name in data_names] + label_arrays = Vector{NDArray}[[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] + for name in label_names] + + param_arrays = Vector{NDArray}[[exec.arg_arrays[i] for exec in train_execs] for i = 1:length(param_names)] + grad_arrays = Vector{NDArray}[[exec.grad_arrays[i] for exec in train_execs] for i = 1:length(param_names)] + + optimizer.inv_batch_size = 1.0/batch_size + + if !update_on_kvstore + updater = get_updater(self.optimizer) + end + + if !isa(kvstore, Void) + if update_on_kvstore + set_optimizer(kvstore, optimizer) + end + + # init kv with gradients + for idx = 1:length(param_arrays) + param_on_devs = param_arrays[idx] + grad_on_devs = grad_arrays[idx] + + init!(kvstore, idx, self.arg_params[param_names[idx]]) + + # pull weights back + pull!(kvstore, idx, param_on_devs, priority=-idx) + end + end + + # set up output and labels in CPU for evaluation metric + output_shapes = [tuple(size(x)[1:end-1]...,batch_size) for x in train_execs[1].outputs] + cpu_dev = Context(CPU) + cpu_output_arrays = [empty(shape, cpu_dev) for shape in output_shapes] + cpu_label_arrays = [empty(shape, cpu_dev) for (name,shape) in provide_label(data)] + cpu_label_arrays_full_slice = [(1:batch_size, x) for x in label_arrays] + + # now start training... 
+ for i_epoch = epoch_start:epoch_stop + time_start = time() + reset!(eval_metric) + n_batch = 0 + + for batch in data + load_data!(batch, data_arrays) + load_label!(batch, label_arrays) + + # forward and backward + for (texec, islice) in zip(train_execs, slices) + forward(texec, is_train=true) + + # copy outputs into cpu ndarray, for evaluation metric + for (cpu_out, dev_out) in zip(cpu_output_arrays, texec.outputs) + copy!(slice(cpu_out, islice), dev_out) + end + + backward(texec) + end + + # update parameters + for idx = 1:length(param_names) + # gradient synchronization + if !isa(kvstore, Void) + # push gradient, priority is negative index + push!(kvstore, idx, grad_arrays[idx], priority=-idx) + if update_on_kvstore + # pull back the weights + pull!(kvstore, idx, param_arrays[idx], priority=-idx) + else + # pull back the sum-ed gradients, to the same locations + pull!(kvstore, idx, grad_arrays[idx], priority=-idx) + end + end + + if !update_on_kvstore + # manual updating + for i_dev = 1:num_dev + # create a fake index, so that the updater create states + # for different param AND different devices, TODO(mli) + # use a better solution later + fake_idx = idx * num_dev + i_dev + updater(fake_idx, grad_arrays[idx][i_dev], param_arrays[idx][i_dev]) + end + end + end + + n_batch += 1 + + # update evaluation metric on training set + load_label!(batch, cpu_label_arrays_full_slice) + update!(eval_metric, cpu_label_arrays, cpu_output_arrays) + end # end of one epoch + + time_stop = time() + info("== Epoch {1:0>3d} ==========", i_epoch) + info("## Training summary") + for (name, value) in get(eval_metric) + info("{1>15s} = {2:.4f}", name, value) + end + info("{1>15s} = {2:.2f} seconds", "time", (time_stop-time_start)/1e9) + + # evaluation on validation set + if !isa(eval_data, Void) + # because we are re-using the memory allocated for the training network, + # the batch_size of the validation dataset must be the same as the training + # batch_size + 
@assert(get_batch_size(eval_data) == batch_size) + + reset!(eval_metric) + for batch in eval_data + load_data!(batch, data_arrays) + + # forward and backward + for (texec, islice) in zip(train_execs, slices) + forward(texec, is_train=true) + + # copy outputs into cpu ndarray, for evaluation metric + for (cpu_out, dev_out) in zip(cpu_output_arrays, texec.outputs) + copy!(slice(cpu_out, islice), dev_out) + end + end + load_label!(batch, cpu_label_arrays_full_slice) + update!(eval_metric, cpu_label_arrays, cpu_output_arrays) + end + + info("## Validation summary") + for (name, value) in get(eval_metric) + info("{1>15s} = {2:.4f}", name, value) + end + end + end # end of all epochs +end diff --git a/src/executor.jl b/src/executor.jl index 96c379a1bd25..6ddcff91efea 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -100,9 +100,11 @@ function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_W grad_arrays = nothing else grad_arrays = Dict{Base.Symbol, NDArray} + provided_data_names = keys(kwargs) for (name, shape) in zip(list_arguments(self), grad_shapes) # TODO: use a better way to identify data - if !(endswith(string(name), "data") || endswith(string(name), "label")) + #if !(endswith(string(name), "data") || endswith(string(name), "label")) + if !in(name, provided_data_names) grad_arrays[name] = zeros(shape, ctx) end end @@ -133,3 +135,26 @@ function backward(self :: Executor, out_grads :: Vector{NDArray}) out_grads = MX_handle[out_grads...] 
@mxcall(:MXExecutorBackward, (MX_handle, MX_uint, Ptr{MX_handle}), self, length(out_grads), out_grads) end + + +function copy_params_from(self::Executor, arg_params::Dict{Base.Symbol,NDArray}, + aux_params::Union{Void,Dict{Base.Symbol,NDArray}}=nothing; + allow_extra_params::Bool=false) + for (name, array) in arg_params + if haskey(self.arg_dict, name) + copy!(self.arg_dict[name], array) + else + @assert(allow_extra_params, "Extra params $name not in the arguments") + end + end + + if !isa(aux_params, Void) + for (name, array) in aux_params + if haskey(self.aux_dict, name) + copy!(self.aux_dict[name], array) + else + @assert(allow_extra_params, "Extra auxiliary state $name not recognized") + end + end + end +end diff --git a/src/io.jl b/src/io.jl index df7db7375d50..834e7ad755a4 100644 --- a/src/io.jl +++ b/src/io.jl @@ -2,10 +2,16 @@ A data provider provides interface to iterate over a dataset. It should implement the following functions: - provides(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} + provide_data(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} + provide_label(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, - `[(:data, (100,1,28,28)), (:softmax_label, (100,1))]`. + `[(:data, (100,1,28,28))]` or `[(:softmax_label, (100,1))]`. It should also implement the following convenient + function + + get_batch_size(provider :: AbstractDataProvider) => Int + + which returns the batch size used in this data provider. A data provider should implement the standard Julia iteration interface, including `Base.start`, `Base.next`, `Base.done` and `Base.eltype`. 
It could safely assume that the interface functions will @@ -58,14 +64,14 @@ typealias SlicedNDArray Vector{Tuple{UnitRange{Int},NDArray}} """Root type for data batch - A data batch must implement the following interface function to actually provide the data. The interface - is designed to make it easy to generate data on the fly. + A data batch must implement the following interface function to actually provide the data and label. - load_data!(batch :: AbstractDataBatch, targets :: Dict{Base.Symbol, SlicedNDArray}) + load_data!(batch :: AbstractDataBatch, targets :: Vector{SlicedNDArray}) + load_label!(batch :: AbstractDataBatch, targets :: Vector{SlicedNDArray}) - Load data into targets. The target is a dictionary mapping name to actual `SlicedNDArray` the data should be - copied into. Note `targets` might not contain names of all the data we could *provide*, simply because - some the data we provie is not needed. + Load data and label into targets. The target is a list of `SlicedNDArray` the data/label should be + copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and + `provide_label`. The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. @@ -90,8 +96,10 @@ abstract AbstractDataBatch """Wrapper of built-in `libmxnet` data iterators. 
""" type MXDataProvider <: AbstractDataProvider - handle :: MX_DataIterHandle - provides :: Vector{Tuple{Base.Symbol, Tuple}} + handle :: MX_DataIterHandle + data_shape :: Vector{Tuple{Base.Symbol, Tuple}} + label_shape:: Vector{Tuple{Base.Symbol, Tuple}} + batch_size :: Int end function _reset_data_iter(handle :: MX_DataIterHandle) @@ -120,16 +128,20 @@ function MXDataProvider(handle :: MX_DataIterHandle; # init iterator, load the first batch and get shapes _reset_data_iter(handle) @assert(_iter_next(handle), "Failed to load the first batch in MXDataProvider") - provides = Tuple{Base.Symbol, Tuple}[(data_name, size(_get_data(handle)))] + data_shape = Tuple{Base.Symbol, Tuple}[(data_name, size(_get_data(handle)))] if !isa(label_name, Void) - push!(provides, (label_name::Base.Symbol, size(_get_label(handle)))) + label_shape = Tuple{Base.Symbol, Tuple}[(label_name::Base.Symbol, size(_get_label(handle)))] + else + label_shape = Tuple{Base.Symbol, Tuple}[] end _reset_data_iter(handle) - MXDataProvider(handle, provides) + MXDataProvider(handle, data_shape, label_shape, data_shape[1][2][end]) end -provides(provider::MXDataProvider) = provider.provides +provide_data(provider::MXDataProvider) = provider.data_shape +provide_label(provider::MXDataProvider) = provider.label_shape +get_batch_size(provider::MXDataProvider) = provider.batch_size type MXDataProviderState <: AbstractDataProviderState has_next :: Bool @@ -153,24 +165,21 @@ function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) return (MXDataBatch(provider), state) end -function load_data!(batch :: MXDataBatch, targets :: Dict{Base.Symbol, SlicedNDArray}) - for (k,v) in targets - if k == batch.provider.provides[1][1] - # data - src = _get_data(batch.provider.handle) - elseif k == batch.provider.provides[2][1] - # label - src = _get_label(batch.provider.handle) - else - @assert(false, "Unknown data $k, we only provide $(batch.provider.provides)") - end - - for (idx, target) in v - copy!(target, 
slice(src, idx)) - end +function _load_general!(batch :: MXDataBatch, loader :: Function, targets :: Vector{SlicedNDArray}) + @assert length(targets) == 1 + src = loader(batch.provider.handle) + for (idx, target) in targets[1] + copy!(target, slice(src, idx)) end end +function load_data!(batch :: MXDataBatch, targets :: Vector{SlicedNDArray}) + _load_general!(batch, _get_data, targets) +end +function load_label!(batch :: MXDataBatch, targets :: Vector{SlicedNDArray}) + _load_general!(batch, _get_label, targets) +end + function get_pad(batch :: MXDataBatch) ref_pad = Ref{Cint}(0) @mxcall(:MXDataIterGetPadNum, (MX_handle, Ref{Cint}), batch.provider.handle, ref_pad) diff --git a/src/kvstore.jl b/src/kvstore.jl index d553a65dbd42..6d0642a6d2a7 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -1,5 +1,6 @@ type KVStore - handle :: MX_KVStoreHandle + handle :: MX_KVStoreHandle + updater_c :: Ptr{Void} end function KVStore(kv_type::Base.Symbol = :local) @@ -8,7 +9,7 @@ function KVStore(kv_type::Base.Symbol = :local) ref_hdr = Ref{MX_handle}(0) kv_type = string(kv_type) @mxcall(:MXKVStoreCreate, (char_p, Ref{MX_handle}), kv_type, ref_hdr) - return KVStore(MX_KVStoreHandle(ref_hdr[])) + return KVStore(MX_KVStoreHandle(ref_hdr[]), Ptr{Void}(0)) end function Base.unsafe_convert(::Type{MX_handle}, obj::KVStore) Base.unsafe_convert(MX_handle, obj.handle) @@ -78,3 +79,45 @@ function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{NDArray}; pr @mxcall(:MXKVStorePull, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), self, length(keys), keys, outs, priority) end + + +function get_type(self :: KVStore) + type_ref = Ref{char_p}(0) + @mxcall(:MXKVStoreGetType, (MX_handle, Ref{char_p}), self, type_ref) + return symbol(bytestring(type_ref[])) +end + +function get_num_workers(self :: KVStore) + ref_size = Ref{Cint}(0) + @mxcall(:MXKVStoreGetGroupSize, (MX_handle, Ref{Cint}), self, ref_size) + return Int(ref_size[]) +end + +function get_rank(self :: KVStore) + ref_rank 
= Ref{Cint}(0) + @mxcall(:MXKVStoreGetRank, (MX_handle, Ref{Cint}), self, ref_rank) + return Int(ref_rank[]) +end + + +function set_updater(self :: KVStore, updater :: Function) + function updater_wrapper(index :: Cint, nd_recv :: MX_handle, nd_local :: MX_handle, ::Ptr{Void}) + updater(index, NDArray(MX_NDArrayHandle(nd_recv)), NDArray(MX_NDArrayHandle(nd_local))) + end + self.wrapper_c = cfunction(updater_wrapper, Void, (Cint, MX_handle, MX_handle, Ptr{Void})) + + @mxcall(:MXKVStoreSetUpdater, (MX_handle, Ptr{Void}, Ptr{Void}), + self, self.wrapper_c, Ptr{Void}(0)) +end + +function set_optimizer(self :: KVStore, optimizer :: AbstractOptimizer) + ref_is_worker = Ref{Cint}(0) + @mxcall(:MXKVStoreIsWorkerNode, (Ref{Cint},), ref_is_worker) + is_worker = ref_is_worker[] + + if ismatch(r"dist", string(get_type(self))) && is_worker + # TODO + else + set_updater(self, get_updater(optimizer)) + end +end diff --git a/src/metric.jl b/src/metric.jl index 94dd97a9b911..d4f38e4545f5 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -7,7 +7,7 @@ type Accuracy <: AbstractEvalMetric Accuracy() = new(0.0, 0) end -function update!(metric :: Accuracy, label :: NDArray, pred :: NDArray) +function _update_single_output(metric :: Accuracy, labels :: NDArray, pred :: NDArray) label = copy(label) pred = copy(pred) @@ -19,9 +19,16 @@ function update!(metric :: Accuracy, label :: NDArray, pred :: NDArray) end end +function update!(metric :: Accuracy, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + @assert length(labels) == length(preds) + for i = 1:length(labels) + _update_single_output(labels[i], preds[i]) + end +end + import Base: get function get(metric :: Accuracy) - metric.acc_sum / metric.n_sample + return [(:accuracy, metric.acc_sum / metric.n_sample)] end function reset!(metric :: Accuracy) diff --git a/src/ndarray.jl b/src/ndarray.jl index 95757917bd29..0b8b4c155cc1 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -305,6 +305,9 @@ function *(arg0 :: NDArray, arg :: Real) 
ret = copy(arg0, context(arg0)) mul_to!(ret, arg) end +function *(arg0 :: Real, arg :: NDArray) + *(arg, arg0) +end function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable diff --git a/src/optimizer.jl b/src/optimizer.jl new file mode 100644 index 000000000000..eb4ca4db3b5e --- /dev/null +++ b/src/optimizer.jl @@ -0,0 +1,76 @@ +abstract AbstractOptimizer + +abstract AbstractLearningRateScheduler +abstract AbstractMomentumScheduler + +type FixedLearningRateScheduler <: AbstractLearningRateScheduler + learning_rate :: Float64 +end +get_learning_rate(self :: FixedLearningRateScheduler, iter :: Int) = self.learning_rate + +type NullMomentumScheduler <: AbstractMomentumScheduler +end +get_momentum(self :: NullMomentumScheduler, iter :: Int) = 0.0 + +type FixedMomentumScheduler <: AbstractMomentumScheduler + momentum :: Float64 +end +get_momentum(self :: FixedMomentumScheduler, iter :: Int) = self.momentum + +type SGD <: AbstractOptimizer + iter :: Int + + lr_scheduler :: AbstractLearningRateScheduler + mom_scheduler :: AbstractMomentumScheduler + weight_decay :: Float64 + grad_scale :: Float64 + grad_clip :: Float64 + inv_batch_size:: Float64 + + function SGD(;lr_scheduler::AbstractLearningRateScheduler=FixedLearningRateScheduler(0.01), + mom_scheduler::AbstractMomentumScheduler=NullMomentumScheduler(), + weight_decay::Float64=0.0001, + grad_scale::Float64=1.0, + clip_grad::Float64=0.0) + new(0, lr_scheduler, mom_scheduler, weight_decay, grad_scale, grad_clip, 1.0) + end +end + +function create_state(self :: SGD, index :: Int, weight :: NDArray) + if isa(self.mom_scheduler, NullMomentumScheduler) + return nothing + else + return zeros(size(weight), context(weight)) + end +end + +function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Union{Void, NDArray}) + lr = get_learning_rate(self.lr_scheduler, self.iter) + grad_scale = self.grad_scale * self.inv_batch_size + + if isa(state, Void) + @inplace weight += -lr 
* (grad_scale * grad + self.weight_decay * weight) + else + mom = state :: NDArray + coef = get_momentum(self.mom_scheduler, self.iter) + @inplace mom .*= coef + if self.clip_gradient > 0 + # TODO: + else + @inplace mom += -lr * (grad_scale * grad + self.weight_decay * weight) + end + @inplace weight += mom + end +end + + +function get_updater(optimizer :: AbstractOptimizer) + states = Dict{Int,Any}() + function updater(index :: Int, grad :: NDArray, weight :: NDArray) + if !haskey(states, index) + states[index] = create_state(optimizer, index, weight) + end + update(optimizer, index, weight, grad, states[index]) + end + return updater +end diff --git a/src/symbol.jl b/src/symbol.jl index a352173b7a43..b97e7a7594c8 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -111,10 +111,11 @@ macro _infer_shape(self, keys, indptr, sdata) function build_shapes(shape_size::MX_uint, shape_ndim::Ptr{MX_uint}, shape_data::Ptr{Ptr{MX_uint}}) shape_ndim = pointer_to_array(shape_ndim, shape_size) shape_data = pointer_to_array(shape_data, shape_size) - map(1:shape_size) do i + shapes = map(1:shape_size) do i my_shape = pointer_to_array(shape_data[i], shape_ndim[i]) tuple(flipdim(Int[my_shape...],1)...) 
end + convert(Vector{Tuple}, shapes) end return ( build_shapes(ref_arg_shape_size[], ref_arg_shape_ndim[], ref_arg_shape_data[]), diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 1ac65ae78464..0e9e33f12244 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -10,22 +10,23 @@ function test_mnist() mnist_provider = mx.MNISTProvider(image=filenames[:train_data], label=filenames[:train_label], batch_size=batch_size, silent=true, shuffle=false) - spec = mx.provides(mnist_provider) - spec = Dict(spec) - @test haskey(spec, :data) - @test haskey(spec, :softmax_label) - @test spec[:data] == (28,28,1,batch_size) - @test spec[:softmax_label] == (batch_size,) + data_spec = mx.provide_data(mnist_provider) + label_spec = mx.provide_label(mnist_provider) + @test data_spec == [(:data, (28,28,1,batch_size))] + @test label_spec == [(:softmax_label, (batch_size,))] n_batch = 0 for batch in mnist_provider if n_batch == 0 data_array = mx.empty(28,28,1,batch_size) label_array = mx.empty(batch_size) - targets = Dict(:data => [(1:batch_size, data_array)], - :softmax_label => [(1:batch_size, label_array)]) + # have to use "for i=1:1" to get over the legacy "feature" of using + # [ ] to do concatenation in Julia + data_targets = [[(1:batch_size, data_array)] for i = 1:1] + label_targets = [[(1:batch_size, label_array)] for i = 1:1] - mx.load_data!(batch, targets) + mx.load_data!(batch, data_targets) + mx.load_label!(batch, label_targets) true_labels = [5,0,4,1,9,2,1,3,1,4] # the first 10 labels in MNIST train got_labels = Int[copy(label_array)...] 
From 8a0a43bcfd5afcd7b5972fb23718cde9019c2777 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 17 Oct 2015 14:07:27 -0400 Subject: [PATCH 062/630] fix initializers --- src/MXNet.jl | 1 + src/estimator.jl | 11 ++++++----- src/initializer.jl | 31 ++++++++++++++++--------------- src/optimizer.jl | 2 +- 4 files changed, 24 insertions(+), 21 deletions(-) diff --git a/src/MXNet.jl b/src/MXNet.jl index cd96b3573af5..cfa56b21d292 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -20,6 +20,7 @@ include("executor.jl") include("metric.jl") include("optimizer.jl") +include("initializer.jl") include("io.jl") include("kvstore.jl") diff --git a/src/estimator.jl b/src/estimator.jl index b3bd67e19bf4..5aa0446cbff1 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -23,7 +23,7 @@ end function _split_inputs(batch_size :: Int, n_split :: Int) @assert(batch_size >= n_split) per_split = floor(Int, batch_size / n_split) - counts = zeros(Int, n_split)+per_split + counts = Base.zeros(Int, n_split)+per_split extra = batch_size - sum(counts) counts[1:extra] += 1 @@ -41,7 +41,7 @@ function FeedForward(arch :: Symbol; context :: Union{Context, Vector{Context}, FeedForward(arch, context) end -function _init_params(self :: FeedForward, data :: AbstractDataProvider) +function _init_params(self :: FeedForward, data :: AbstractDataProvider, initializer) # all arg names, including data, label, and parameters arg_names = list_arguments(self.arch) @@ -64,10 +64,10 @@ function _init_params(self :: FeedForward, data :: AbstractDataProvider) # initialize the contents of the parameters for (k,v) in self.arg_params - self.initializer(k, v) + initializer(k, v) end for (k,v) in self.aux_params - self.initializer(k, v) + initializer(k, v) end return (param_names, aux_names) @@ -98,6 +98,7 @@ function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params : end function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; + initializer :: 
AbstractInitializer = UniformInitializer(0.01), epoch_stop :: Int = 10, epoch_start :: Int = 1, eval_data :: Union{Void, AbstractDataProvider} = nothing, eval_metric :: AbstractEvalMetric = Accuracy(), @@ -111,7 +112,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # initialize parameters info("Initializing parameters...") - param_names, aux_names = _init_params(self, param_names, aux_names) + param_names, aux_names = _init_params(self, data, initializer) # setup kvstore if isa(kvstore, Base.Symbol) diff --git a/src/initializer.jl b/src/initializer.jl index 5a3dc5ef005c..502baf2189e1 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -1,34 +1,34 @@ abstract AbstractInitializer -function call(self :: AbstractInitializer, name :: Symbol, array :: NDArray) - name = string(name) - if endswith(name, "bias") +function call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + strname = string(name) + if endswith(strname, "bias") _init_bias(self, name, array) - elseif endswith(name, "gamma") + elseif endswith(strname, "gamma") _init_gamma(self, name, array) - elseif endswith(name, "beta") + elseif endswith(strname, "beta") _init_beta(self, name, array) - elseif endswith(name, "weight") + elseif endswith(strname, "weight") _init_weight(self, name, array) - elseif endswith(name, "moving_mean") + elseif endswith(strname, "moving_mean") _init_zero(self, name, array) - elseif endswith(name, "moving_var") + elseif endswith(strname, "moving_var") _init_zero(self, name, array) else _init_default(self, name, array) end end -function _init_bias(self :: AbstractInitializer, name :: Symbol, array :: NDArray) +function _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) array[:] = 0 end -function _init_gamma(self :: AbstractInitializer, name :: Symbol, array :: NDArray) +function _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) array[:] = 1 end -function 
_init_beta(self :: AbstractInitializer, name :: Symbol, array :: NDArray) +function _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) array[:] = 0 end -function _init_zero(self :: AbstractInitializer, name :: Symbol, array :: NDArray) +function _init_zero(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) array[:] = 0 end @@ -37,7 +37,7 @@ immutable UniformInitializer <: AbstractInitializer end UniformInitializer() = UniformInitializer(0.07) -function _init_weight(self :: UniformInitializer, name :: Symbol, array :: NDArray) +function _init_weight(self :: UniformInitializer, name :: Base.Symbol, array :: NDArray) rand!(-self.scale, self.scale, array) end @@ -47,13 +47,14 @@ immutable NormalInitializer <: AbstractInitializer end NormalInitializer(; mu=0, sigma=0.01) = NormalInitializer(mu, sigma) -function _init_weight(self :: NormalInitializer, name :: Symbol, array :: NDArray) +function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) randn!(self.μ, self.σ, array) end immutable XaiverInitializer <: AbstractInitializer end -function _init_weight(self :: NormalInitializer, name :: Symbol, array :: NDArray) + +function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) dims = size(array) fan_in = prod(dims[2:end]) fan_out = dims[1] diff --git a/src/optimizer.jl b/src/optimizer.jl index eb4ca4db3b5e..050a752f0ad7 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -31,7 +31,7 @@ type SGD <: AbstractOptimizer mom_scheduler::AbstractMomentumScheduler=NullMomentumScheduler(), weight_decay::Float64=0.0001, grad_scale::Float64=1.0, - clip_grad::Float64=0.0) + grad_clip::Float64=0.0) new(0, lr_scheduler, mom_scheduler, weight_decay, grad_scale, grad_clip, 1.0) end end From 92ec4997b6f166555f28190883a466a9f89538e4 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 17 Oct 2015 14:22:21 -0400 Subject: [PATCH 063/630] fix executor --- src/estimator.jl | 3 ++- 
src/executor.jl | 12 ++++++------ 2 files changed, 8 insertions(+), 7 deletions(-) diff --git a/src/estimator.jl b/src/estimator.jl index 5aa0446cbff1..794db739ff9c 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -123,7 +123,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra train_execs = Array(Executor, num_dev) for i = 1:num_dev data_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)] - train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=GRAD_WRITE, data_shapes...) + label_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)] + train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=GRAD_WRITE, data_shapes..., label_shapes...) end # set up input data structures diff --git a/src/executor.jl b/src/executor.jl index 6ddcff91efea..82b10f8982bc 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -96,14 +96,14 @@ function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_W @assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") arg_arrays = NDArray[zeros(shape, ctx) for shape in arg_shapes] + arg_names = list_arguments(self) if grad_req == GRAD_NOP grad_arrays = nothing else - grad_arrays = Dict{Base.Symbol, NDArray} - provided_data_names = keys(kwargs) - for (name, shape) in zip(list_arguments(self), grad_shapes) - # TODO: use a better way to identify data - #if !(endswith(string(name), "data") || endswith(string(name), "label")) + provided_data_names = [x[1] for x in kwargs] + grad_arrays = Dict{Base.Symbol,NDArray}() + for (name, shape) in zip(arg_names, grad_shapes) + # if not in provided data, should be parameters if !in(name, provided_data_names) grad_arrays[name] = zeros(shape, ctx) end @@ -111,7 +111,7 @@ function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_W end aux_arrays = [zeros(shape, ctx) for shape in aux_shapes] - return bind(self, ctx, 
arg_ndarrays, grad_arrays, grad_req, aux_arrays) + return bind(self, ctx, arg_arrays, args_grad=grad_arrays, grad_req=grad_req, aux_states=aux_arrays) end From 8c0e465e7c621dc029273da6073f32871b7c52dd Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 17 Oct 2015 15:44:11 -0400 Subject: [PATCH 064/630] bug fix --- src/context.jl | 4 ++++ src/estimator.jl | 42 ++++++++++++++++++++---------------------- src/executor.jl | 4 ++-- src/io.jl | 19 ++++++++++--------- src/metric.jl | 4 ++-- src/ndarray.jl | 4 ++++ src/optimizer.jl | 2 +- 7 files changed, 43 insertions(+), 36 deletions(-) diff --git a/src/context.jl b/src/context.jl index 3dbf7e6e482a..4a9f4667d4cf 100644 --- a/src/context.jl +++ b/src/context.jl @@ -9,6 +9,10 @@ end Context(dev_type :: Union{CONTEXT_TYPE, Integer}, dev_id :: Integer = 0) = Context(convert(CONTEXT_TYPE, dev_type), convert(Cint, dev_id), Nullable{Context}()) +function Base.show(io :: IO, ctx :: Context) + print(io, "$(ctx.device_type)$(ctx.device_id))") +end + # global default context DEFAULT_CONTEXT = Context(CPU) diff --git a/src/estimator.jl b/src/estimator.jl index 794db739ff9c..e0f2fbc7a6ac 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -11,11 +11,6 @@ type FeedForward <: AbstractEstimator FeedForward(arch :: Symbol, ctx :: Vector{Context}) = new(arch, ctx) end -function _check_arguments(symbol :: Symbol) - arg_names = list_arguments(symbol) - @assert(length(unique(arg_names)) == length(arg_names), "Duplicated names in arguments $arg_names") -end - """Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that piece. @@ -53,7 +48,7 @@ function _init_params(self :: FeedForward, data :: AbstractDataProvider, initial param_names = setdiff(arg_names, data_names ∪ label_names) aux_names = list_auxiliary_states(self.arch) - arg_shapes, grad_shapes, aux_shapes = infer_shape(self.arch; data_shapes...) 
+ arg_shapes, out_shapes, aux_shapes = infer_shape(self.arch; data_shapes...) if !isdefined(self, :arg_params) param_name_shapes = filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) self.arg_params = Dict([name => empty(shape) for (name,shape) in param_name_shapes]) @@ -70,7 +65,7 @@ function _init_params(self :: FeedForward, data :: AbstractDataProvider, initial initializer(k, v) end - return (param_names, aux_names) + return (arg_names, param_names, aux_names) end function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) @@ -112,7 +107,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # initialize parameters info("Initializing parameters...") - param_names, aux_names = _init_params(self, data, initializer) + arg_names, param_names, aux_names = _init_params(self, data, initializer) # setup kvstore if isa(kvstore, Base.Symbol) @@ -128,21 +123,23 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end # set up input data structures - data_names = [x[1] for x in provide_data(data)] - label_names = [x[1] for x in provide_label(data)] + data_names = [x[1] for x in provide_data(data)] + label_names = [x[1] for x in provide_label(data)] + + data_arrays = [SlicedNDArray[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] + for name in data_names] + label_arrays = [SlicedNDArray[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] + for name in label_names] - data_arrays = Vector{NDArray}[[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] - for name in data_names] - label_arrays = Vector{NDArray}[[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] - for name in label_names] + param_idx = filter(i -> in(arg_names[i], param_names), 1:length(arg_names)) - param_arrays = Vector{NDArray}[[exec.arg_arrays[i] for exec in train_execs] for i = 1:length(param_names)] - 
grad_arrays = Vector{NDArray}[[exec.grad_arrays[i] for exec in train_execs] for i = 1:length(param_names)] + param_arrays = [NDArray[exec.arg_arrays[i] for exec in train_execs] for i in param_idx] + grad_arrays = [NDArray[exec.grad_arrays[i] for exec in train_execs] for i in param_idx] optimizer.inv_batch_size = 1.0/batch_size if !update_on_kvstore - updater = get_updater(self.optimizer) + updater = get_updater(optimizer) end if !isa(kvstore, Void) @@ -150,6 +147,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra set_optimizer(kvstore, optimizer) end + info("Initializing KVStore...") # init kv with gradients for idx = 1:length(param_arrays) param_on_devs = param_arrays[idx] @@ -167,7 +165,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra cpu_dev = Context(CPU) cpu_output_arrays = [empty(shape, cpu_dev) for shape in output_shapes] cpu_label_arrays = [empty(shape, cpu_dev) for (name,shape) in provide_label(data)] - cpu_label_arrays_full_slice = [(1:batch_size, x) for x in label_arrays] + cpu_label_arrays_full_slice = [SlicedNDArray[(1:batch_size, x)] for x in cpu_label_arrays] # now start training... 
for i_epoch = epoch_start:epoch_stop @@ -226,12 +224,12 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end # end of one epoch time_stop = time() - info("== Epoch {1:0>3d} ==========", i_epoch) + info(format("== Epoch {1:0>3d} ==========", i_epoch)) info("## Training summary") for (name, value) in get(eval_metric) - info("{1>15s} = {2:.4f}", name, value) + info(format("{1:>15s} = {2:.4f}", name, value)) end - info("{1>15s} = {2:.2f} seconds", "time", (time_stop-time_start)/1e9) + info(format("{1:>15s} = {2:.2f} seconds", "time", (time_stop-time_start)/1e9)) # evaluation on validation set if !isa(eval_data, Void) @@ -259,7 +257,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra info("## Validation summary") for (name, value) in get(eval_metric) - info("{1>15s} = {2:.4f}", name, value) + info(format("{1:>15s} = {2:.4f}", name, value)) end end end # end of all epochs diff --git a/src/executor.jl b/src/executor.jl index 82b10f8982bc..94aabba5ddd5 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -92,7 +92,7 @@ function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict end function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) - arg_shapes, grad_shapes, aux_shapes = infer_shape(self; kwargs...) + arg_shapes, out_shapes, aux_shapes = infer_shape(self; kwargs...) 
@assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") arg_arrays = NDArray[zeros(shape, ctx) for shape in arg_shapes] @@ -102,7 +102,7 @@ function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_W else provided_data_names = [x[1] for x in kwargs] grad_arrays = Dict{Base.Symbol,NDArray}() - for (name, shape) in zip(arg_names, grad_shapes) + for (name, shape) in zip(arg_names, arg_shapes) # if not in provided data, should be parameters if !in(name, provided_data_names) grad_arrays[name] = zeros(shape, ctx) diff --git a/src/io.jl b/src/io.jl index 834e7ad755a4..5587fbc97575 100644 --- a/src/io.jl +++ b/src/io.jl @@ -57,21 +57,22 @@ abstract AbstractDataProvider """Root type for states of data provider""" abstract AbstractDataProviderState -"""A list of (slice, NDArray) pairs. Usually each NDArray resides on a different device, and each +"""A tuple of (slice, NDArray). Usually each NDArray resides on a different device, and each slice describe which part of a larger piece of data should goto that device. """ -typealias SlicedNDArray Vector{Tuple{UnitRange{Int},NDArray}} +typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} """Root type for data batch A data batch must implement the following interface function to actually provide the data and label. - load_data!(batch :: AbstractDataBatch, targets :: Vector{SlicedNDArray}) - load_label!(batch :: AbstractDataBatch, targets :: Vector{SlicedNDArray}) + load_data!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) + load_label!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - Load data and label into targets. The target is a list of `SlicedNDArray` the data/label should be + Load data and label into targets. The targets is a list of target that the data/label should be copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and - `provide_label`. + `provide_label`. 
Each entry in the list is again a list of `SlicedNDArray`, corresponding the + memory buffer for each device. The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. @@ -165,7 +166,7 @@ function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) return (MXDataBatch(provider), state) end -function _load_general!(batch :: MXDataBatch, loader :: Function, targets :: Vector{SlicedNDArray}) +function _load_general!(batch :: MXDataBatch, loader :: Function, targets :: Vector{Vector{SlicedNDArray}}) @assert length(targets) == 1 src = loader(batch.provider.handle) for (idx, target) in targets[1] @@ -173,10 +174,10 @@ function _load_general!(batch :: MXDataBatch, loader :: Function, targets :: Vec end end -function load_data!(batch :: MXDataBatch, targets :: Vector{SlicedNDArray}) +function load_data!(batch :: MXDataBatch, targets :: Vector{Vector{SlicedNDArray}}) _load_general!(batch, _get_data, targets) end -function load_label!(batch :: MXDataBatch, targets :: Vector{SlicedNDArray}) +function load_label!(batch :: MXDataBatch, targets :: Vector{Vector{SlicedNDArray}}) _load_general!(batch, _get_label, targets) end diff --git a/src/metric.jl b/src/metric.jl index d4f38e4545f5..99cdc96a94db 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -7,7 +7,7 @@ type Accuracy <: AbstractEvalMetric Accuracy() = new(0.0, 0) end -function _update_single_output(metric :: Accuracy, labels :: NDArray, pred :: NDArray) +function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) label = copy(label) pred = copy(pred) @@ -22,7 +22,7 @@ end function update!(metric :: Accuracy, labels :: Vector{NDArray}, preds :: Vector{NDArray}) @assert length(labels) == length(preds) for i = 1:length(labels) - _update_single_output(labels[i], preds[i]) + _update_single_output(metric, labels[i], preds[i]) end end diff --git a/src/ndarray.jl b/src/ndarray.jl index 0b8b4c155cc1..cd23eb59cc98 100644 --- a/src/ndarray.jl +++ 
b/src/ndarray.jl @@ -40,6 +40,10 @@ type NDArray end end +function Base.show(io :: IO, arr :: NDArray) + print(io, "mx.NDArray$(size(arr))") +end + function NDArray{T<:Real}(data :: Array{T}) copy(data, mx.DEFAULT_CONTEXT) end diff --git a/src/optimizer.jl b/src/optimizer.jl index 050a752f0ad7..191fc6a855c2 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -54,7 +54,7 @@ function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, s mom = state :: NDArray coef = get_momentum(self.mom_scheduler, self.iter) @inplace mom .*= coef - if self.clip_gradient > 0 + if self.grad_clip > 0 # TODO: else @inplace mom += -lr * (grad_scale * grad + self.weight_decay * weight) From 614de3a40ea0b9687a6d47a763d05668c0856e11 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 17 Oct 2015 16:27:13 -0400 Subject: [PATCH 065/630] mnist mlp example --- examples/mnist/mlp.jl | 33 +++++++++++++++++++++++++++++++++ src/estimator.jl | 4 +++- src/metric.jl | 1 + test/unittest/ndarray.jl | 16 ++++++++++++++++ 4 files changed, 53 insertions(+), 1 deletion(-) create mode 100644 examples/mnist/mlp.jl diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl new file mode 100644 index 000000000000..88e4dade744a --- /dev/null +++ b/examples/mnist/mlp.jl @@ -0,0 +1,33 @@ +using MXNet + +# define MLP +data = mx.variable(:data) +fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) +act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) +fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) +act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) +fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) +mlp = mx.Softmax(data = fc3, name=:softmax) + +# download MNIST into Pkg.dir("MXNet")/data/mnist if not exist +filenames = mx.get_mnist_ubyte() + +# data provider +batch_size = 100 +train_provider = mx.MNISTProvider(image=filenames[:train_data], + label=filenames[:train_label], + batch_size=batch_size, shuffle=true, flat=true) 
+eval_provider = mx.MNISTProvider(image=filenames[:test_data], + label=filenames[:test_label], + batch_size=batch_size, shuffle=false, flat=true) + +# setup estimator +estimator = mx.FeedForward(mlp, context=mx.Context(mx.CPU)) + +# optimizer +optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.1), + mom_scheduler=mx.FixedMomentumScheduler(0.9), + weight_decay=0.00001) + +# fit parameters +mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) diff --git a/src/estimator.jl b/src/estimator.jl index e0f2fbc7a6ac..c4e4859bcfc4 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -120,6 +120,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra data_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)] label_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)] train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=GRAD_WRITE, data_shapes..., label_shapes...) 
+ + copy_params_from(train_execs[i], self.arg_params, self.aux_params) end # set up input data structures @@ -229,7 +231,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra for (name, value) in get(eval_metric) info(format("{1:>15s} = {2:.4f}", name, value)) end - info(format("{1:>15s} = {2:.2f} seconds", "time", (time_stop-time_start)/1e9)) + info(format("{1:>15s} = {2:.4f} seconds", "time", time_stop-time_start)) # evaluation on validation set if !isa(eval_data, Void) diff --git a/src/metric.jl b/src/metric.jl index 99cdc96a94db..59acb529a9a7 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -16,6 +16,7 @@ function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDA for i = 1:n_sample klass = indmax(sub(pred,:,i)) metric.acc_sum += (klass-1) == label[i] + #println("$(sub(pred,:,i)) $(klass-1) <=> $(label[i])") end end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 04fc3a632204..d547159af1e2 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -160,6 +160,21 @@ function test_div() @test reldiff(t2./scalar, copy(a2./scalar)) < 1e-6 end +function test_gd() + dims = rand_dims() + tw, aw = rand_tensors(dims) + tg, ag = rand_tensors(dims) + + info("NDArray::gd::dims = $dims") + + lr = rand() + wd = rand() + + @mx.inplace aw += -lr * (ag + wd * aw) + tw += -lr * (tg + wd * tw) + @test reldiff(copy(aw), tw) < 1e-6 +end + ################################################################################ # Run tests @@ -171,5 +186,6 @@ test_plus() test_minus() test_mul() test_div() +test_gd() end From 61fa00c8ad58d368c59a4bef5d69dbbead985ef9 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 17 Oct 2015 16:51:02 -0400 Subject: [PATCH 066/630] lenet example (not tested) --- examples/mnist/lenet.jl | 48 ++++++++++++++++++++++++++++++++++++ examples/mnist/mlp.jl | 8 ++---- examples/mnist/mnist-data.jl | 16 ++++++++++++ 3 files changed, 66 insertions(+), 6 deletions(-) create 
mode 100644 examples/mnist/lenet.jl create mode 100644 examples/mnist/mnist-data.jl diff --git a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl new file mode 100644 index 000000000000..7efe4c42eedc --- /dev/null +++ b/examples/mnist/lenet.jl @@ -0,0 +1,48 @@ +using MXNet + +#-------------------------------------------------------------------------------- +# define lenet + +# input +data = mx.variable(:data) + +# first conv +conv1 = mx.Convolution(data=data, kernel=(5,5), num_filter=20) +tanh1 = mx.Activation(data=conv1, act_type=:tanh) +pool1 = mx.Pooling(data=tanh1, pool_type=:max, kernel=(2,2), stride=(2,2)) + +# second conv +conv2 = mx.Convolution(data=pool1, kernel=(5,5), num_filter=50) +tanh2 = mx.Activation(data=conv2, act_type=:tanh) +pool2 = mx.Pooling(data=tanh2, pool_type=:max, kernel=(2,2), stride=(2,2)) + +# first fully-connected +flat = mx.Flatten(data=pool2) +fc1 = mx.FullyConnected(data=flat, num_hidden=500) +tanh3 = mx.Activation(data=fc1, act_type=:tanh) + +# second fully-connected +fc2 = mx.FullyConnected(data=tanh3, num_hidden=10) + +# softmax loss +lenet = mx.Softmax(data=fc2, name=:softmax) + + +#-------------------------------------------------------------------------------- +# load data +batch_size = 100 +include("mnist-data.jl") +train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) + +#-------------------------------------------------------------------------------- +# fit model +dev = mx.Context(mx.GPU) +estimator = mx.FeedForward(lenet, context=dev) + +# optimizer +optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), + mom_scheduler=mx.FixedMomentumScheduler(0.9), + weight_decay=0.00001) + +# fit parameters +mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 88e4dade744a..446869b46d31 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -14,12 +14,8 @@ filenames = mx.get_mnist_ubyte() # 
data provider batch_size = 100 -train_provider = mx.MNISTProvider(image=filenames[:train_data], - label=filenames[:train_label], - batch_size=batch_size, shuffle=true, flat=true) -eval_provider = mx.MNISTProvider(image=filenames[:test_data], - label=filenames[:test_label], - batch_size=batch_size, shuffle=false, flat=true) +include("mnist-data.jl") +train_provider, eval_provider = get_mnist_providers(batch_size) # setup estimator estimator = mx.FeedForward(mlp, context=mx.Context(mx.CPU)) diff --git a/examples/mnist/mnist-data.jl b/examples/mnist/mnist-data.jl new file mode 100644 index 000000000000..7349152617f9 --- /dev/null +++ b/examples/mnist/mnist-data.jl @@ -0,0 +1,16 @@ +function get_mnist_providers(batch_size::Int; data_name=:data, label_name=:softmax_label, flat=true) + # download MNIST into Pkg.dir("MXNet")/data/mnist if not exist + filenames = mx.get_mnist_ubyte() + + # data provider + train_provider = mx.MNISTProvider(image=filenames[:train_data], + label=filenames[:train_label], + data_name=data_name, label_name=label_name, + batch_size=batch_size, shuffle=true, flat=flat, silent=true) + eval_provider = mx.MNISTProvider(image=filenames[:test_data], + label=filenames[:test_label], + data_name=data_name, label_name=label_name, + batch_size=batch_size, shuffle=false, flat=flat, silent=true) + + return (train_provider, eval_provider) +end From 383fd98996b49fed4311cfe3b138946fcc3c4467 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 17 Oct 2015 19:07:41 -0400 Subject: [PATCH 067/630] fix kvstore closure --- src/context.jl | 2 +- src/estimator.jl | 2 +- src/init.jl | 1 + src/kvstore.jl | 26 ++++++++++++++++++-------- 4 files changed, 21 insertions(+), 10 deletions(-) diff --git a/src/context.jl b/src/context.jl index 4a9f4667d4cf..20b0c7b14ee6 100644 --- a/src/context.jl +++ b/src/context.jl @@ -1,4 +1,4 @@ -@enum CONTEXT_TYPE CPU=1 GPU=2 +@enum CONTEXT_TYPE CPU=1 GPU=2 CPU_PINNED=3 type Context device_type :: CONTEXT_TYPE diff --git 
a/src/estimator.jl b/src/estimator.jl index c4e4859bcfc4..e349ec952115 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -75,7 +75,7 @@ function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params : if kv_type == :local max_size = maximum([prod(size(param)) for (k,param) in arg_params]) if max_size < 1024 * 1024 * 16 - kv_type = :loca_update_cpu + kv_type = :local_update_cpu else kv_type = :local_allreduce_cpu end diff --git a/src/init.jl b/src/init.jl index f23d9f3b2207..fd8f57dd32f9 100644 --- a/src/init.jl +++ b/src/init.jl @@ -100,3 +100,4 @@ end @mx_define_handle_t(MX_ExecutorHandle, MXExecutorFree) @mx_define_handle_t(MX_DataIterHandle, MXDataIterFree) @mx_define_handle_t(MX_KVStoreHandle, MXKVStoreFree) + diff --git a/src/kvstore.jl b/src/kvstore.jl index 6d0642a6d2a7..562edc3d4850 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -1,15 +1,18 @@ type KVStore handle :: MX_KVStoreHandle updater_c :: Ptr{Void} + updater :: Function + + KVStore(hdr :: MX_KVStoreHandle) = new(hdr, Ptr{Void}(0)) end function KVStore(kv_type::Base.Symbol = :local) - @assert(kv_type ∈ [:local]) # TODO: update with allowed types + #@assert(kv_type ∈ [:local]) # TODO: update with allowed types ref_hdr = Ref{MX_handle}(0) kv_type = string(kv_type) @mxcall(:MXKVStoreCreate, (char_p, Ref{MX_handle}), kv_type, ref_hdr) - return KVStore(MX_KVStoreHandle(ref_hdr[]), Ptr{Void}(0)) + return KVStore(MX_KVStoreHandle(ref_hdr[])) end function Base.unsafe_convert(::Type{MX_handle}, obj::KVStore) Base.unsafe_convert(MX_handle, obj.handle) @@ -100,14 +103,21 @@ function get_rank(self :: KVStore) end +# TODO: Currently Julia does not support closure in c-callbacks, so we are making use of the +# extra handle parameter of the API to pass the updater object around. Fix this when someday +# full closure cfunction is supported in Julia. 
+function _kvstore_update_wrapper(index::Cint, nd_recv::MX_handle, nd_local::MX_handle, updater::Ptr{Void}) + x = unsafe_pointer_to_objref(updater) + updater_func = unsafe_pointer_to_objref(updater) :: Function + updater_func(Int(index), NDArray(MX_NDArrayHandle(nd_recv)), NDArray(MX_NDArrayHandle(nd_local))) + return nothing +end function set_updater(self :: KVStore, updater :: Function) - function updater_wrapper(index :: Cint, nd_recv :: MX_handle, nd_local :: MX_handle, ::Ptr{Void}) - updater(index, NDArray(MX_NDArrayHandle(nd_recv)), NDArray(MX_NDArrayHandle(nd_local))) - end - self.wrapper_c = cfunction(updater_wrapper, Void, (Cint, MX_handle, MX_handle, Ptr{Void})) + self.updater = updater # keep a reference to the julia object so that updater_c is kept valid + self.updater_c = cfunction(_kvstore_update_wrapper, Void, (Cint, MX_handle, MX_handle, Ptr{Void})) - @mxcall(:MXKVStoreSetUpdater, (MX_handle, Ptr{Void}, Ptr{Void}), - self, self.wrapper_c, Ptr{Void}(0)) + @mxcall(:MXKVStoreSetUpdater, (MX_handle, Ptr{Void}, Any), + self, self.updater_c, updater) end function set_optimizer(self :: KVStore, optimizer :: AbstractOptimizer) From 7f8612ef209a1bcc3528ee326fe9988bbb23d6b9 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 17 Oct 2015 21:50:39 -0400 Subject: [PATCH 068/630] cifar10 example (pushing to GPU server for testing) --- examples/cifar10/cifar10.jl | 86 +++++++++++++++++++++++++++++++++++++ examples/mnist/mlp.jl | 3 -- src/init.jl | 30 +++++++++++++ src/symbol.jl | 2 +- src/util.jl | 17 ++++++++ 5 files changed, 134 insertions(+), 4 deletions(-) create mode 100644 examples/cifar10/cifar10.jl diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl new file mode 100644 index 000000000000..157bee6dd777 --- /dev/null +++ b/examples/cifar10/cifar10.jl @@ -0,0 +1,86 @@ +using MXNet + +#-------------------------------------------------------------------------------- +# Helper functions to construct larger networks + +# basic Conv + BN + 
ReLU factory +function conv_factory(data, num_filter, kernel; stride=(1,1), pad=(0,0), act_type=:relu) + conv = mx.Convolution(data=data, num_filter=num_filter, kernel=kernel, stride=stride, pad=pad) + bn = mx.BatchNorm(data=conv) + act = mx.Activation(data=bn, act_type=act_type) + return act +end + +# simple downsampling factory +function downsample_factory(data, ch_3x3) + # conv 3x3 + conv = conv_factory(data, ch_3x3, (3,3), stride=(2,2), pad=(1,1)) + # pool + pool = mx.Pooling(data=data, kernel=(3,3), stride=(2,2), pool_type=:max) + # concat + concat = mx.Concat(conv, pool) + return concat +end + +# a simple module +function simple_factory(data, ch_1x1, ch_3x3) + # 1x1 + conv1x1 = conv_factory(data, ch_1x1, (1,1); pad=(0,0)) + # 3x3 + conv3x3 = conv_factory(data, ch_3x3, (3,3); pad=(1,1)) + # concat + concat = mx.Concat(conv1x1, conv3x3) + return concat +end + + +#-------------------------------------------------------------------------------- +# Actual architecture +data = mx.variable(:data) +conv1 = conv_factory(data, 96, (3,3); pad=(1,1), act_type=:relu) +in3a = simple_factory(conv1, 32, 32) +in3b = simple_factory(in3a, 32, 48) +in3c = downsample_factory(in3b, 80) +in4a = simple_factory(in3c, 112, 48) +in4b = simple_factory(in4a, 96, 64) +in4c = simple_factory(in4b, 80, 80) +in4d = simple_factory(in4b, 48, 96) +in4e = downsample_factory(in4d, 96) +in5a = simple_factory(in4e, 176, 160) +in5b = simple_factory(in5a, 176, 160) +pool = mx.Pooling(data=in5b, pool_type=:avg, kernel=(7,7), name=:global_pool) +flatten = mx.Flatten(data=pool, name=:flatten1) +fc = mx.FullyConnected(data=flatten, num_hidden=10, name=:fc1) +softmax = mx.Softmax(data=fc, name=:loss) + + +#-------------------------------------------------------------------------------- +# Prepare data +filenames = get_cifar10() +batch_size = 128 +num_epoch = 10 +num_gpus = 1 + +train_provider = mx.ImageRecordProvider(label_name=:loss_label, + path_imgrec=filenames[:train], mean_img=filenames[:mean], + 
rand_crop=true, rand_mirror=true, data_shape=(28,28,3), + batch_size=batch_size, preprocess_threads=1) +test_provider = mx.ImageRecordProvider(label_name=:loss_label, + path_imgrec=filenames[:test], mean_img=filenames[:mean], + rand_crop=false, rand_mirror=false, data_shape=(28,28,3), + batch_size=batch_size, preprocess_threads=1) + + +#-------------------------------------------------------------------------------- +# Training model +gpus = [mx.Context(GPU, i) for i = 0:num_gpus-1] +estimator = mx.FeedForward(softmax, context=gpus) + +# optimizer +optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), + mom_scheduler=mx.FixedMomentumScheduler(0.9), + weight_decay=0.0001) + +# fit parameters +mx.fit(estimator, optimizer, train_provider, epoch_stop=num_epoch, eval_data=eval_provider, + initializer=mx.UniformInitializer(0.07)) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 446869b46d31..c2d30235e0f6 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -9,9 +9,6 @@ act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) mlp = mx.Softmax(data = fc3, name=:softmax) -# download MNIST into Pkg.dir("MXNet")/data/mnist if not exist -filenames = mx.get_mnist_ubyte() - # data provider batch_size = 100 include("mnist-data.jl") diff --git a/src/init.jl b/src/init.jl index fd8f57dd32f9..ac858f926c62 100644 --- a/src/init.jl +++ b/src/init.jl @@ -101,3 +101,33 @@ end @mx_define_handle_t(MX_DataIterHandle, MXDataIterFree) @mx_define_handle_t(MX_KVStoreHandle, MXKVStoreFree) +################################################################################ +# MXNet Params +# +# MXNet API use string to pass some common parameters like the configurations +# when defining layers. Typically, it is enough to use string(obj) to get a +# recognizable representation for libmxnet. However, there is currently a +# caveat: +# +# Because Julia use column-major ordering for tensors. 
In order to properly +# interact with Julia Arrays, the shape will look "reversed" from the Julia +# side. For example, a typical MNIST mini-batch tensor is of shape (28,28,1,100) +# from Julia side, while the shape information for the same piece of memory +# should be interpreted as (100,1,28,28) from C/C++/Python side. +# +# Therefore, when passing parameters to libmxnet, we should reverse the shape +# parameter. For example, when the user specify a non-square kernel size for +# a convolution or pooling layer. Unfortunately, those operators are automatically +# imported, and information about the type of each parameter is somehow limited. +# One hacky way is to match the type description for the string "Shape(tuple)" +# when importing operators. But currently we simply decided to reverse **all** +# NTuple{N, Int} passed to libmxnet. +# +# TODO: find a better solution in case this cause issues in the future. +################################################################################ +function dump_mx_param(val :: Any) + string(val) +end +function dump_mx_param{N,T<:Integer}(shape :: NTuple{N, T}) + string(tuple(flipdim([shape...],1)...)) +end diff --git a/src/symbol.jl b/src/symbol.jl index b97e7a7594c8..0a6204d40789 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -285,7 +285,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) symbol_kws[k] = v else push!(param_keys, string(k)) - push!(param_vals, string(v)) + push!(param_vals, dump_mx_param(v)) end end diff --git a/src/util.jl b/src/util.jl index 48a55348049e..b85787649c37 100644 --- a/src/util.jl +++ b/src/util.jl @@ -21,3 +21,20 @@ function get_mnist_ubyte() end return filenames end + +function get_cifar10() + data_dir = get_data_dir() + cifar10_dir = joinpath(data_dir, "cifar10") + mkpath(cifar10_dir) + filenames = Dict(:train => "train.rec", :test => "test.rec") + filenames = [k => joinpath(cifar10_dir, v) for (k,v) in filenames] + if !all(isfile, values(filenames)) + cd(cifar10_dir) do + 
run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/cifar10.zip`) + run(`unzip -u cifar10.zip`) + end + end + + filenames[:mean] = joinpath(cifar10_dir, "cifar_mean.bin") + return filenames +end From edf087194938ed87b5c47e1fa2ac4a10ebe2556d Mon Sep 17 00:00:00 2001 From: pluskid Date: Sat, 17 Oct 2015 22:21:30 -0400 Subject: [PATCH 069/630] working cifar10 example --- examples/cifar10/cifar10.jl | 8 ++++---- src/context.jl | 2 +- src/io.jl | 2 +- src/symbol.jl | 9 +++++---- src/util.jl | 4 ++-- 5 files changed, 13 insertions(+), 12 deletions(-) diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index 157bee6dd777..9d627b0471c2 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -56,10 +56,10 @@ softmax = mx.Softmax(data=fc, name=:loss) #-------------------------------------------------------------------------------- # Prepare data -filenames = get_cifar10() +filenames = mx.get_cifar10() batch_size = 128 num_epoch = 10 -num_gpus = 1 +num_gpus = 8 train_provider = mx.ImageRecordProvider(label_name=:loss_label, path_imgrec=filenames[:train], mean_img=filenames[:mean], @@ -73,7 +73,7 @@ test_provider = mx.ImageRecordProvider(label_name=:loss_label, #-------------------------------------------------------------------------------- # Training model -gpus = [mx.Context(GPU, i) for i = 0:num_gpus-1] +gpus = [mx.Context(mx.GPU, i) for i = 0:num_gpus-1] estimator = mx.FeedForward(softmax, context=gpus) # optimizer @@ -82,5 +82,5 @@ optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), weight_decay=0.0001) # fit parameters -mx.fit(estimator, optimizer, train_provider, epoch_stop=num_epoch, eval_data=eval_provider, +mx.fit(estimator, optimizer, train_provider, epoch_stop=num_epoch, eval_data=test_provider, initializer=mx.UniformInitializer(0.07)) diff --git a/src/context.jl b/src/context.jl index 20b0c7b14ee6..06062500be6c 100644 --- a/src/context.jl +++ b/src/context.jl @@ -10,7 +10,7 @@ Context(dev_type :: 
Union{CONTEXT_TYPE, Integer}, dev_id :: Integer = 0) = Context(convert(CONTEXT_TYPE, dev_type), convert(Cint, dev_id), Nullable{Context}()) function Base.show(io :: IO, ctx :: Context) - print(io, "$(ctx.device_type)$(ctx.device_id))") + print(io, "$(ctx.device_type)$(ctx.device_id)") end diff --git a/src/io.jl b/src/io.jl index 5587fbc97575..cf618be3e4a4 100644 --- a/src/io.jl +++ b/src/io.jl @@ -204,7 +204,7 @@ function _define_data_iter_creator(hdr :: MX_handle) defun = quote function $iter_name(; kwargs...) arg_keys = AbstractString[string(k) for (k,v) in kwargs] - arg_vals = AbstractString[string(v) for (k,v) in kwargs] + arg_vals = AbstractString[dump_mx_param(v) for (k,v) in kwargs] ref_hdr = Ref{MX_handle}(0) @mxcall(:MXDataIterCreateIter, (MX_handle, MX_uint, char_pp, char_pp, Ref{MX_handle}), diff --git a/src/symbol.jl b/src/symbol.jl index 0a6204d40789..85799d524c51 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -253,8 +253,9 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) Ref{char_pp}, Ref{char_p}), hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, ref_kv_nargs) - func_name = symbol(bytestring(ref_name[])) - kv_nargs = symbol(bytestring(ref_kv_nargs[])) + func_name = symbol(bytestring(ref_name[])) + kv_nargs_s = bytestring(ref_kv_nargs[]) + kv_nargs = symbol(kv_nargs_s) # function $func_name(args...; kwargs...) 
func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) @@ -272,8 +273,8 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) $(if kv_nargs != symbol("") quote - if !in("$kv_narg", param_keys) - push!(param_keys, string("$kv_nargs")) + if !in($kv_nargs_s, param_keys) + push!(param_keys, $kv_nargs_s) push!(param_vals, string(length(args))) end end diff --git a/src/util.jl b/src/util.jl index b85787649c37..4a331fcbfec1 100644 --- a/src/util.jl +++ b/src/util.jl @@ -26,7 +26,7 @@ function get_cifar10() data_dir = get_data_dir() cifar10_dir = joinpath(data_dir, "cifar10") mkpath(cifar10_dir) - filenames = Dict(:train => "train.rec", :test => "test.rec") + filenames = Dict(:train => "cifar/train.rec", :test => "cifar/test.rec") filenames = [k => joinpath(cifar10_dir, v) for (k,v) in filenames] if !all(isfile, values(filenames)) cd(cifar10_dir) do @@ -35,6 +35,6 @@ function get_cifar10() end end - filenames[:mean] = joinpath(cifar10_dir, "cifar_mean.bin") + filenames[:mean] = joinpath(cifar10_dir, "cifar/cifar_mean.bin") return filenames end From aa18e9880436a496c020e8600268bba4e60efdc7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 19 Oct 2015 15:30:54 -0400 Subject: [PATCH 070/630] basic doc building setup --- docs/build.jl | 8 ++++++++ src/init.jl | 2 -- src/ndarray.jl | 2 -- 3 files changed, 8 insertions(+), 4 deletions(-) create mode 100644 docs/build.jl diff --git a/docs/build.jl b/docs/build.jl new file mode 100644 index 000000000000..d6a4ec9ef5d5 --- /dev/null +++ b/docs/build.jl @@ -0,0 +1,8 @@ +using MXNet +using Lexicon + +config = Config(md_permalink = false, mathjax = true) + +index = save("api/MXNet.md", MXNet.mx, config) +save("api/index.md", Index([index]), config; md_subheader = :category) + diff --git a/src/init.jl b/src/init.jl index ac858f926c62..2c4239ce8d25 100644 --- a/src/init.jl +++ b/src/init.jl @@ -1,5 +1,3 @@ -export MXError - "Exception thrown when an error occurred calling MXNet API." 
immutable MXError <: Exception msg :: AbstractString diff --git a/src/ndarray.jl b/src/ndarray.jl index cd23eb59cc98..1d80dcdbdd51 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,5 +1,3 @@ -export NDArray - # create a NDArray handle of specific shape function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) h_ref = Ref{MX_handle}(0) From ff055b557b38d4fb2543d8cfa380dec11dd3c6be Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 Oct 2015 00:28:58 -0400 Subject: [PATCH 071/630] test rtd hook --- .gitignore | 1 + docs/Makefile | 192 +++++++++++++++++++++ docs/api/MXNet.md | 416 ++++++++++++++++++++++++++++++++++++++++++++++ docs/api/index.md | 81 +++++++++ docs/conf.py | 292 ++++++++++++++++++++++++++++++++ docs/index.rst | 23 +++ docs/make.bat | 263 +++++++++++++++++++++++++++++ 7 files changed, 1268 insertions(+) create mode 100644 docs/Makefile create mode 100644 docs/api/MXNet.md create mode 100644 docs/api/index.md create mode 100644 docs/conf.py create mode 100644 docs/index.rst create mode 100644 docs/make.bat diff --git a/.gitignore b/.gitignore index 2ff5c4a3d770..1b5cdca45b40 100644 --- a/.gitignore +++ b/.gitignore @@ -2,3 +2,4 @@ *.jl.*.cov *.jl.mem data +docs/_build diff --git a/docs/Makefile b/docs/Makefile new file mode 100644 index 000000000000..ce3d7abdbfaa --- /dev/null +++ b/docs/Makefile @@ -0,0 +1,192 @@ +# Makefile for Sphinx documentation +# + +# You can set these variables from the command line. +SPHINXOPTS = +SPHINXBUILD = sphinx-build +PAPER = +BUILDDIR = _build + +# User-friendly check for sphinx-build +ifeq ($(shell which $(SPHINXBUILD) >/dev/null 2>&1; echo $$?), 1) +$(error The '$(SPHINXBUILD)' command was not found. Make sure you have Sphinx installed, then set the SPHINXBUILD environment variable to point to the full path of the '$(SPHINXBUILD)' executable. Alternatively you can add the directory with the executable to your PATH. 
If you don't have Sphinx installed, grab it from http://sphinx-doc.org/) +endif + +# Internal variables. +PAPEROPT_a4 = -D latex_paper_size=a4 +PAPEROPT_letter = -D latex_paper_size=letter +ALLSPHINXOPTS = -d $(BUILDDIR)/doctrees $(PAPEROPT_$(PAPER)) $(SPHINXOPTS) . +# the i18n builder cannot share the environment and doctrees with the others +I18NSPHINXOPTS = $(PAPEROPT_$(PAPER)) $(SPHINXOPTS) . + +.PHONY: help clean html dirhtml singlehtml pickle json htmlhelp qthelp devhelp epub latex latexpdf text man changes linkcheck doctest coverage gettext + +help: + @echo "Please use \`make <target>' where <target> is one of" + @echo " html to make standalone HTML files" + @echo " dirhtml to make HTML files named index.html in directories" + @echo " singlehtml to make a single large HTML file" + @echo " pickle to make pickle files" + @echo " json to make JSON files" + @echo " htmlhelp to make HTML files and a HTML help project" + @echo " qthelp to make HTML files and a qthelp project" + @echo " applehelp to make an Apple Help Book" + @echo " devhelp to make HTML files and a Devhelp project" + @echo " epub to make an epub" + @echo " latex to make LaTeX files, you can set PAPER=a4 or PAPER=letter" + @echo " latexpdf to make LaTeX files and run them through pdflatex" + @echo " latexpdfja to make LaTeX files and run them through platex/dvipdfmx" + @echo " text to make text files" + @echo " man to make manual pages" + @echo " texinfo to make Texinfo files" + @echo " info to make Texinfo files and run them through makeinfo" + @echo " gettext to make PO message catalogs" + @echo " changes to make an overview of all changed/added/deprecated items" + @echo " xml to make Docutils-native XML files" + @echo " pseudoxml to make pseudoxml-XML files for display purposes" + @echo " linkcheck to check all external links for integrity" + @echo " doctest to run all doctests embedded in the documentation (if enabled)" + @echo " coverage to run coverage check of the documentation (if enabled)" + +clean: + rm
-rf $(BUILDDIR)/* + +html: + $(SPHINXBUILD) -b html $(ALLSPHINXOPTS) $(BUILDDIR)/html + @echo + @echo "Build finished. The HTML pages are in $(BUILDDIR)/html." + +dirhtml: + $(SPHINXBUILD) -b dirhtml $(ALLSPHINXOPTS) $(BUILDDIR)/dirhtml + @echo + @echo "Build finished. The HTML pages are in $(BUILDDIR)/dirhtml." + +singlehtml: + $(SPHINXBUILD) -b singlehtml $(ALLSPHINXOPTS) $(BUILDDIR)/singlehtml + @echo + @echo "Build finished. The HTML page is in $(BUILDDIR)/singlehtml." + +pickle: + $(SPHINXBUILD) -b pickle $(ALLSPHINXOPTS) $(BUILDDIR)/pickle + @echo + @echo "Build finished; now you can process the pickle files." + +json: + $(SPHINXBUILD) -b json $(ALLSPHINXOPTS) $(BUILDDIR)/json + @echo + @echo "Build finished; now you can process the JSON files." + +htmlhelp: + $(SPHINXBUILD) -b htmlhelp $(ALLSPHINXOPTS) $(BUILDDIR)/htmlhelp + @echo + @echo "Build finished; now you can run HTML Help Workshop with the" \ + ".hhp project file in $(BUILDDIR)/htmlhelp." + +qthelp: + $(SPHINXBUILD) -b qthelp $(ALLSPHINXOPTS) $(BUILDDIR)/qthelp + @echo + @echo "Build finished; now you can run "qcollectiongenerator" with the" \ + ".qhcp project file in $(BUILDDIR)/qthelp, like this:" + @echo "# qcollectiongenerator $(BUILDDIR)/qthelp/MXNetjl.qhcp" + @echo "To view the help file:" + @echo "# assistant -collectionFile $(BUILDDIR)/qthelp/MXNetjl.qhc" + +applehelp: + $(SPHINXBUILD) -b applehelp $(ALLSPHINXOPTS) $(BUILDDIR)/applehelp + @echo + @echo "Build finished. The help book is in $(BUILDDIR)/applehelp." + @echo "N.B. You won't be able to view it unless you put it in" \ + "~/Library/Documentation/Help or install it in your application" \ + "bundle." + +devhelp: + $(SPHINXBUILD) -b devhelp $(ALLSPHINXOPTS) $(BUILDDIR)/devhelp + @echo + @echo "Build finished." 
+ @echo "To view the help file:" + @echo "# mkdir -p $$HOME/.local/share/devhelp/MXNetjl" + @echo "# ln -s $(BUILDDIR)/devhelp $$HOME/.local/share/devhelp/MXNetjl" + @echo "# devhelp" + +epub: + $(SPHINXBUILD) -b epub $(ALLSPHINXOPTS) $(BUILDDIR)/epub + @echo + @echo "Build finished. The epub file is in $(BUILDDIR)/epub." + +latex: + $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex + @echo + @echo "Build finished; the LaTeX files are in $(BUILDDIR)/latex." + @echo "Run \`make' in that directory to run these through (pdf)latex" \ + "(use \`make latexpdf' here to do that automatically)." + +latexpdf: + $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex + @echo "Running LaTeX files through pdflatex..." + $(MAKE) -C $(BUILDDIR)/latex all-pdf + @echo "pdflatex finished; the PDF files are in $(BUILDDIR)/latex." + +latexpdfja: + $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex + @echo "Running LaTeX files through platex and dvipdfmx..." + $(MAKE) -C $(BUILDDIR)/latex all-pdf-ja + @echo "pdflatex finished; the PDF files are in $(BUILDDIR)/latex." + +text: + $(SPHINXBUILD) -b text $(ALLSPHINXOPTS) $(BUILDDIR)/text + @echo + @echo "Build finished. The text files are in $(BUILDDIR)/text." + +man: + $(SPHINXBUILD) -b man $(ALLSPHINXOPTS) $(BUILDDIR)/man + @echo + @echo "Build finished. The manual pages are in $(BUILDDIR)/man." + +texinfo: + $(SPHINXBUILD) -b texinfo $(ALLSPHINXOPTS) $(BUILDDIR)/texinfo + @echo + @echo "Build finished. The Texinfo files are in $(BUILDDIR)/texinfo." + @echo "Run \`make' in that directory to run these through makeinfo" \ + "(use \`make info' here to do that automatically)." + +info: + $(SPHINXBUILD) -b texinfo $(ALLSPHINXOPTS) $(BUILDDIR)/texinfo + @echo "Running Texinfo files through makeinfo..." + make -C $(BUILDDIR)/texinfo info + @echo "makeinfo finished; the Info files are in $(BUILDDIR)/texinfo." + +gettext: + $(SPHINXBUILD) -b gettext $(I18NSPHINXOPTS) $(BUILDDIR)/locale + @echo + @echo "Build finished. 
The message catalogs are in $(BUILDDIR)/locale." + +changes: + $(SPHINXBUILD) -b changes $(ALLSPHINXOPTS) $(BUILDDIR)/changes + @echo + @echo "The overview file is in $(BUILDDIR)/changes." + +linkcheck: + $(SPHINXBUILD) -b linkcheck $(ALLSPHINXOPTS) $(BUILDDIR)/linkcheck + @echo + @echo "Link check complete; look for any errors in the above output " \ + "or in $(BUILDDIR)/linkcheck/output.txt." + +doctest: + $(SPHINXBUILD) -b doctest $(ALLSPHINXOPTS) $(BUILDDIR)/doctest + @echo "Testing of doctests in the sources finished, look at the " \ + "results in $(BUILDDIR)/doctest/output.txt." + +coverage: + $(SPHINXBUILD) -b coverage $(ALLSPHINXOPTS) $(BUILDDIR)/coverage + @echo "Testing of coverage in the sources finished, look at the " \ + "results in $(BUILDDIR)/coverage/python.txt." + +xml: + $(SPHINXBUILD) -b xml $(ALLSPHINXOPTS) $(BUILDDIR)/xml + @echo + @echo "Build finished. The XML files are in $(BUILDDIR)/xml." + +pseudoxml: + $(SPHINXBUILD) -b pseudoxml $(ALLSPHINXOPTS) $(BUILDDIR)/pseudoxml + @echo + @echo "Build finished. The pseudo-XML files are in $(BUILDDIR)/pseudoxml." diff --git a/docs/api/MXNet.md b/docs/api/MXNet.md new file mode 100644 index 000000000000..fbaee9ae02fa --- /dev/null +++ b/docs/api/MXNet.md @@ -0,0 +1,416 @@ +# MXNet.mx + +## Internal + +--- + + +#### _compose!(sym::MXNet.mx.Symbol) +Compose symbol on inputs + +*source:* +[MXNet/src/symbol.jl:199](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L199) + +--- + + +#### _default_get_name!(counter::Dict{Symbol, Int64}, name::Union{AbstractString, Symbol}, hint::Union{AbstractString, Symbol}) +Default implementation for generating a name for a symbol. + +When a name is specified by the user, it will be used. Otherwise, a name +is automatically generated based on the hint string. 
+ + +*source:* +[MXNet/src/name.jl:12](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/name.jl#L12) + +--- + + +#### _import_ndarray_functions() +Import dynamic functions for NDArrays. The arguments to the functions are typically ordered +as + + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) + +unless NDARRAY_ARG_BEFORE_SCALAR is not set. In this case, the scalars are put before the input arguments: + + func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) + +If ACCEPT_EMPTY_MUTATE_TARGET is set. An overloaded function without the output arguments will also be defined: + + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) + +Upon calling, the output arguments will be automatically initialized with empty NDArrays. + +Those functions always return the output arguments. If there is only one output (the typical situation), that +object (NDArray) is returned. Otherwise, a tuple containing all the outputs will be returned. + + +*source:* +[MXNet/src/ndarray.jl:361](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L361) + +--- + + +#### _split_inputs(batch_size::Int64, n_split::Int64) +Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector + of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that + piece. 
+ + +*source:* +[MXNet/src/estimator.jl:18](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/estimator.jl#L18) + +--- + + +#### copy!(dst::Array{Float32, N}, src::MXNet.mx.NDArray) +Copy data from NDArray to Julia Array + +*source:* +[MXNet/src/ndarray.jl:178](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L178) + +--- + + +#### copy!(dst::MXNet.mx.NDArray, src::MXNet.mx.NDArray) +Copy data between NDArrays + +*source:* +[MXNet/src/ndarray.jl:166](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L166) + +--- + + +#### copy!{T<:Real}(dst::MXNet.mx.NDArray, src::Array{T<:Real, N}) +Copy data from Julia Array to NDArray + +*source:* +[MXNet/src/ndarray.jl:186](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L186) + +--- + + +#### copy(arr::MXNet.mx.NDArray) +Create copy: NDArray -> Julia Array + +*source:* +[MXNet/src/ndarray.jl:196](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L196) + +--- + + +#### copy(arr::MXNet.mx.NDArray, ctx::MXNet.mx.Context) +Create copy: NDArray -> NDArray in a given context + +*source:* +[MXNet/src/ndarray.jl:202](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L202) + +--- + + +#### copy{T<:Real}(arr::Array{T<:Real, N}, ctx::MXNet.mx.Context) +Create copy: Julia Array -> NDArray in a given context + +*source:* +[MXNet/src/ndarray.jl:208](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L208) + +--- + + +#### get_internals(self::MXNet.mx.Symbol) +Get a new grouped symbol whose output contains all the internal outputs of this symbol. + +*source:* +[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L63) + +--- + + +#### group(symbols::MXNet.mx.Symbol...) 
+Create a symbol that groups symbols together + +*source:* +[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L77) + +--- + + +#### list_auxiliary_states(self::MXNet.mx.Symbol) +List all auxiliary states in the symbol. + +Auxiliary states are special states of symbols that do not correspond to an argument, +and do not have gradients, but are still useful for specific operations. +A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. +Most operators do not have Auxiliary states. + + +*source:* +[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L58) + +--- + + +#### ones{N}(shape::NTuple{N, Int64}) +Create NDArray and initialize with 1 + +*source:* +[MXNet/src/ndarray.jl:112](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L112) + +--- + + +#### ones{N}(shape::NTuple{N, Int64}, ctx::MXNet.mx.Context) +Create NDArray and initialize with 1 + +*source:* +[MXNet/src/ndarray.jl:112](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L112) + +--- + + +#### setindex!(arr::MXNet.mx.NDArray, val::Real, ::Colon) +Assign all elements of an NDArray to a scalar + +*source:* +[MXNet/src/ndarray.jl:146](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L146) + +--- + + +#### size(arr::MXNet.mx.NDArray) +Get the shape of an `NDArray`. Note the shape is converted to Julia convention. + So the same piece of memory, in Julia (column-major), with shape (K, M, N), will be of the + shape (N, M, K) in the Python (row-major) binding. + + +*source:* +[MXNet/src/ndarray.jl:81](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L81) + +--- + + +#### slice(arr::MXNet.mx.NDArray, ::Colon) +`slice` creates a view into a sub-slice of an `NDArray`.
Note only slicing at the slowest + changing dimension is supported. In Julia's column-major perspective, this is the last + dimension. For example, given an `NDArray` of shape (2,3,4), `sub(array, 2:3)` will create + a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is + used in data parallelization to split mini-batch into sub-batches for different devices. + + +*source:* +[MXNet/src/ndarray.jl:128](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L128) + +--- + + +#### variable(name::Union{AbstractString, Symbol}) +Create a symbolic variable with the given name + +*source:* +[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L70) + +--- + + +#### zeros{N}(shape::NTuple{N, Int64}) +Create zero-ed NDArray of specific shape + +*source:* +[MXNet/src/ndarray.jl:102](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L102) + +--- + + +#### zeros{N}(shape::NTuple{N, Int64}, ctx::MXNet.mx.Context) +Create zero-ed NDArray of specific shape + +*source:* +[MXNet/src/ndarray.jl:102](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L102) + +--- + + +#### MXNet.mx.AbstractDataBatch +Root type for data batch + + A data batch must implement the following interface function to actually provide the data and label. + + load_data!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) + load_label!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) + + Load data and label into targets. The targets is a list of target that the data/label should be + copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and + `provide_label`. Each entry in the list is again a list of `SlicedNDArray`, corresponding the + memory buffer for each device. 
+ + The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. + + The following function should also be implemented to handle the case when the mini-batch size does not + divide the size of the whole dataset. So in the last mini-batch, the actual data copied might be fewer + than the mini-batch size. This is usually not an issue during the training as the remaining space may + contain the data and label copied during the previous mini-batch are still valid data. However, during + testing, especially when doing feature extraction, we need to be precise about the number of samples + processed. + + get_pad(batch :: AbstractDataBatch) + + Return the number of *dummy samples* in this mini-batch. + + +*source:* +[MXNet/src/io.jl:90](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L90) + +--- + + +#### MXNet.mx.AbstractDataProvider +Root type for data provider + + A data provider provides interface to iterate over a dataset. It should implement the following functions: + + provide_data(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} + provide_label(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} + + Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, + `[(:data, (100,1,28,28))]` or `[(:softmax_label, (100,1))]`. It should also implement the following convenient + function + + get_batch_size(provider :: AbstractDataProvider) => Int + + which returns the batch size used in this data provider. + + A data provider should implement the standard Julia iteration interface, including `Base.start`, + `Base.next`, `Base.done` and `Base.eltype`. It could safely assume that the interface functions will + always be called like + + for batch in provider + # ... 
+ load_data!(batch, targets) + end + + which translates into + + state = Base.start(provider) + while !done(provider, state) + (batch, state) = next(provider, state) + # ... + load_data!(batch, targets) + end + + In other words, it could safely assume that `Base.next` is always called after `Base.done`. And neither + of those functions will be called twice consecutively. The detailed interfaces are listed below: + + Base.start(provider :: AbstractDataProvider) => AbstractDataProviderState + + Initialize or reset the data iteration. + + Base.next(provider :: AbstractDataProvider, state :: AbstractDataProviderState) + => (AbstractDataBatch, AbstractDataProviderState) + + Return one batch of data. Actual data can be retrieved from the batch by interface functions described + in the document of type `AbstractDataBatch`. + + Base.done(provider :: AbstractDataProvider, state :: AbstractDataProviderState) => Bool + + Return `false` if there are more batches to get. + + Base.eltype(::Type{MyDataProvider}) => MyDataProviderState + + Return the type of the data provider state. + + +*source:* +[MXNet/src/io.jl:55](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L55) + +--- + + +#### MXNet.mx.AbstractDataProviderState +Root type for states of data provider + +*source:* +[MXNet/src/io.jl:58](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L58) + +--- + + +#### MXNet.mx.MXDataProvider +Wrapper of built-in `libmxnet` data iterators. + + +*source:* +[MXNet/src/io.jl:99](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L99) + +--- + + +#### MXNet.mx.MXError +Exception thrown when an error occurred calling MXNet API. + +*source:* +[MXNet/src/init.jl:2](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/init.jl#L2) + +--- + + +#### MXNet.mx.NDArray +Wrapper of the `NDArray` type in `libmxnet`.
This is the basic building block + of tensor-based computation. + + **Note** C/C++ use row-major ordering for arrays while Julia follows a + column-major ordering. To keep things consistent, we keep the underlying data + in their original layout, but use *language-native* convention when we talk + about shapes. For example, a mini-batch of 100 MNIST images is a tensor of + C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory + has shape (28,28,1,100). + + +*source:* +[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L32) + +--- + + +#### SlicedNDArray +A tuple of (slice, NDArray). Usually each NDArray resides on a different device, and each + slice describes which part of a larger piece of data should go to that device. + + +*source:* +[MXNet/src/io.jl:63](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L63) + +--- + + +#### @inplace(stmt) +Julia does not support re-definition of += operator (like __iadd__ in python), +When one writes a += b, it gets translated to a = a+b. a+b will allocate new +memory for the results, and the newly allocated NDArray object is then assigned +back to a, while the original contents in a are discarded. This is very inefficient +when we want to do inplace update. + +This macro is a simple utility to implement this behavior. Write + + @mx.inplace a += b + +will translate into + + mx.add_to!(a, b) + +which will do inplace adding of the contents of b into a. + + +*source:* +[MXNet/src/ndarray.jl:234](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L234) + +--- + + +#### @mxcall(fv, argtypes, args...)
+Utility macro to call MXNet API functions + +*source:* +[MXNet/src/init.jl:41](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/init.jl#L41) + diff --git a/docs/api/index.md b/docs/api/index.md new file mode 100644 index 000000000000..aa274bb16cd5 --- /dev/null +++ b/docs/api/index.md @@ -0,0 +1,81 @@ +# API-INDEX + + +## MODULE: MXNet.mx + +--- + +## Methods [Internal] + +[_compose!(sym::MXNet.mx.Symbol)](MXNet.md#method___compose.1) Compose symbol on inputs + +[_default_get_name!(counter::Dict{Symbol, Int64}, name::Union{AbstractString, Symbol}, hint::Union{AbstractString, Symbol})](MXNet.md#method___default_get_name.1) Default implementation for generating a name for a symbol. + +[_import_ndarray_functions()](MXNet.md#method___import_ndarray_functions.1) Import dynamic functions for NDArrays. The arguments to the functions are typically ordered + +[_split_inputs(batch_size::Int64, n_split::Int64)](MXNet.md#method___split_inputs.1) Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector + +[copy!(dst::Array{Float32, N}, src::MXNet.mx.NDArray)](MXNet.md#method__copy.1) Copy data from NDArray to Julia Array + +[copy!(dst::MXNet.mx.NDArray, src::MXNet.mx.NDArray)](MXNet.md#method__copy.2) Copy data between NDArrays + +[copy!{T<:Real}(dst::MXNet.mx.NDArray, src::Array{T<:Real, N})](MXNet.md#method__copy.3) Copy data from Julia Array to NDArray + +[copy(arr::MXNet.mx.NDArray)](MXNet.md#method__copy.4) Create copy: NDArray -> Julia Array + +[copy(arr::MXNet.mx.NDArray, ctx::MXNet.mx.Context)](MXNet.md#method__copy.5) Create copy: NDArray -> NDArray in a given context + +[copy{T<:Real}(arr::Array{T<:Real, N}, ctx::MXNet.mx.Context)](MXNet.md#method__copy.6) Create copy: Julia Array -> NDArray in a given context + +[get_internals(self::MXNet.mx.Symbol)](MXNet.md#method__get_internals.1) Get a new grouped symbol whose output contains all the internal outputs of this symbol. 
+ +[group(symbols::MXNet.mx.Symbol...)](MXNet.md#method__group.1) Create a symbol that groups symbols together + +[list_auxiliary_states(self::MXNet.mx.Symbol)](MXNet.md#method__list_auxiliary_states.1) List all auxiliary states in the symbol. + +[ones{N}(shape::NTuple{N, Int64})](MXNet.md#method__ones.1) Create NDArray and initialize with 1 + +[ones{N}(shape::NTuple{N, Int64}, ctx::MXNet.mx.Context)](MXNet.md#method__ones.2) Create NDArray and initialize with 1 + +[setindex!(arr::MXNet.mx.NDArray, val::Real, ::Colon)](MXNet.md#method__setindex.1) Assign all elements of an NDArray to a scalar + +[size(arr::MXNet.mx.NDArray)](MXNet.md#method__size.1) Get the shape of an `NDArray`. Note the shape is converted to Julia convention. + +[slice(arr::MXNet.mx.NDArray, ::Colon)](MXNet.md#method__slice.1) `slice` creates a view into a sub-slice of an `NDArray`. Note only slicing at the slowest + +[variable(name::Union{AbstractString, Symbol})](MXNet.md#method__variable.1) Create a symbolic variable with the given name + +[zeros{N}(shape::NTuple{N, Int64})](MXNet.md#method__zeros.1) Create zero-ed NDArray of specific shape + +[zeros{N}(shape::NTuple{N, Int64}, ctx::MXNet.mx.Context)](MXNet.md#method__zeros.2) Create zero-ed NDArray of specific shape + +--- + +## Types [Internal] + +[MXNet.mx.AbstractDataBatch](MXNet.md#type__abstractdatabatch.1) Root type for data batch + +[MXNet.mx.AbstractDataProvider](MXNet.md#type__abstractdataprovider.1) Root type for data provider + +[MXNet.mx.AbstractDataProviderState](MXNet.md#type__abstractdataproviderstate.1) Root type for states of data provider + +[MXNet.mx.MXDataProvider](MXNet.md#type__mxdataprovider.1) Wrapper of built-in `libmxnet` data iterators. + +[MXNet.mx.MXError](MXNet.md#type__mxerror.1) Exception thrown when an error occurred calling MXNet API. + +[MXNet.mx.NDArray](MXNet.md#type__ndarray.1) Wrapper of the `NDArray` type in `libmxnet`.
This is the basic building block + +--- + +## Typealiases [Internal] + +[SlicedNDArray](MXNet.md#typealias__slicedndarray.1) A tuple of (slice, NDArray). Usually each NDArray resides on a different device, and each + +--- + +## Macros [Internal] + +[@inplace(stmt)](MXNet.md#macro___inplace.1) Julia does not support re-definition of += operator (like __iadd__ in python), + +[@mxcall(fv, argtypes, args...)](MXNet.md#macro___mxcall.1) Utility macro to call MXNet API functions + diff --git a/docs/conf.py b/docs/conf.py new file mode 100644 index 000000000000..3aab37726449 --- /dev/null +++ b/docs/conf.py @@ -0,0 +1,292 @@ +# -*- coding: utf-8 -*- +# +# MXNet.jl documentation build configuration file, created by +# sphinx-quickstart on Tue Oct 20 00:09:24 2015. +# +# This file is execfile()d with the current directory set to its +# containing dir. +# +# Note that not all possible configuration values are present in this +# autogenerated file. +# +# All configuration values have a default; values that are commented out +# serve to show the default. + +import sys +import os +import shlex + +# If extensions (or modules to document with autodoc) are in another directory, +# add these directories to sys.path here. If the directory is relative to the +# documentation root, use os.path.abspath to make it absolute, like shown here. +#sys.path.insert(0, os.path.abspath('.')) + +# -- General configuration ------------------------------------------------ + +# If your documentation needs a minimal Sphinx version, state it here. +#needs_sphinx = '1.0' + +# Add any Sphinx extension module names here, as strings. They can be +# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom +# ones. +extensions = [ + 'sphinx.ext.mathjax', +] + +# Add any paths that contain templates here, relative to this directory. +templates_path = ['_templates'] + +# The suffix(es) of source filenames.
+# You can specify multiple suffix as a list of string: +# source_suffix = ['.rst', '.md'] +source_suffix = ['.rst', '.md'] + +from recommonmark.parser import CommonMarkParser + +source_parsers = { + '.md': CommonMarkParser, +} + +# The encoding of source files. +#source_encoding = 'utf-8-sig' + +# The master toctree document. +master_doc = 'index' + +# General information about the project. +project = u'MXNet.jl' +copyright = u'2015, pluskid' +author = u'pluskid' + +# The version info for the project you're documenting, acts as replacement for +# |version| and |release|, also used in various other places throughout the +# built documents. +# +# The short X.Y version. +version = '0.0.1' +# The full version, including alpha/beta/rc tags. +release = '0.0.1' + +# The language for content autogenerated by Sphinx. Refer to documentation +# for a list of supported languages. +# +# This is also used if you do content translation via gettext catalogs. +# Usually you set "language" from the command line for these cases. +language = None + +# There are two options for replacing |today|: either, you set today to some +# non-false value, then it is used: +#today = '' +# Else, today_fmt is used as the format for a strftime call. +#today_fmt = '%B %d, %Y' + +# List of patterns, relative to source directory, that match files and +# directories to ignore when looking for source files. +exclude_patterns = ['_build'] + +# The reST default role (used for this markup: `text`) to use for all +# documents. +#default_role = None + +# If true, '()' will be appended to :func: etc. cross-reference text. +#add_function_parentheses = True + +# If true, the current module name will be prepended to all description +# unit titles (such as .. function::). +#add_module_names = True + +# If true, sectionauthor and moduleauthor directives will be shown in the +# output. They are ignored by default. +#show_authors = False + +# The name of the Pygments (syntax highlighting) style to use. 
+pygments_style = 'sphinx' + +# A list of ignored prefixes for module index sorting. +#modindex_common_prefix = [] + +# If true, keep warnings as "system message" paragraphs in the built documents. +#keep_warnings = False + +# If true, `todo` and `todoList` produce output, else they produce nothing. +todo_include_todos = False + + +# -- Options for HTML output ---------------------------------------------- + +# The theme to use for HTML and HTML Help pages. See the documentation for +# a list of builtin themes. +html_theme = 'alabaster' + +# Theme options are theme-specific and customize the look and feel of a theme +# further. For a list of options available for each theme, see the +# documentation. +#html_theme_options = {} + +# Add any paths that contain custom themes here, relative to this directory. +#html_theme_path = [] + +# The name for this set of Sphinx documents. If None, it defaults to +# " v documentation". +#html_title = None + +# A shorter title for the navigation bar. Default is the same as html_title. +#html_short_title = None + +# The name of an image file (relative to this directory) to place at the top +# of the sidebar. +#html_logo = None + +# The name of an image file (within the static path) to use as favicon of the +# docs. This file should be a Windows icon file (.ico) being 16x16 or 32x32 +# pixels large. +#html_favicon = None + +# Add any paths that contain custom static files (such as style sheets) here, +# relative to this directory. They are copied after the builtin static files, +# so a file named "default.css" will overwrite the builtin "default.css". +html_static_path = ['_static'] + +# Add any extra paths that contain custom files (such as robots.txt or +# .htaccess) here, relative to this directory. These files are copied +# directly to the root of the documentation. +#html_extra_path = [] + +# If not '', a 'Last updated on:' timestamp is inserted at every page bottom, +# using the given strftime format. 
+#html_last_updated_fmt = '%b %d, %Y' + +# If true, SmartyPants will be used to convert quotes and dashes to +# typographically correct entities. +#html_use_smartypants = True + +# Custom sidebar templates, maps document names to template names. +#html_sidebars = {} + +# Additional templates that should be rendered to pages, maps page names to +# template names. +#html_additional_pages = {} + +# If false, no module index is generated. +#html_domain_indices = True + +# If false, no index is generated. +#html_use_index = True + +# If true, the index is split into individual pages for each letter. +#html_split_index = False + +# If true, links to the reST sources are added to the pages. +#html_show_sourcelink = True + +# If true, "Created using Sphinx" is shown in the HTML footer. Default is True. +#html_show_sphinx = True + +# If true, "(C) Copyright ..." is shown in the HTML footer. Default is True. +#html_show_copyright = True + +# If true, an OpenSearch description file will be output, and all pages will +# contain a tag referring to it. The value of this option must be the +# base URL from which the finished HTML is served. +#html_use_opensearch = '' + +# This is the file name suffix for HTML files (e.g. ".xhtml"). +#html_file_suffix = None + +# Language to be used for generating the HTML full-text search index. +# Sphinx supports the following languages: +# 'da', 'de', 'en', 'es', 'fi', 'fr', 'hu', 'it', 'ja' +# 'nl', 'no', 'pt', 'ro', 'ru', 'sv', 'tr' +#html_search_language = 'en' + +# A dictionary with options for the search language support, empty by default. +# Now only 'ja' uses this config value +#html_search_options = {'type': 'default'} + +# The name of a javascript file (relative to the configuration directory) that +# implements a search results scorer. If empty, the default will be used. +#html_search_scorer = 'scorer.js' + +# Output file base name for HTML help builder. 
+htmlhelp_basename = 'MXNetjldoc' + +# -- Options for LaTeX output --------------------------------------------- + +latex_elements = { +# The paper size ('letterpaper' or 'a4paper'). +#'papersize': 'letterpaper', + +# The font size ('10pt', '11pt' or '12pt'). +#'pointsize': '10pt', + +# Additional stuff for the LaTeX preamble. +#'preamble': '', + +# Latex figure (float) alignment +#'figure_align': 'htbp', +} + +# Grouping the document tree into LaTeX files. List of tuples +# (source start file, target name, title, +# author, documentclass [howto, manual, or own class]). +latex_documents = [ + (master_doc, 'MXNetjl.tex', u'MXNet.jl Documentation', + u'pluskid', 'manual'), +] + +# The name of an image file (relative to this directory) to place at the top of +# the title page. +#latex_logo = None + +# For "manual" documents, if this is true, then toplevel headings are parts, +# not chapters. +#latex_use_parts = False + +# If true, show page references after internal links. +#latex_show_pagerefs = False + +# If true, show URL addresses after external links. +#latex_show_urls = False + +# Documents to append as an appendix to all manuals. +#latex_appendices = [] + +# If false, no module index is generated. +#latex_domain_indices = True + + +# -- Options for manual page output --------------------------------------- + +# One entry per manual page. List of tuples +# (source start file, name, description, authors, manual section). +man_pages = [ + (master_doc, 'mxnetjl', u'MXNet.jl Documentation', + [author], 1) +] + +# If true, show URL addresses after external links. +#man_show_urls = False + + +# -- Options for Texinfo output ------------------------------------------- + +# Grouping the document tree into Texinfo files. 
List of tuples +# (source start file, target name, title, author, +# dir menu entry, description, category) +texinfo_documents = [ + (master_doc, 'MXNetjl', u'MXNet.jl Documentation', + author, 'MXNetjl', 'One line description of project.', + 'Miscellaneous'), +] + +# Documents to append as an appendix to all manuals. +#texinfo_appendices = [] + +# If false, no module index is generated. +#texinfo_domain_indices = True + +# How to display URL addresses: 'footnote', 'no', or 'inline'. +#texinfo_show_urls = 'footnote' + +# If true, do not generate a @detailmenu in the "Top" node's menu. +#texinfo_no_detailmenu = False diff --git a/docs/index.rst b/docs/index.rst new file mode 100644 index 000000000000..81b86df5034d --- /dev/null +++ b/docs/index.rst @@ -0,0 +1,23 @@ +.. MXNet.jl documentation master file, created by + sphinx-quickstart on Tue Oct 20 00:09:24 2015. + You can adapt this file completely to your liking, but it should at least + contain the root `toctree` directive. + +Welcome to MXNet.jl's documentation! +==================================== + +Contents: + +.. toctree:: + :maxdepth: 2 + + api/MXNet + + +Indices and tables +================== + +* :ref:`genindex` +* :ref:`modindex` +* :ref:`search` + diff --git a/docs/make.bat b/docs/make.bat new file mode 100644 index 000000000000..e682697a9877 --- /dev/null +++ b/docs/make.bat @@ -0,0 +1,263 @@ +@ECHO OFF + +REM Command file for Sphinx documentation + +if "%SPHINXBUILD%" == "" ( + set SPHINXBUILD=sphinx-build +) +set BUILDDIR=_build +set ALLSPHINXOPTS=-d %BUILDDIR%/doctrees %SPHINXOPTS% . +set I18NSPHINXOPTS=%SPHINXOPTS% . +if NOT "%PAPER%" == "" ( + set ALLSPHINXOPTS=-D latex_paper_size=%PAPER% %ALLSPHINXOPTS% + set I18NSPHINXOPTS=-D latex_paper_size=%PAPER% %I18NSPHINXOPTS% +) + +if "%1" == "" goto help + +if "%1" == "help" ( + :help + echo.Please use `make ^` where ^ is one of + echo. html to make standalone HTML files + echo. dirhtml to make HTML files named index.html in directories + echo. 
singlehtml to make a single large HTML file + echo. pickle to make pickle files + echo. json to make JSON files + echo. htmlhelp to make HTML files and a HTML help project + echo. qthelp to make HTML files and a qthelp project + echo. devhelp to make HTML files and a Devhelp project + echo. epub to make an epub + echo. latex to make LaTeX files, you can set PAPER=a4 or PAPER=letter + echo. text to make text files + echo. man to make manual pages + echo. texinfo to make Texinfo files + echo. gettext to make PO message catalogs + echo. changes to make an overview over all changed/added/deprecated items + echo. xml to make Docutils-native XML files + echo. pseudoxml to make pseudoxml-XML files for display purposes + echo. linkcheck to check all external links for integrity + echo. doctest to run all doctests embedded in the documentation if enabled + echo. coverage to run coverage check of the documentation if enabled + goto end +) + +if "%1" == "clean" ( + for /d %%i in (%BUILDDIR%\*) do rmdir /q /s %%i + del /q /s %BUILDDIR%\* + goto end +) + + +REM Check if sphinx-build is available and fallback to Python version if any +%SPHINXBUILD% 2> nul +if errorlevel 9009 goto sphinx_python +goto sphinx_ok + +:sphinx_python + +set SPHINXBUILD=python -m sphinx.__init__ +%SPHINXBUILD% 2> nul +if errorlevel 9009 ( + echo. + echo.The 'sphinx-build' command was not found. Make sure you have Sphinx + echo.installed, then set the SPHINXBUILD environment variable to point + echo.to the full path of the 'sphinx-build' executable. Alternatively you + echo.may add the Sphinx directory to PATH. + echo. + echo.If you don't have Sphinx installed, grab it from + echo.http://sphinx-doc.org/ + exit /b 1 +) + +:sphinx_ok + + +if "%1" == "html" ( + %SPHINXBUILD% -b html %ALLSPHINXOPTS% %BUILDDIR%/html + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The HTML pages are in %BUILDDIR%/html. 
+ goto end +) + +if "%1" == "dirhtml" ( + %SPHINXBUILD% -b dirhtml %ALLSPHINXOPTS% %BUILDDIR%/dirhtml + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The HTML pages are in %BUILDDIR%/dirhtml. + goto end +) + +if "%1" == "singlehtml" ( + %SPHINXBUILD% -b singlehtml %ALLSPHINXOPTS% %BUILDDIR%/singlehtml + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The HTML pages are in %BUILDDIR%/singlehtml. + goto end +) + +if "%1" == "pickle" ( + %SPHINXBUILD% -b pickle %ALLSPHINXOPTS% %BUILDDIR%/pickle + if errorlevel 1 exit /b 1 + echo. + echo.Build finished; now you can process the pickle files. + goto end +) + +if "%1" == "json" ( + %SPHINXBUILD% -b json %ALLSPHINXOPTS% %BUILDDIR%/json + if errorlevel 1 exit /b 1 + echo. + echo.Build finished; now you can process the JSON files. + goto end +) + +if "%1" == "htmlhelp" ( + %SPHINXBUILD% -b htmlhelp %ALLSPHINXOPTS% %BUILDDIR%/htmlhelp + if errorlevel 1 exit /b 1 + echo. + echo.Build finished; now you can run HTML Help Workshop with the ^ +.hhp project file in %BUILDDIR%/htmlhelp. + goto end +) + +if "%1" == "qthelp" ( + %SPHINXBUILD% -b qthelp %ALLSPHINXOPTS% %BUILDDIR%/qthelp + if errorlevel 1 exit /b 1 + echo. + echo.Build finished; now you can run "qcollectiongenerator" with the ^ +.qhcp project file in %BUILDDIR%/qthelp, like this: + echo.^> qcollectiongenerator %BUILDDIR%\qthelp\MXNetjl.qhcp + echo.To view the help file: + echo.^> assistant -collectionFile %BUILDDIR%\qthelp\MXNetjl.qhc + goto end +) + +if "%1" == "devhelp" ( + %SPHINXBUILD% -b devhelp %ALLSPHINXOPTS% %BUILDDIR%/devhelp + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. + goto end +) + +if "%1" == "epub" ( + %SPHINXBUILD% -b epub %ALLSPHINXOPTS% %BUILDDIR%/epub + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The epub file is in %BUILDDIR%/epub. + goto end +) + +if "%1" == "latex" ( + %SPHINXBUILD% -b latex %ALLSPHINXOPTS% %BUILDDIR%/latex + if errorlevel 1 exit /b 1 + echo. 
+ echo.Build finished; the LaTeX files are in %BUILDDIR%/latex. + goto end +) + +if "%1" == "latexpdf" ( + %SPHINXBUILD% -b latex %ALLSPHINXOPTS% %BUILDDIR%/latex + cd %BUILDDIR%/latex + make all-pdf + cd %~dp0 + echo. + echo.Build finished; the PDF files are in %BUILDDIR%/latex. + goto end +) + +if "%1" == "latexpdfja" ( + %SPHINXBUILD% -b latex %ALLSPHINXOPTS% %BUILDDIR%/latex + cd %BUILDDIR%/latex + make all-pdf-ja + cd %~dp0 + echo. + echo.Build finished; the PDF files are in %BUILDDIR%/latex. + goto end +) + +if "%1" == "text" ( + %SPHINXBUILD% -b text %ALLSPHINXOPTS% %BUILDDIR%/text + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The text files are in %BUILDDIR%/text. + goto end +) + +if "%1" == "man" ( + %SPHINXBUILD% -b man %ALLSPHINXOPTS% %BUILDDIR%/man + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The manual pages are in %BUILDDIR%/man. + goto end +) + +if "%1" == "texinfo" ( + %SPHINXBUILD% -b texinfo %ALLSPHINXOPTS% %BUILDDIR%/texinfo + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The Texinfo files are in %BUILDDIR%/texinfo. + goto end +) + +if "%1" == "gettext" ( + %SPHINXBUILD% -b gettext %I18NSPHINXOPTS% %BUILDDIR%/locale + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The message catalogs are in %BUILDDIR%/locale. + goto end +) + +if "%1" == "changes" ( + %SPHINXBUILD% -b changes %ALLSPHINXOPTS% %BUILDDIR%/changes + if errorlevel 1 exit /b 1 + echo. + echo.The overview file is in %BUILDDIR%/changes. + goto end +) + +if "%1" == "linkcheck" ( + %SPHINXBUILD% -b linkcheck %ALLSPHINXOPTS% %BUILDDIR%/linkcheck + if errorlevel 1 exit /b 1 + echo. + echo.Link check complete; look for any errors in the above output ^ +or in %BUILDDIR%/linkcheck/output.txt. + goto end +) + +if "%1" == "doctest" ( + %SPHINXBUILD% -b doctest %ALLSPHINXOPTS% %BUILDDIR%/doctest + if errorlevel 1 exit /b 1 + echo. + echo.Testing of doctests in the sources finished, look at the ^ +results in %BUILDDIR%/doctest/output.txt. 
+ goto end +) + +if "%1" == "coverage" ( + %SPHINXBUILD% -b coverage %ALLSPHINXOPTS% %BUILDDIR%/coverage + if errorlevel 1 exit /b 1 + echo. + echo.Testing of coverage in the sources finished, look at the ^ +results in %BUILDDIR%/coverage/python.txt. + goto end +) + +if "%1" == "xml" ( + %SPHINXBUILD% -b xml %ALLSPHINXOPTS% %BUILDDIR%/xml + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The XML files are in %BUILDDIR%/xml. + goto end +) + +if "%1" == "pseudoxml" ( + %SPHINXBUILD% -b pseudoxml %ALLSPHINXOPTS% %BUILDDIR%/pseudoxml + if errorlevel 1 exit /b 1 + echo. + echo.Build finished. The pseudo-XML files are in %BUILDDIR%/pseudoxml. + goto end +) + +:end From 4a25b00b85a1d0083c37ab9024f433f73d2f417c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 Oct 2015 00:31:14 -0400 Subject: [PATCH 072/630] add rtd badge --- README.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 85cd8cc114e8..4852bcd52161 100644 --- a/README.md +++ b/README.md @@ -1,8 +1,8 @@ # MXNet [![Build Status](https://travis-ci.org/dmlc/MXNet.jl.svg?branch=master)](https://travis-ci.org/dmlc/MXNet.jl) -[![Coverage Status](https://img.shields.io/coveralls/dmlc/MXNet.jl.svg?style=flat)](https://coveralls.io/r/dmlc/MXNet.jl?branch=master) -[![License](https://img.shields.io/github/license/dmlc/MXNet.jl.svg?style=flat)](LICENSE.md) +[![Documentation Status](https://readthedocs.org/projects/mxnetjl/badge/?version=latest)](http://mxnetjl.readthedocs.org/en/latest/?badge=latest) +[![License](http://dmlc.github.io/img/apache2.svg)](LICENSE.md) Julia wrapper of [MXNet](https://github.com/dmlc/mxnet). 
From 34a1c89bf2b65351914e00ccd12a033df724a721 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 Oct 2015 00:34:47 -0400 Subject: [PATCH 073/630] use rtd theme --- docs/conf.py | 13 ++++++++++++- 1 file changed, 12 insertions(+), 1 deletion(-) diff --git a/docs/conf.py b/docs/conf.py index 3aab37726449..33f8b3ce6a42 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -116,7 +116,18 @@ # The theme to use for HTML and HTML Help pages. See the documentation for # a list of builtin themes. -html_theme = 'alabaster' +html_theme = 'default' + +import os +on_rtd = os.environ.get('READTHEDOCS', None) == 'True' + +if not on_rtd: # only import and set the theme if we're building docs locally + try: + import sphinx_rtd_theme + html_theme = "sphinx_rtd_theme" + html_theme_path = [sphinx_rtd_theme.get_html_theme_path()] + except: + pass # Theme options are theme-specific and customize the look and feel of a theme # further. For a list of options available for each theme, see the From 4eff47d15f3f63fcfbe5fb31b6fa7a4455b5ed1f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 Oct 2015 01:07:57 -0400 Subject: [PATCH 074/630] fix some doc markdown formatting --- docs/api/MXNet.md | 214 +++++++++++++++++++++++----------------------- docs/api/index.md | 81 ------------------ docs/build.jl | 3 +- docs/index.rst | 6 ++ src/io.jl | 120 +++++++++++++++----------- src/name.jl | 8 +- src/ndarray.jl | 16 ++-- src/symbol.jl | 1 - 8 files changed, 200 insertions(+), 249 deletions(-) delete mode 100644 docs/api/index.md diff --git a/docs/api/MXNet.md b/docs/api/MXNet.md index fbaee9ae02fa..d4b273ba417d 100644 --- a/docs/api/MXNet.md +++ b/docs/api/MXNet.md @@ -4,51 +4,35 @@ --- - -#### _compose!(sym::MXNet.mx.Symbol) -Compose symbol on inputs - -*source:* -[MXNet/src/symbol.jl:199](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L199) - ---- - - -#### _default_get_name!(counter::Dict{Symbol, Int64}, name::Union{AbstractString, Symbol}, 
hint::Union{AbstractString, Symbol}) -Default implementation for generating a name for a symbol. - -When a name is specified by the user, it will be used. Otherwise, a name -is automatically generated based on the hint string. - - -*source:* -[MXNet/src/name.jl:12](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/name.jl#L12) - ---- - #### _import_ndarray_functions() Import dynamic functions for NDArrays. The arguments to the functions are typically ordered as - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) +```julia +func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) +``` unless NDARRAY_ARG_BEFORE_SCALAR is not set. In this case, the scalars are put before the input arguments: - func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) +```julia +func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) +``` -If ACCEPT_EMPTY_MUTATE_TARGET is set. An overloaded function without the output arguments will also be defined: +If `ACCEPT_EMPTY_MUTATE_TARGET` is set. An overloaded function without the output arguments will also be defined: - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) +```julia +func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) +``` Upon calling, the output arguments will be automatically initialized with empty NDArrays. Those functions always return the output arguments. If there is only one output (the typical situation), that -object (NDArray) is returned. Otherwise, a tuple containing all the outputs will be returned. +object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. 
*source:* -[MXNet/src/ndarray.jl:361](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L361) +[MXNet/src/ndarray.jl:367](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L367) --- @@ -60,7 +44,7 @@ Get a split of `batch_size` into `n_split` pieces for data parallelization. Retu *source:* -[MXNet/src/estimator.jl:18](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/estimator.jl#L18) +[MXNet/src/estimator.jl:18](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/estimator.jl#L18) --- @@ -69,7 +53,7 @@ Get a split of `batch_size` into `n_split` pieces for data parallelization. Retu Copy data from NDArray to Julia Array *source:* -[MXNet/src/ndarray.jl:178](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L178) +[MXNet/src/ndarray.jl:178](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L178) --- @@ -78,7 +62,7 @@ Copy data from NDArray to Julia Array Copy data between NDArrays *source:* -[MXNet/src/ndarray.jl:166](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L166) +[MXNet/src/ndarray.jl:166](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L166) --- @@ -87,7 +71,7 @@ Copy data between NDArrays Copy data from Julia Array to NDArray *source:* -[MXNet/src/ndarray.jl:186](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L186) +[MXNet/src/ndarray.jl:186](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L186) --- @@ -96,7 +80,7 @@ Copy data from Julia Array to NDArray Create copy: NDArray -> Julia Array *source:* -[MXNet/src/ndarray.jl:196](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L196) 
+[MXNet/src/ndarray.jl:196](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L196) --- @@ -105,7 +89,7 @@ Create copy: NDArray -> Julia Array Create copy: NDArray -> NDArray in a given context *source:* -[MXNet/src/ndarray.jl:202](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L202) +[MXNet/src/ndarray.jl:202](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L202) --- @@ -114,7 +98,7 @@ Create copy: NDArray -> NDArray in a given context Create copy: Julia Array -> NDArray in a given context *source:* -[MXNet/src/ndarray.jl:208](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L208) +[MXNet/src/ndarray.jl:208](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L208) --- @@ -123,7 +107,7 @@ Create copy: Julia Array -> NDArray in a given context Get a new grouped symbol whose output contains all the internal outputs of this symbol. *source:* -[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L63) +[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/symbol.jl#L63) --- @@ -132,7 +116,7 @@ Get a new grouped symbol whose output contains all the internal outputs of this Create a symbol that groups symbols together *source:* -[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L77) +[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/symbol.jl#L77) --- @@ -147,7 +131,7 @@ Most operators do not have Auxiliary states. 
*source:* -[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L58) +[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/symbol.jl#L58) --- @@ -156,7 +140,7 @@ Most operators do not have Auxiliary states. Create NDArray and initialize with 1 *source:* -[MXNet/src/ndarray.jl:112](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L112) +[MXNet/src/ndarray.jl:112](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L112) --- @@ -165,7 +149,7 @@ Create NDArray and initialize with 1 Create NDArray and initialize with 1 *source:* -[MXNet/src/ndarray.jl:112](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L112) +[MXNet/src/ndarray.jl:112](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L112) --- @@ -174,7 +158,7 @@ Create NDArray and initialize with 1 Assign all elements of an NDArray to a scalar *source:* -[MXNet/src/ndarray.jl:146](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L146) +[MXNet/src/ndarray.jl:146](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L146) --- @@ -186,7 +170,7 @@ Get the shape of an `NDArray`. Note the shape is converted to Julia convention. *source:* -[MXNet/src/ndarray.jl:81](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L81) +[MXNet/src/ndarray.jl:81](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L81) --- @@ -200,7 +184,7 @@ Get the shape of an `NDArray`. Note the shape is converted to Julia convention. 
*source:* -[MXNet/src/ndarray.jl:128](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L128) +[MXNet/src/ndarray.jl:128](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L128) --- @@ -209,7 +193,7 @@ Get the shape of an `NDArray`. Note the shape is converted to Julia convention. Create a symbolic variable with the given name *source:* -[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/symbol.jl#L70) +[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/symbol.jl#L70) --- @@ -218,7 +202,7 @@ Create a symbolic variable with the given name Create zero-ed NDArray of specific shape *source:* -[MXNet/src/ndarray.jl:102](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L102) +[MXNet/src/ndarray.jl:102](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L102) --- @@ -227,7 +211,7 @@ Create zero-ed NDArray of specific shape Create zero-ed NDArray of specific shape *source:* -[MXNet/src/ndarray.jl:102](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L102) +[MXNet/src/ndarray.jl:102](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L102) --- @@ -235,32 +219,36 @@ Create zero-ed NDArray of specific shape #### MXNet.mx.AbstractDataBatch Root type for data batch - A data batch must implement the following interface function to actually provide the data and label. +A data batch must implement the following interface function to actually provide the data and label. 
- load_data!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - load_label!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) +```julia +load_data!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) +load_label!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) +``` - Load data and label into targets. The targets is a list of target that the data/label should be - copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and - `provide_label`. Each entry in the list is again a list of `SlicedNDArray`, corresponding the - memory buffer for each device. +Load data and label into targets. The targets is a list of target that the data/label should be +copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and +`provide_label`. Each entry in the list is again a list of `SlicedNDArray`, corresponding the +memory buffer for each device. - The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. +The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. - The following function should also be implemented to handle the case when the mini-batch size does not - divide the size of the whole dataset. So in the last mini-batch, the actual data copied might be fewer - than the mini-batch size. This is usually not an issue during the training as the remaining space may - contain the data and label copied during the previous mini-batch are still valid data. However, during - testing, especially when doing feature extraction, we need to be precise about the number of samples - processed. +The following function should also be implemented to handle the case when the mini-batch size does not +divide the size of the whole dataset. So in the last mini-batch, the actual data copied might be fewer +than the mini-batch size. 
This is usually not an issue during the training as the remaining space may +contain the data and label copied during the previous mini-batch are still valid data. However, during +testing, especially when doing feature extraction, we need to be precise about the number of samples +processed. - get_pad(batch :: AbstractDataBatch) +```julia +get_pad(batch :: AbstractDataBatch) +``` - Return the number of *dummy samples* in this mini-batch. +Return the number of *dummy samples* in this mini-batch. *source:* -[MXNet/src/io.jl:90](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L90) +[MXNet/src/io.jl:110](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L110) --- @@ -268,61 +256,77 @@ Root type for data batch #### MXNet.mx.AbstractDataProvider Root type for data provider - A data provider provides interface to iterate over a dataset. It should implement the following functions: +A data provider provides interface to iterate over a dataset. It should implement the following functions: - provide_data(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} - provide_label(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} +```julia +provide_data(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} +provide_label(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} +``` - Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, - `[(:data, (100,1,28,28))]` or `[(:softmax_label, (100,1))]`. It should also implement the following convenient - function +Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, +`[(:data, (100,1,28,28))]` or `[(:softmax_label, (100,1))]`. 
It should also implement the following convenient +function - get_batch_size(provider :: AbstractDataProvider) => Int +```julia +get_batch_size(provider :: AbstractDataProvider) => Int +``` - which returns the batch size used in this data provider. +which returns the batch size used in this data provider. - A data provider should implement the standard Julia iteration interface, including `Base.start`, - `Base.next`, `Base.done` and `Base.eltype`. It could safely assume that the interface functions will - always be called like +A data provider should implement the standard Julia iteration interface, including `Base.start`, +`Base.next`, `Base.done` and `Base.eltype`. It could safely assume that the interface functions will +always be called like - for batch in provider - # ... - load_data!(batch, targets) - end +```julia +for batch in provider + # ... + load_data!(batch, targets) +end +``` - which translates into +which translates into - state = Base.start(provider) - while !done(provider, state) - (batch, state) = next(provider, state) - # ... - load_data!(batch, targets) - end +```julia +state = Base.start(provider) +while !done(provider, state) + (batch, state) = next(provider, state) + # ... + load_data!(batch, targets) +end +``` - In other words, it could safely assume that `Base.next` is always called after `Base.done`. And neither - of those function will be called twice consequtively. The detailed interfaces are list below: +In other words, it could safely assume that `Base.next` is always called after `Base.done`. And neither +of those function will be called twice consequtively. The detailed interfaces are list below: - Base.start(provider :: AbstractDataProvider) => AbstractDataProviderState +```julia +Base.start(provider :: AbstractDataProvider) => AbstractDataProviderState +``` - Initialize or reset the data iteration. +Initialize or reset the data iteration. 
- Base.next(provider :: AbstractDataProvider, state :: AbstractDataProviderState) - => (AbstractDataBatch, AbstractDataProviderState) +```julia +Base.next(provider :: AbstractDataProvider, state :: AbstractDataProviderState) + => (AbstractDataBatch, AbstractDataProviderState) +``` - Return one batch of data. Actual data can be retrieved from the batch by interface functions described - in the document of type `AbstractDataBatch`. +Return one batch of data. Actual data can be retrieved from the batch by interface functions described +in the document of type `AbstractDataBatch`. - Base.done(provider :: AbstractDataProvider, state :: AbstractDataProviderState) => Bool +```julia +Base.done(provider :: AbstractDataProvider, state :: AbstractDataProviderState) => Bool +``` - Return `false` if there is more batch to get. +Return `false` if there is more batch to get. - Base.eltype(::Type{MyDataProvider}) => MyDataProviderState +```julia +Base.eltype(::Type{MyDataProvider}) => MyDataProviderState +``` - Return the type of the data provider state. +Return the type of the data provider state. *source:* -[MXNet/src/io.jl:55](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L55) +[MXNet/src/io.jl:71](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L71) --- @@ -331,7 +335,7 @@ Root type for data provider Root type for states of data provider *source:* -[MXNet/src/io.jl:58](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L58) +[MXNet/src/io.jl:74](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L74) --- @@ -341,7 +345,7 @@ Wrapper of built-in `libmxnet` data iterators. 
*source:* -[MXNet/src/io.jl:99](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L99) +[MXNet/src/io.jl:119](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L119) --- @@ -350,7 +354,7 @@ Wrapper of built-in `libmxnet` data iterators. Exception thrown when an error occurred calling MXNet API. *source:* -[MXNet/src/init.jl:2](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/init.jl#L2) +[MXNet/src/init.jl:2](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/init.jl#L2) --- @@ -368,7 +372,7 @@ Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block *source:* -[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L32) +[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L32) --- @@ -379,7 +383,7 @@ A tuple of (slice, NDArray). Usually each NDArray resides on a different device, *source:* -[MXNet/src/io.jl:63](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/io.jl#L63) +[MXNet/src/io.jl:79](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L79) --- @@ -403,7 +407,7 @@ which will do inplace adding of the contents of b into a. *source:* -[MXNet/src/ndarray.jl:234](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/ndarray.jl#L234) +[MXNet/src/ndarray.jl:234](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L234) --- @@ -412,5 +416,5 @@ which will do inplace adding of the contents of b into a. 
Utility macro to call MXNet API functions *source:* -[MXNet/src/init.jl:41](https://github.com/dmlc/MXNet.jl/tree/aa18e9880436a496c020e8600268bba4e60efdc7/src/init.jl#L41) +[MXNet/src/init.jl:41](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/init.jl#L41) diff --git a/docs/api/index.md b/docs/api/index.md deleted file mode 100644 index aa274bb16cd5..000000000000 --- a/docs/api/index.md +++ /dev/null @@ -1,81 +0,0 @@ -# API-INDEX - - -## MODULE: MXNet.mx - ---- - -## Methods [Internal] - -[_compose!(sym::MXNet.mx.Symbol)](MXNet.md#method___compose.1) Compose symbol on inputs - -[_default_get_name!(counter::Dict{Symbol, Int64}, name::Union{AbstractString, Symbol}, hint::Union{AbstractString, Symbol})](MXNet.md#method___default_get_name.1) Default implementation for generating a name for a symbol. - -[_import_ndarray_functions()](MXNet.md#method___import_ndarray_functions.1) Import dynamic functions for NDArrays. The arguments to the functions are typically ordered - -[_split_inputs(batch_size::Int64, n_split::Int64)](MXNet.md#method___split_inputs.1) Get a split of `batch_size` into `n_split` pieces for data parallelization. 
Returns a vector - -[copy!(dst::Array{Float32, N}, src::MXNet.mx.NDArray)](MXNet.md#method__copy.1) Copy data from NDArray to Julia Array - -[copy!(dst::MXNet.mx.NDArray, src::MXNet.mx.NDArray)](MXNet.md#method__copy.2) Copy data between NDArrays - -[copy!{T<:Real}(dst::MXNet.mx.NDArray, src::Array{T<:Real, N})](MXNet.md#method__copy.3) Copy data from Julia Array to NDArray - -[copy(arr::MXNet.mx.NDArray)](MXNet.md#method__copy.4) Create copy: NDArray -> Julia Array - -[copy(arr::MXNet.mx.NDArray, ctx::MXNet.mx.Context)](MXNet.md#method__copy.5) Create copy: NDArray -> NDArray in a given context - -[copy{T<:Real}(arr::Array{T<:Real, N}, ctx::MXNet.mx.Context)](MXNet.md#method__copy.6) Create copy: Julia Array -> NDArray in a given context - -[get_internals(self::MXNet.mx.Symbol)](MXNet.md#method__get_internals.1) Get a new grouped symbol whose output contains all the internal outputs of this symbol. - -[group(symbols::MXNet.mx.Symbol...)](MXNet.md#method__group.1) Create a symbol that groups symbols together - -[list_auxiliary_states(self::MXNet.mx.Symbol)](MXNet.md#method__list_auxiliary_states.1) List all auxiliary states in the symbool. - -[ones{N}(shape::NTuple{N, Int64})](MXNet.md#method__ones.1) Create NDArray and initialize with 1 - -[ones{N}(shape::NTuple{N, Int64}, ctx::MXNet.mx.Context)](MXNet.md#method__ones.2) Create NDArray and initialize with 1 - -[setindex!(arr::MXNet.mx.NDArray, val::Real, ::Colon)](MXNet.md#method__setindex.1) Assign all elements of an NDArray to a scalar - -[size(arr::MXNet.mx.NDArray)](MXNet.md#method__size.1) Get the shape of an `NDArray`. Note the shape is converted to Julia convention. - -[slice(arr::MXNet.mx.NDArray, ::Colon)](MXNet.md#method__slice.1) `slice` create a view into a sub-slice of an `NDArray`. 
Note only slicing at the slowest - -[variable(name::Union{AbstractString, Symbol})](MXNet.md#method__variable.1) Create a symbolic variable with the given name - -[zeros{N}(shape::NTuple{N, Int64})](MXNet.md#method__zeros.1) Create zero-ed NDArray of specific shape - -[zeros{N}(shape::NTuple{N, Int64}, ctx::MXNet.mx.Context)](MXNet.md#method__zeros.2) Create zero-ed NDArray of specific shape - ---- - -## Types [Internal] - -[MXNet.mx.AbstractDataBatch](MXNet.md#type__abstractdatabatch.1) Root type for data batch - -[MXNet.mx.AbstractDataProvider](MXNet.md#type__abstractdataprovider.1) Root type for data provider - -[MXNet.mx.AbstractDataProviderState](MXNet.md#type__abstractdataproviderstate.1) Root type for states of data provider - -[MXNet.mx.MXDataProvider](MXNet.md#type__mxdataprovider.1) Wrapper of built-in `libmxnet` data iterators. - -[MXNet.mx.MXError](MXNet.md#type__mxerror.1) Exception thrown when an error occurred calling MXNet API. - -[MXNet.mx.NDArray](MXNet.md#type__ndarray.1) Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block - ---- - -## Typealiass [Internal] - -[SlicedNDArray](MXNet.md#typealias__slicedndarray.1) A tuple of (slice, NDArray). 
Usually each NDArray resides on a different device, and each - ---- - -## Macros [Internal] - -[@inplace(stmt)](MXNet.md#macro___inplace.1) Julia does not support re-definiton of += operator (like __iadd__ in python), - -[@mxcall(fv, argtypes, args...)](MXNet.md#macro___mxcall.1) Utility macro to call MXNet API functions - diff --git a/docs/build.jl b/docs/build.jl index d6a4ec9ef5d5..11a45ec75883 100644 --- a/docs/build.jl +++ b/docs/build.jl @@ -3,6 +3,5 @@ using Lexicon config = Config(md_permalink = false, mathjax = true) -index = save("api/MXNet.md", MXNet.mx, config) -save("api/index.md", Index([index]), config; md_subheader = :category) +index = save("api/MXNet.md", mx, config) diff --git a/docs/index.rst b/docs/index.rst index 81b86df5034d..b2598cac01bb 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -11,6 +11,12 @@ Contents: .. toctree:: :maxdepth: 2 +API Documentation +----------------- + +.. toctree:: + :maxdepth: 1 + api/MXNet diff --git a/src/io.jl b/src/io.jl index cf618be3e4a4..78fb7cefc22c 100644 --- a/src/io.jl +++ b/src/io.jl @@ -1,56 +1,72 @@ """Root type for data provider - A data provider provides interface to iterate over a dataset. It should implement the following functions: +A data provider provides interface to iterate over a dataset. It should implement the following functions: - provide_data(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} - provide_label(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} +```julia +provide_data(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} +provide_label(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} +``` - Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, - `[(:data, (100,1,28,28))]` or `[(:softmax_label, (100,1))]`. 
It should also implement the following convenient - function +Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, +`[(:data, (100,1,28,28))]` or `[(:softmax_label, (100,1))]`. It should also implement the following convenient +function - get_batch_size(provider :: AbstractDataProvider) => Int +```julia +get_batch_size(provider :: AbstractDataProvider) => Int +``` - which returns the batch size used in this data provider. +which returns the batch size used in this data provider. - A data provider should implement the standard Julia iteration interface, including `Base.start`, - `Base.next`, `Base.done` and `Base.eltype`. It could safely assume that the interface functions will - always be called like +A data provider should implement the standard Julia iteration interface, including `Base.start`, +`Base.next`, `Base.done` and `Base.eltype`. It could safely assume that the interface functions will +always be called like - for batch in provider - # ... - load_data!(batch, targets) - end +```julia +for batch in provider + # ... + load_data!(batch, targets) +end +``` - which translates into +which translates into - state = Base.start(provider) - while !done(provider, state) - (batch, state) = next(provider, state) - # ... - load_data!(batch, targets) - end +```julia +state = Base.start(provider) +while !done(provider, state) + (batch, state) = next(provider, state) + # ... + load_data!(batch, targets) +end +``` - In other words, it could safely assume that `Base.next` is always called after `Base.done`. And neither - of those function will be called twice consequtively. The detailed interfaces are list below: +In other words, it could safely assume that `Base.next` is always called after `Base.done`. And neither +of those function will be called twice consequtively. 
The detailed interfaces are list below: - Base.start(provider :: AbstractDataProvider) => AbstractDataProviderState +```julia +Base.start(provider :: AbstractDataProvider) => AbstractDataProviderState +``` - Initialize or reset the data iteration. +Initialize or reset the data iteration. - Base.next(provider :: AbstractDataProvider, state :: AbstractDataProviderState) - => (AbstractDataBatch, AbstractDataProviderState) +```julia +Base.next(provider :: AbstractDataProvider, state :: AbstractDataProviderState) + => (AbstractDataBatch, AbstractDataProviderState) +``` - Return one batch of data. Actual data can be retrieved from the batch by interface functions described - in the document of type `AbstractDataBatch`. +Return one batch of data. Actual data can be retrieved from the batch by interface functions described +in the document of type `AbstractDataBatch`. - Base.done(provider :: AbstractDataProvider, state :: AbstractDataProviderState) => Bool +```julia +Base.done(provider :: AbstractDataProvider, state :: AbstractDataProviderState) => Bool +``` - Return `false` if there is more batch to get. +Return `false` if there is more batch to get. - Base.eltype(::Type{MyDataProvider}) => MyDataProviderState +```julia +Base.eltype(::Type{MyDataProvider}) => MyDataProviderState +``` - Return the type of the data provider state. +Return the type of the data provider state. """ abstract AbstractDataProvider @@ -64,28 +80,32 @@ typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} """Root type for data batch - A data batch must implement the following interface function to actually provide the data and label. +A data batch must implement the following interface function to actually provide the data and label. 
- load_data!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - load_label!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) +```julia +load_data!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) +load_label!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) +``` - Load data and label into targets. The targets is a list of target that the data/label should be - copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and - `provide_label`. Each entry in the list is again a list of `SlicedNDArray`, corresponding the - memory buffer for each device. +Load data and label into targets. The targets is a list of target that the data/label should be +copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and +`provide_label`. Each entry in the list is again a list of `SlicedNDArray`, corresponding the +memory buffer for each device. - The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. +The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. - The following function should also be implemented to handle the case when the mini-batch size does not - divide the size of the whole dataset. So in the last mini-batch, the actual data copied might be fewer - than the mini-batch size. This is usually not an issue during the training as the remaining space may - contain the data and label copied during the previous mini-batch are still valid data. However, during - testing, especially when doing feature extraction, we need to be precise about the number of samples - processed. +The following function should also be implemented to handle the case when the mini-batch size does not +divide the size of the whole dataset. So in the last mini-batch, the actual data copied might be fewer +than the mini-batch size. 
This is usually not an issue during the training as the remaining space may +contain the data and label copied during the previous mini-batch are still valid data. However, during +testing, especially when doing feature extraction, we need to be precise about the number of samples +processed. - get_pad(batch :: AbstractDataBatch) +```julia +get_pad(batch :: AbstractDataBatch) +``` - Return the number of *dummy samples* in this mini-batch. +Return the number of *dummy samples* in this mini-batch. """ abstract AbstractDataBatch diff --git a/src/name.jl b/src/name.jl index 5644809c79f9..5ebf10917ce6 100644 --- a/src/name.jl +++ b/src/name.jl @@ -4,11 +4,9 @@ typealias NameCounter Dict{Base.Symbol, Int} import Base: get! -"""Default implementation for generating a name for a symbol. - -When a name is specified by the user, it will be used. Otherwise, a name -is automatically generated based on the hint string. -""" +# Default implementation for generating a name for a symbol. +# When a name is specified by the user, it will be used. Otherwise, a name +# is automatically generated based on the hint string. function _default_get_name!(counter :: NameCounter, name :: NameType, hint :: NameType) if isa(name, Base.Symbol) || !isempty(name) return symbol(name) diff --git a/src/ndarray.jl b/src/ndarray.jl index 1d80dcdbdd51..bdc9775d5e87 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -343,20 +343,26 @@ end Import dynamic functions for NDArrays. The arguments to the functions are typically ordered as - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) +```julia +func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) +``` unless NDARRAY_ARG_BEFORE_SCALAR is not set. In this case, the scalars are put before the input arguments: - func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) +```julia +func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) 
+``` -If ACCEPT_EMPTY_MUTATE_TARGET is set. An overloaded function without the output arguments will also be defined: +If `ACCEPT_EMPTY_MUTATE_TARGET` is set. An overloaded function without the output arguments will also be defined: - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) +```julia +func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) +``` Upon calling, the output arguments will be automatically initialized with empty NDArrays. Those functions always return the output arguments. If there is only one output (the typical situation), that -object (NDArray) is returned. Otherwise, a tuple containing all the outputs will be returned. +object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. """ function _import_ndarray_functions() n_ref = Ref{MX_uint}(0) diff --git a/src/symbol.jl b/src/symbol.jl index 85799d524c51..921671e394e9 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -195,7 +195,6 @@ function ./(self :: Symbol, arg :: Symbol) _Div(self, arg) end -"Compose symbol on inputs" function _compose!(sym :: Symbol; kwargs...) 
name = char_p(0) arg_keys = AbstractString[] From d13ddc6542bdb00e26b87e721a9b0e79a22bbd66 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 Oct 2015 01:16:10 -0400 Subject: [PATCH 075/630] clean up Context --- src/context.jl | 19 ++++++++++--------- src/ndarray.jl | 17 +++++++++++++---- src/random.jl | 10 ++++++++-- test/unittest/ndarray.jl | 6 +++--- 4 files changed, 34 insertions(+), 18 deletions(-) diff --git a/src/context.jl b/src/context.jl index 06062500be6c..5146d4afcb64 100644 --- a/src/context.jl +++ b/src/context.jl @@ -1,18 +1,19 @@ @enum CONTEXT_TYPE CPU=1 GPU=2 CPU_PINNED=3 -type Context +immutable Context device_type :: CONTEXT_TYPE - device_id :: Cint - - old_ctx :: Nullable{Context} + device_id :: Int end -Context(dev_type :: Union{CONTEXT_TYPE, Integer}, dev_id :: Integer = 0) = - Context(convert(CONTEXT_TYPE, dev_type), convert(Cint, dev_id), Nullable{Context}()) +Context(dev_type :: Union{CONTEXT_TYPE, Int}, dev_id :: Int = 0) = + Context(convert(CONTEXT_TYPE, dev_type), dev_id) function Base.show(io :: IO, ctx :: Context) print(io, "$(ctx.device_type)$(ctx.device_id)") end - -# global default context -DEFAULT_CONTEXT = Context(CPU) +function cpu(dev_id::Int=0) + return Context(CPU, dev_id) +end +function gpu(dev_id::Int=0) + return Context(GPU, dev_id) +end diff --git a/src/ndarray.jl b/src/ndarray.jl index bdc9775d5e87..d5a61a173a34 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -43,7 +43,7 @@ function Base.show(io :: IO, arr :: NDArray) end function NDArray{T<:Real}(data :: Array{T}) - copy(data, mx.DEFAULT_CONTEXT) + copy(data, cpu()) end function Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) @@ -63,7 +63,10 @@ function context(arr :: NDArray) return Context(ref_typeid[], ref_devid[]) end -function empty{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) +function empty{N}(shape :: NTuple{N, Int}) + empty(shape, cpu()) +end +function empty{N}(shape :: NTuple{N, Int}, ctx :: Context) 
NDArray(_ndarray_alloc(shape, ctx, false)) end function empty(shape :: Int...) @@ -99,7 +102,10 @@ function eltype(arr :: NDArray) end "Create zero-ed NDArray of specific shape" -function zeros{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) +function zeros{N}(shape :: NTuple{N, Int}) + zeros(shape, cpu()) +end +function zeros{N}(shape :: NTuple{N, Int}, ctx :: Context) arr = empty(shape, ctx) arr[:] = 0 return arr @@ -109,7 +115,10 @@ function zeros(shape :: Int...) end "Create NDArray and initialize with 1" -function ones{N}(shape :: NTuple{N, Int}, ctx :: Context = DEFAULT_CONTEXT) +function ones{N}(shape :: NTuple{N, Int}) + ones(shape, cpu()) +end +function ones{N}(shape :: NTuple{N, Int}, ctx :: Context) arr = empty(shape, ctx) arr[:] = 1 return arr diff --git a/src/random.jl b/src/random.jl index 82b0aea97582..79a8b6e9e20b 100644 --- a/src/random.jl +++ b/src/random.jl @@ -1,7 +1,10 @@ function rand!(low::Real, high::Real, out::NDArray) _random_uniform(low, high, out) end -function rand(low::Real, high::Real, shape::Tuple, ctx::Context=DEFAULT_CONTEXT) +function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}) + rand(low, high, shape, cpu()) +end +function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context) out = empty(shape, ctx) rand!(low, high, out) end @@ -9,7 +12,10 @@ end function randn!(mean::Real, stdvar::Real, out::NDArray) _random_gaussian(mean, stdvar, out) end -function randn(mean::Real, stdvar::Real, shape::Tuple, ctx::Context=DEFAULT_CONTEXT) +function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}) + randn(mean, stdvar, shape, cpu()) +end +function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context) out = empty(shape, ctx) randn!(mean, stdvar, out) end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index d547159af1e2..7d5df826f32b 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -9,7 +9,7 @@ using ..Main: rand_dims, reldiff 
################################################################################ function rand_tensors{N}(dims::NTuple{N, Int}) tensor = rand(mx.MX_float, dims) - array = copy(tensor, mx.DEFAULT_CONTEXT) + array = copy(tensor, mx.cpu()) return (tensor, array) end @@ -20,12 +20,12 @@ function test_copy() info("NDArray::copy::dims = $dims") # copy to NDArray and back - array = copy(tensor, mx.DEFAULT_CONTEXT) + array = copy(tensor, mx.cpu()) tensor2 = copy(array) @test reldiff(tensor, tensor2) < 1e-6 # copy between NDArray - array2 = copy(array, mx.DEFAULT_CONTEXT) + array2 = copy(array, mx.cpu()) tensor2 = copy(array2) @test reldiff(tensor, tensor2) < 1e-6 end From 70579c4cace6dbdafd34a4fced7fc7d5e83bb842 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 Oct 2015 01:59:47 -0400 Subject: [PATCH 076/630] use light-weighted mkdocs for documentation instead --- docs/Makefile | 192 -------------------- docs/api/MXNet.md | 420 -------------------------------------------- docs/api/ndarray.md | 189 ++++++++++++++++++++ docs/api/symbol.md | 46 +++++ docs/build.jl | 16 +- docs/conf.py | 303 -------------------------------- docs/index.md | 0 docs/index.rst | 29 --- docs/make.bat | 263 --------------------------- mkdocs.yml | 9 + src/ndarray.jl | 38 ++-- 11 files changed, 280 insertions(+), 1225 deletions(-) delete mode 100644 docs/Makefile delete mode 100644 docs/api/MXNet.md create mode 100644 docs/api/ndarray.md create mode 100644 docs/api/symbol.md delete mode 100644 docs/conf.py create mode 100644 docs/index.md delete mode 100644 docs/index.rst delete mode 100644 docs/make.bat create mode 100644 mkdocs.yml diff --git a/docs/Makefile b/docs/Makefile deleted file mode 100644 index ce3d7abdbfaa..000000000000 --- a/docs/Makefile +++ /dev/null @@ -1,192 +0,0 @@ -# Makefile for Sphinx documentation -# - -# You can set these variables from the command line. 
-SPHINXOPTS = -SPHINXBUILD = sphinx-build -PAPER = -BUILDDIR = _build - -# User-friendly check for sphinx-build -ifeq ($(shell which $(SPHINXBUILD) >/dev/null 2>&1; echo $$?), 1) -$(error The '$(SPHINXBUILD)' command was not found. Make sure you have Sphinx installed, then set the SPHINXBUILD environment variable to point to the full path of the '$(SPHINXBUILD)' executable. Alternatively you can add the directory with the executable to your PATH. If you don't have Sphinx installed, grab it from http://sphinx-doc.org/) -endif - -# Internal variables. -PAPEROPT_a4 = -D latex_paper_size=a4 -PAPEROPT_letter = -D latex_paper_size=letter -ALLSPHINXOPTS = -d $(BUILDDIR)/doctrees $(PAPEROPT_$(PAPER)) $(SPHINXOPTS) . -# the i18n builder cannot share the environment and doctrees with the others -I18NSPHINXOPTS = $(PAPEROPT_$(PAPER)) $(SPHINXOPTS) . - -.PHONY: help clean html dirhtml singlehtml pickle json htmlhelp qthelp devhelp epub latex latexpdf text man changes linkcheck doctest coverage gettext - -help: - @echo "Please use \`make ' where is one of" - @echo " html to make standalone HTML files" - @echo " dirhtml to make HTML files named index.html in directories" - @echo " singlehtml to make a single large HTML file" - @echo " pickle to make pickle files" - @echo " json to make JSON files" - @echo " htmlhelp to make HTML files and a HTML help project" - @echo " qthelp to make HTML files and a qthelp project" - @echo " applehelp to make an Apple Help Book" - @echo " devhelp to make HTML files and a Devhelp project" - @echo " epub to make an epub" - @echo " latex to make LaTeX files, you can set PAPER=a4 or PAPER=letter" - @echo " latexpdf to make LaTeX files and run them through pdflatex" - @echo " latexpdfja to make LaTeX files and run them through platex/dvipdfmx" - @echo " text to make text files" - @echo " man to make manual pages" - @echo " texinfo to make Texinfo files" - @echo " info to make Texinfo files and run them through makeinfo" - @echo " gettext to make PO 
message catalogs" - @echo " changes to make an overview of all changed/added/deprecated items" - @echo " xml to make Docutils-native XML files" - @echo " pseudoxml to make pseudoxml-XML files for display purposes" - @echo " linkcheck to check all external links for integrity" - @echo " doctest to run all doctests embedded in the documentation (if enabled)" - @echo " coverage to run coverage check of the documentation (if enabled)" - -clean: - rm -rf $(BUILDDIR)/* - -html: - $(SPHINXBUILD) -b html $(ALLSPHINXOPTS) $(BUILDDIR)/html - @echo - @echo "Build finished. The HTML pages are in $(BUILDDIR)/html." - -dirhtml: - $(SPHINXBUILD) -b dirhtml $(ALLSPHINXOPTS) $(BUILDDIR)/dirhtml - @echo - @echo "Build finished. The HTML pages are in $(BUILDDIR)/dirhtml." - -singlehtml: - $(SPHINXBUILD) -b singlehtml $(ALLSPHINXOPTS) $(BUILDDIR)/singlehtml - @echo - @echo "Build finished. The HTML page is in $(BUILDDIR)/singlehtml." - -pickle: - $(SPHINXBUILD) -b pickle $(ALLSPHINXOPTS) $(BUILDDIR)/pickle - @echo - @echo "Build finished; now you can process the pickle files." - -json: - $(SPHINXBUILD) -b json $(ALLSPHINXOPTS) $(BUILDDIR)/json - @echo - @echo "Build finished; now you can process the JSON files." - -htmlhelp: - $(SPHINXBUILD) -b htmlhelp $(ALLSPHINXOPTS) $(BUILDDIR)/htmlhelp - @echo - @echo "Build finished; now you can run HTML Help Workshop with the" \ - ".hhp project file in $(BUILDDIR)/htmlhelp." - -qthelp: - $(SPHINXBUILD) -b qthelp $(ALLSPHINXOPTS) $(BUILDDIR)/qthelp - @echo - @echo "Build finished; now you can run "qcollectiongenerator" with the" \ - ".qhcp project file in $(BUILDDIR)/qthelp, like this:" - @echo "# qcollectiongenerator $(BUILDDIR)/qthelp/MXNetjl.qhcp" - @echo "To view the help file:" - @echo "# assistant -collectionFile $(BUILDDIR)/qthelp/MXNetjl.qhc" - -applehelp: - $(SPHINXBUILD) -b applehelp $(ALLSPHINXOPTS) $(BUILDDIR)/applehelp - @echo - @echo "Build finished. The help book is in $(BUILDDIR)/applehelp." - @echo "N.B. 
You won't be able to view it unless you put it in" \ - "~/Library/Documentation/Help or install it in your application" \ - "bundle." - -devhelp: - $(SPHINXBUILD) -b devhelp $(ALLSPHINXOPTS) $(BUILDDIR)/devhelp - @echo - @echo "Build finished." - @echo "To view the help file:" - @echo "# mkdir -p $$HOME/.local/share/devhelp/MXNetjl" - @echo "# ln -s $(BUILDDIR)/devhelp $$HOME/.local/share/devhelp/MXNetjl" - @echo "# devhelp" - -epub: - $(SPHINXBUILD) -b epub $(ALLSPHINXOPTS) $(BUILDDIR)/epub - @echo - @echo "Build finished. The epub file is in $(BUILDDIR)/epub." - -latex: - $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex - @echo - @echo "Build finished; the LaTeX files are in $(BUILDDIR)/latex." - @echo "Run \`make' in that directory to run these through (pdf)latex" \ - "(use \`make latexpdf' here to do that automatically)." - -latexpdf: - $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex - @echo "Running LaTeX files through pdflatex..." - $(MAKE) -C $(BUILDDIR)/latex all-pdf - @echo "pdflatex finished; the PDF files are in $(BUILDDIR)/latex." - -latexpdfja: - $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex - @echo "Running LaTeX files through platex and dvipdfmx..." - $(MAKE) -C $(BUILDDIR)/latex all-pdf-ja - @echo "pdflatex finished; the PDF files are in $(BUILDDIR)/latex." - -text: - $(SPHINXBUILD) -b text $(ALLSPHINXOPTS) $(BUILDDIR)/text - @echo - @echo "Build finished. The text files are in $(BUILDDIR)/text." - -man: - $(SPHINXBUILD) -b man $(ALLSPHINXOPTS) $(BUILDDIR)/man - @echo - @echo "Build finished. The manual pages are in $(BUILDDIR)/man." - -texinfo: - $(SPHINXBUILD) -b texinfo $(ALLSPHINXOPTS) $(BUILDDIR)/texinfo - @echo - @echo "Build finished. The Texinfo files are in $(BUILDDIR)/texinfo." - @echo "Run \`make' in that directory to run these through makeinfo" \ - "(use \`make info' here to do that automatically)." 
- -info: - $(SPHINXBUILD) -b texinfo $(ALLSPHINXOPTS) $(BUILDDIR)/texinfo - @echo "Running Texinfo files through makeinfo..." - make -C $(BUILDDIR)/texinfo info - @echo "makeinfo finished; the Info files are in $(BUILDDIR)/texinfo." - -gettext: - $(SPHINXBUILD) -b gettext $(I18NSPHINXOPTS) $(BUILDDIR)/locale - @echo - @echo "Build finished. The message catalogs are in $(BUILDDIR)/locale." - -changes: - $(SPHINXBUILD) -b changes $(ALLSPHINXOPTS) $(BUILDDIR)/changes - @echo - @echo "The overview file is in $(BUILDDIR)/changes." - -linkcheck: - $(SPHINXBUILD) -b linkcheck $(ALLSPHINXOPTS) $(BUILDDIR)/linkcheck - @echo - @echo "Link check complete; look for any errors in the above output " \ - "or in $(BUILDDIR)/linkcheck/output.txt." - -doctest: - $(SPHINXBUILD) -b doctest $(ALLSPHINXOPTS) $(BUILDDIR)/doctest - @echo "Testing of doctests in the sources finished, look at the " \ - "results in $(BUILDDIR)/doctest/output.txt." - -coverage: - $(SPHINXBUILD) -b coverage $(ALLSPHINXOPTS) $(BUILDDIR)/coverage - @echo "Testing of coverage in the sources finished, look at the " \ - "results in $(BUILDDIR)/coverage/python.txt." - -xml: - $(SPHINXBUILD) -b xml $(ALLSPHINXOPTS) $(BUILDDIR)/xml - @echo - @echo "Build finished. The XML files are in $(BUILDDIR)/xml." - -pseudoxml: - $(SPHINXBUILD) -b pseudoxml $(ALLSPHINXOPTS) $(BUILDDIR)/pseudoxml - @echo - @echo "Build finished. The pseudo-XML files are in $(BUILDDIR)/pseudoxml." diff --git a/docs/api/MXNet.md b/docs/api/MXNet.md deleted file mode 100644 index d4b273ba417d..000000000000 --- a/docs/api/MXNet.md +++ /dev/null @@ -1,420 +0,0 @@ -# MXNet.mx - -## Internal - ---- - - -#### _import_ndarray_functions() -Import dynamic functions for NDArrays. The arguments to the functions are typically ordered -as - -```julia -func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) -``` - -unless NDARRAY_ARG_BEFORE_SCALAR is not set. 
In this case, the scalars are put before the input arguments: - -```julia -func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) -``` - -If `ACCEPT_EMPTY_MUTATE_TARGET` is set. An overloaded function without the output arguments will also be defined: - -```julia -func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) -``` - -Upon calling, the output arguments will be automatically initialized with empty NDArrays. - -Those functions always return the output arguments. If there is only one output (the typical situation), that -object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. - - -*source:* -[MXNet/src/ndarray.jl:367](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L367) - ---- - - -#### _split_inputs(batch_size::Int64, n_split::Int64) -Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector - of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that - piece. 
- - -*source:* -[MXNet/src/estimator.jl:18](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/estimator.jl#L18) - ---- - - -#### copy!(dst::Array{Float32, N}, src::MXNet.mx.NDArray) -Copy data from NDArray to Julia Array - -*source:* -[MXNet/src/ndarray.jl:178](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L178) - ---- - - -#### copy!(dst::MXNet.mx.NDArray, src::MXNet.mx.NDArray) -Copy data between NDArrays - -*source:* -[MXNet/src/ndarray.jl:166](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L166) - ---- - - -#### copy!{T<:Real}(dst::MXNet.mx.NDArray, src::Array{T<:Real, N}) -Copy data from Julia Array to NDArray - -*source:* -[MXNet/src/ndarray.jl:186](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L186) - ---- - - -#### copy(arr::MXNet.mx.NDArray) -Create copy: NDArray -> Julia Array - -*source:* -[MXNet/src/ndarray.jl:196](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L196) - ---- - - -#### copy(arr::MXNet.mx.NDArray, ctx::MXNet.mx.Context) -Create copy: NDArray -> NDArray in a given context - -*source:* -[MXNet/src/ndarray.jl:202](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L202) - ---- - - -#### copy{T<:Real}(arr::Array{T<:Real, N}, ctx::MXNet.mx.Context) -Create copy: Julia Array -> NDArray in a given context - -*source:* -[MXNet/src/ndarray.jl:208](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L208) - ---- - - -#### get_internals(self::MXNet.mx.Symbol) -Get a new grouped symbol whose output contains all the internal outputs of this symbol. - -*source:* -[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/symbol.jl#L63) - ---- - - -#### group(symbols::MXNet.mx.Symbol...) 
-Create a symbol that groups symbols together - -*source:* -[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/symbol.jl#L77) - ---- - - -#### list_auxiliary_states(self::MXNet.mx.Symbol) -List all auxiliary states in the symbool. - -Auxiliary states are special states of symbols that do not corresponds to an argument, -and do not have gradient. But still be useful for the specific operations. -A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. -Most operators do not have Auxiliary states. - - -*source:* -[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/symbol.jl#L58) - ---- - - -#### ones{N}(shape::NTuple{N, Int64}) -Create NDArray and initialize with 1 - -*source:* -[MXNet/src/ndarray.jl:112](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L112) - ---- - - -#### ones{N}(shape::NTuple{N, Int64}, ctx::MXNet.mx.Context) -Create NDArray and initialize with 1 - -*source:* -[MXNet/src/ndarray.jl:112](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L112) - ---- - - -#### setindex!(arr::MXNet.mx.NDArray, val::Real, ::Colon) -Assign all elements of an NDArray to a scalar - -*source:* -[MXNet/src/ndarray.jl:146](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L146) - ---- - - -#### size(arr::MXNet.mx.NDArray) -Get the shape of an `NDArray`. Note the shape is converted to Julia convention. - So the same piece of memory, in Julia (column-major), with shape (K, M, N), will be of the - shape (N, M, K) in the Python (row-major) binding. - - -*source:* -[MXNet/src/ndarray.jl:81](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L81) - ---- - - -#### slice(arr::MXNet.mx.NDArray, ::Colon) -`slice` create a view into a sub-slice of an `NDArray`. 
Note only slicing at the slowest - changing dimension is supported. In Julia's column-major perspective, this is the last - dimension. For example, given an `NDArray` of shape (2,3,4), `sub(array, 2:3)` will create - a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is - used in data parallelization to split mini-batch into sub-batches for different devices. - - -*source:* -[MXNet/src/ndarray.jl:128](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L128) - ---- - - -#### variable(name::Union{AbstractString, Symbol}) -Create a symbolic variable with the given name - -*source:* -[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/symbol.jl#L70) - ---- - - -#### zeros{N}(shape::NTuple{N, Int64}) -Create zero-ed NDArray of specific shape - -*source:* -[MXNet/src/ndarray.jl:102](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L102) - ---- - - -#### zeros{N}(shape::NTuple{N, Int64}, ctx::MXNet.mx.Context) -Create zero-ed NDArray of specific shape - -*source:* -[MXNet/src/ndarray.jl:102](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L102) - ---- - - -#### MXNet.mx.AbstractDataBatch -Root type for data batch - -A data batch must implement the following interface function to actually provide the data and label. - -```julia -load_data!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) -load_label!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) -``` - -Load data and label into targets. The targets is a list of target that the data/label should be -copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and -`provide_label`. Each entry in the list is again a list of `SlicedNDArray`, corresponding the -memory buffer for each device. 
- -The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. - -The following function should also be implemented to handle the case when the mini-batch size does not -divide the size of the whole dataset. So in the last mini-batch, the actual data copied might be fewer -than the mini-batch size. This is usually not an issue during the training as the remaining space may -contain the data and label copied during the previous mini-batch are still valid data. However, during -testing, especially when doing feature extraction, we need to be precise about the number of samples -processed. - -```julia -get_pad(batch :: AbstractDataBatch) -``` - -Return the number of *dummy samples* in this mini-batch. - - -*source:* -[MXNet/src/io.jl:110](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L110) - ---- - - -#### MXNet.mx.AbstractDataProvider -Root type for data provider - -A data provider provides interface to iterate over a dataset. It should implement the following functions: - -```julia -provide_data(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} -provide_label(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} -``` - -Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, -`[(:data, (100,1,28,28))]` or `[(:softmax_label, (100,1))]`. It should also implement the following convenient -function - -```julia -get_batch_size(provider :: AbstractDataProvider) => Int -``` - -which returns the batch size used in this data provider. - -A data provider should implement the standard Julia iteration interface, including `Base.start`, -`Base.next`, `Base.done` and `Base.eltype`. It could safely assume that the interface functions will -always be called like - -```julia -for batch in provider - # ... 
- load_data!(batch, targets) -end -``` - -which translates into - -```julia -state = Base.start(provider) -while !done(provider, state) - (batch, state) = next(provider, state) - # ... - load_data!(batch, targets) -end -``` - -In other words, it could safely assume that `Base.next` is always called after `Base.done`. And neither -of those function will be called twice consequtively. The detailed interfaces are list below: - -```julia -Base.start(provider :: AbstractDataProvider) => AbstractDataProviderState -``` - -Initialize or reset the data iteration. - -```julia -Base.next(provider :: AbstractDataProvider, state :: AbstractDataProviderState) - => (AbstractDataBatch, AbstractDataProviderState) -``` - -Return one batch of data. Actual data can be retrieved from the batch by interface functions described -in the document of type `AbstractDataBatch`. - -```julia -Base.done(provider :: AbstractDataProvider, state :: AbstractDataProviderState) => Bool -``` - -Return `false` if there is more batch to get. - -```julia -Base.eltype(::Type{MyDataProvider}) => MyDataProviderState -``` - -Return the type of the data provider state. - - -*source:* -[MXNet/src/io.jl:71](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L71) - ---- - - -#### MXNet.mx.AbstractDataProviderState -Root type for states of data provider - -*source:* -[MXNet/src/io.jl:74](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L74) - ---- - - -#### MXNet.mx.MXDataProvider -Wrapper of built-in `libmxnet` data iterators. - - -*source:* -[MXNet/src/io.jl:119](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L119) - ---- - - -#### MXNet.mx.MXError -Exception thrown when an error occurred calling MXNet API. 
- -*source:* -[MXNet/src/init.jl:2](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/init.jl#L2) - ---- - - -#### MXNet.mx.NDArray -Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block - of tensor-based computation. - - **Note** since C/C++ use row-major ordering for arrays while Julia follows a - column-major ordering. To keep things consistent, we keep the underlying data - in their original layout, but use *language-native* convention when we talk - about shapes. For example, a mini-batch of 100 MNIST images is a tensor of - C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory - have shape (28,28,1,100). - - -*source:* -[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L32) - ---- - - -#### SlicedNDArray -A tuple of (slice, NDArray). Usually each NDArray resides on a different device, and each - slice describe which part of a larger piece of data should goto that device. - - -*source:* -[MXNet/src/io.jl:79](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/io.jl#L79) - ---- - - -#### @inplace(stmt) -Julia does not support re-definiton of += operator (like __iadd__ in python), -When one write a += b, it gets translated to a = a+b. a+b will allocate new -memory for the results, and the newly allocated NDArray object is then assigned -back to a, while the original contents in a is discarded. This is very inefficient -when we want to do inplace update. - -This macro is a simple utility to implement this behavior. Write - - @mx.inplace a += b - -will translate into - - mx.add_to!(a, b) - -which will do inplace adding of the contents of b into a. - - -*source:* -[MXNet/src/ndarray.jl:234](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/ndarray.jl#L234) - ---- - - -#### @mxcall(fv, argtypes, args...) 
-Utility macro to call MXNet API functions - -*source:* -[MXNet/src/init.jl:41](https://github.com/dmlc/MXNet.jl/tree/34a1c89bf2b65351914e00ccd12a033df724a721/src/init.jl#L41) - diff --git a/docs/api/ndarray.md b/docs/api/ndarray.md new file mode 100644 index 000000000000..2ede7ba99e78 --- /dev/null +++ b/docs/api/ndarray.md @@ -0,0 +1,189 @@ +# MXNet.mx + +## Internal + +--- + + +#### _import_ndarray_functions() +Import dynamic functions for NDArrays. The arguments to the functions are typically ordered +as + +```julia +func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) +``` + +unless NDARRAY_ARG_BEFORE_SCALAR is not set. In this case, the scalars are put before the input arguments: + +```julia +func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) +``` + +If `ACCEPT_EMPTY_MUTATE_TARGET` is set, an overloaded function without the output arguments will also be defined: + +```julia +func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) +``` + +Upon calling, the output arguments will be automatically initialized with empty NDArrays. + +Those functions always return the output arguments. If there is only one output (the typical situation), that +object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. 
+ + +*source:* +[MXNet/src/ndarray.jl:380](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L380) + +--- + + +#### copy!(dst::Array{Float32, N}, src::MXNet.mx.NDArray) +Copy data from NDArray to Julia Array + +*source:* +[MXNet/src/ndarray.jl:187](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L187) + +--- + + +#### copy!(dst::MXNet.mx.NDArray, src::MXNet.mx.NDArray) +Copy data between NDArrays + +*source:* +[MXNet/src/ndarray.jl:175](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L175) + +--- + + +#### copy!{T<:Real}(dst::MXNet.mx.NDArray, src::Array{T<:Real, N}) +Copy data from Julia Array to NDArray + +*source:* +[MXNet/src/ndarray.jl:195](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L195) + +--- + + +#### copy(arr::MXNet.mx.NDArray) +Create copy: NDArray -> Julia Array + +*source:* +[MXNet/src/ndarray.jl:205](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L205) + +--- + + +#### copy(arr::MXNet.mx.NDArray, ctx::MXNet.mx.Context) +Create copy: NDArray -> NDArray in a given context + +*source:* +[MXNet/src/ndarray.jl:211](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L211) + +--- + + +#### copy{T<:Real}(arr::Array{T<:Real, N}, ctx::MXNet.mx.Context) +Create copy: Julia Array -> NDArray in a given context + +*source:* +[MXNet/src/ndarray.jl:217](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L217) + +--- + + +#### ones{N}(shape::NTuple{N, Int64}) +Create NDArray and initialize with 1 + +*source:* +[MXNet/src/ndarray.jl:118](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L118) + +--- + + +#### setindex!(arr::MXNet.mx.NDArray, val::Real, ::Colon) +Assign all elements of an NDArray to a scalar + 
+*source:* +[MXNet/src/ndarray.jl:155](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L155) + +--- + + +#### size(arr::MXNet.mx.NDArray) +Get the shape of an `NDArray`. Note the shape is converted to Julia convention. + So the same piece of memory, in Julia (column-major), with shape (K, M, N), will be of the + shape (N, M, K) in the Python (row-major) binding. + + +*source:* +[MXNet/src/ndarray.jl:84](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L84) + +--- + + +#### slice(arr::MXNet.mx.NDArray, ::Colon) +`slice` create a view into a sub-slice of an `NDArray`. Note only slicing at the slowest +changing dimension is supported. In Julia's column-major perspective, this is the last +dimension. For example, given an `NDArray` of shape (2,3,4), `sub(array, 2:3)` will create +a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is +used in data parallelization to split mini-batch into sub-batches for different devices. + + +*source:* +[MXNet/src/ndarray.jl:137](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L137) + +--- + + +#### zeros{N}(shape::NTuple{N, Int64}) +Create zero-ed NDArray of specific shape + +*source:* +[MXNet/src/ndarray.jl:105](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L105) + +--- + + +#### MXNet.mx.NDArray +Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block +of tensor-based computation. + +**Note** since C/C++ use row-major ordering for arrays while Julia follows a +column-major ordering. To keep things consistent, we keep the underlying data +in their original layout, but use *language-native* convention when we talk +about shapes. For example, a mini-batch of 100 MNIST images is a tensor of +C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory +have shape (28,28,1,100). 
+ + +*source:* +[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L32) + +--- + + +#### @inplace(stmt) +Julia does not support re-definition of `+=` operator (like `__iadd__` in python), +When one writes `a += b`, it gets translated to `a = a+b`. `a+b` will allocate new +memory for the results, and the newly allocated `NDArray` object is then assigned +back to a, while the original contents in a is discarded. This is very inefficient +when we want to do inplace update. + +This macro is a simple utility to implement this behavior. Write + +```julia +@mx.inplace a += b +``` + +will translate into + +```julia +mx.add_to!(a, b) +``` + +which will do inplace adding of the contents of b into a. + + +*source:* +[MXNet/src/ndarray.jl:247](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L247) + diff --git a/docs/api/symbol.md b/docs/api/symbol.md new file mode 100644 index 000000000000..1172f54214df --- /dev/null +++ b/docs/api/symbol.md @@ -0,0 +1,46 @@ +# MXNet.mx + +## Internal + +--- + + +#### get_internals(self::MXNet.mx.Symbol) +Get a new grouped symbol whose output contains all the internal outputs of this symbol. + +*source:* +[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/symbol.jl#L63) + +--- + + +#### group(symbols::MXNet.mx.Symbol...) +Create a symbol that groups symbols together + +*source:* +[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/symbol.jl#L77) + +--- + + +#### list_auxiliary_states(self::MXNet.mx.Symbol) +List all auxiliary states in the symbol. + +Auxiliary states are special states of symbols that do not correspond to an argument, +and do not have gradient, but are still useful for the specific operations. +A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. 
+Most operators do not have Auxiliary states. + + +*source:* +[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/symbol.jl#L58) + +--- + + +#### variable(name::Union{AbstractString, Symbol}) +Create a symbolic variable with the given name + +*source:* +[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/symbol.jl#L70) + diff --git a/docs/build.jl b/docs/build.jl index 11a45ec75883..24c380f0f40a 100644 --- a/docs/build.jl +++ b/docs/build.jl @@ -3,5 +3,19 @@ using Lexicon config = Config(md_permalink = false, mathjax = true) -index = save("api/MXNet.md", mx, config) +function save_meta(file :: AbstractString, docs :: Lexicon.Metadata, order = [:source]) + isfile(file) || mkpath(dirname(file)) + open(file, "w") do io + for (k,v) in Lexicon.EachEntry(docs, order = order) + name = Lexicon.writeobj(k) + println(io, "#### $name") + println(io, v.docs.data) + end + end +end + +doc = Lexicon.metadata(MXNet.mx) +for mod in [:ndarray, :symbol] + save("api/$mod.md", MIME("text/md"), filter(doc, files=["$mod.jl"]), config) +end diff --git a/docs/conf.py b/docs/conf.py deleted file mode 100644 index 33f8b3ce6a42..000000000000 --- a/docs/conf.py +++ /dev/null @@ -1,303 +0,0 @@ -# -*- coding: utf-8 -*- -# -# MXNet.jl documentation build configuration file, created by -# sphinx-quickstart on Tue Oct 20 00:09:24 2015. -# -# This file is execfile()d with the current directory set to its -# containing dir. -# -# Note that not all possible configuration values are present in this -# autogenerated file. -# -# All configuration values have a default; values that are commented out -# serve to show the default. - -import sys -import os -import shlex - -# If extensions (or modules to document with autodoc) are in another directory, -# add these directories to sys.path here. 
If the directory is relative to the -# documentation root, use os.path.abspath to make it absolute, like shown here. -#sys.path.insert(0, os.path.abspath('.')) - -# -- General configuration ------------------------------------------------ - -# If your documentation needs a minimal Sphinx version, state it here. -#needs_sphinx = '1.0' - -# Add any Sphinx extension module names here, as strings. They can be -# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom -# ones. -extensions = [ - 'sphinx.ext.mathjax', -] - -# Add any paths that contain templates here, relative to this directory. -templates_path = ['_templates'] - -# The suffix(es) of source filenames. -# You can specify multiple suffix as a list of string: -# source_suffix = ['.rst', '.md'] -source_suffix = ['.rst', '.md'] - -from recommonmark.parser import CommonMarkParser - -source_parsers = { - '.md': CommonMarkParser, -} - -# The encoding of source files. -#source_encoding = 'utf-8-sig' - -# The master toctree document. -master_doc = 'index' - -# General information about the project. -project = u'MXNet.jl' -copyright = u'2015, pluskid' -author = u'pluskid' - -# The version info for the project you're documenting, acts as replacement for -# |version| and |release|, also used in various other places throughout the -# built documents. -# -# The short X.Y version. -version = '0.0.1' -# The full version, including alpha/beta/rc tags. -release = '0.0.1' - -# The language for content autogenerated by Sphinx. Refer to documentation -# for a list of supported languages. -# -# This is also used if you do content translation via gettext catalogs. -# Usually you set "language" from the command line for these cases. -language = None - -# There are two options for replacing |today|: either, you set today to some -# non-false value, then it is used: -#today = '' -# Else, today_fmt is used as the format for a strftime call. 
-#today_fmt = '%B %d, %Y' - -# List of patterns, relative to source directory, that match files and -# directories to ignore when looking for source files. -exclude_patterns = ['_build'] - -# The reST default role (used for this markup: `text`) to use for all -# documents. -#default_role = None - -# If true, '()' will be appended to :func: etc. cross-reference text. -#add_function_parentheses = True - -# If true, the current module name will be prepended to all description -# unit titles (such as .. function::). -#add_module_names = True - -# If true, sectionauthor and moduleauthor directives will be shown in the -# output. They are ignored by default. -#show_authors = False - -# The name of the Pygments (syntax highlighting) style to use. -pygments_style = 'sphinx' - -# A list of ignored prefixes for module index sorting. -#modindex_common_prefix = [] - -# If true, keep warnings as "system message" paragraphs in the built documents. -#keep_warnings = False - -# If true, `todo` and `todoList` produce output, else they produce nothing. -todo_include_todos = False - - -# -- Options for HTML output ---------------------------------------------- - -# The theme to use for HTML and HTML Help pages. See the documentation for -# a list of builtin themes. -html_theme = 'default' - -import os -on_rtd = os.environ.get('READTHEDOCS', None) == 'True' - -if not on_rtd: # only import and set the theme if we're building docs locally - try: - import sphinx_rtd_theme - html_theme = "sphinx_rtd_theme" - html_theme_path = [sphinx_rtd_theme.get_html_theme_path()] - except: - pass - -# Theme options are theme-specific and customize the look and feel of a theme -# further. For a list of options available for each theme, see the -# documentation. -#html_theme_options = {} - -# Add any paths that contain custom themes here, relative to this directory. -#html_theme_path = [] - -# The name for this set of Sphinx documents. If None, it defaults to -# " v documentation". 
-#html_title = None - -# A shorter title for the navigation bar. Default is the same as html_title. -#html_short_title = None - -# The name of an image file (relative to this directory) to place at the top -# of the sidebar. -#html_logo = None - -# The name of an image file (within the static path) to use as favicon of the -# docs. This file should be a Windows icon file (.ico) being 16x16 or 32x32 -# pixels large. -#html_favicon = None - -# Add any paths that contain custom static files (such as style sheets) here, -# relative to this directory. They are copied after the builtin static files, -# so a file named "default.css" will overwrite the builtin "default.css". -html_static_path = ['_static'] - -# Add any extra paths that contain custom files (such as robots.txt or -# .htaccess) here, relative to this directory. These files are copied -# directly to the root of the documentation. -#html_extra_path = [] - -# If not '', a 'Last updated on:' timestamp is inserted at every page bottom, -# using the given strftime format. -#html_last_updated_fmt = '%b %d, %Y' - -# If true, SmartyPants will be used to convert quotes and dashes to -# typographically correct entities. -#html_use_smartypants = True - -# Custom sidebar templates, maps document names to template names. -#html_sidebars = {} - -# Additional templates that should be rendered to pages, maps page names to -# template names. -#html_additional_pages = {} - -# If false, no module index is generated. -#html_domain_indices = True - -# If false, no index is generated. -#html_use_index = True - -# If true, the index is split into individual pages for each letter. -#html_split_index = False - -# If true, links to the reST sources are added to the pages. -#html_show_sourcelink = True - -# If true, "Created using Sphinx" is shown in the HTML footer. Default is True. -#html_show_sphinx = True - -# If true, "(C) Copyright ..." is shown in the HTML footer. Default is True. 
-#html_show_copyright = True - -# If true, an OpenSearch description file will be output, and all pages will -# contain a tag referring to it. The value of this option must be the -# base URL from which the finished HTML is served. -#html_use_opensearch = '' - -# This is the file name suffix for HTML files (e.g. ".xhtml"). -#html_file_suffix = None - -# Language to be used for generating the HTML full-text search index. -# Sphinx supports the following languages: -# 'da', 'de', 'en', 'es', 'fi', 'fr', 'hu', 'it', 'ja' -# 'nl', 'no', 'pt', 'ro', 'ru', 'sv', 'tr' -#html_search_language = 'en' - -# A dictionary with options for the search language support, empty by default. -# Now only 'ja' uses this config value -#html_search_options = {'type': 'default'} - -# The name of a javascript file (relative to the configuration directory) that -# implements a search results scorer. If empty, the default will be used. -#html_search_scorer = 'scorer.js' - -# Output file base name for HTML help builder. -htmlhelp_basename = 'MXNetjldoc' - -# -- Options for LaTeX output --------------------------------------------- - -latex_elements = { -# The paper size ('letterpaper' or 'a4paper'). -#'papersize': 'letterpaper', - -# The font size ('10pt', '11pt' or '12pt'). -#'pointsize': '10pt', - -# Additional stuff for the LaTeX preamble. -#'preamble': '', - -# Latex figure (float) alignment -#'figure_align': 'htbp', -} - -# Grouping the document tree into LaTeX files. List of tuples -# (source start file, target name, title, -# author, documentclass [howto, manual, or own class]). -latex_documents = [ - (master_doc, 'MXNetjl.tex', u'MXNet.jl Documentation', - u'pluskid', 'manual'), -] - -# The name of an image file (relative to this directory) to place at the top of -# the title page. -#latex_logo = None - -# For "manual" documents, if this is true, then toplevel headings are parts, -# not chapters. -#latex_use_parts = False - -# If true, show page references after internal links. 
-#latex_show_pagerefs = False - -# If true, show URL addresses after external links. -#latex_show_urls = False - -# Documents to append as an appendix to all manuals. -#latex_appendices = [] - -# If false, no module index is generated. -#latex_domain_indices = True - - -# -- Options for manual page output --------------------------------------- - -# One entry per manual page. List of tuples -# (source start file, name, description, authors, manual section). -man_pages = [ - (master_doc, 'mxnetjl', u'MXNet.jl Documentation', - [author], 1) -] - -# If true, show URL addresses after external links. -#man_show_urls = False - - -# -- Options for Texinfo output ------------------------------------------- - -# Grouping the document tree into Texinfo files. List of tuples -# (source start file, target name, title, author, -# dir menu entry, description, category) -texinfo_documents = [ - (master_doc, 'MXNetjl', u'MXNet.jl Documentation', - author, 'MXNetjl', 'One line description of project.', - 'Miscellaneous'), -] - -# Documents to append as an appendix to all manuals. -#texinfo_appendices = [] - -# If false, no module index is generated. -#texinfo_domain_indices = True - -# How to display URL addresses: 'footnote', 'no', or 'inline'. -#texinfo_show_urls = 'footnote' - -# If true, do not generate a @detailmenu in the "Top" node's menu. -#texinfo_no_detailmenu = False diff --git a/docs/index.md b/docs/index.md new file mode 100644 index 000000000000..e69de29bb2d1 diff --git a/docs/index.rst b/docs/index.rst deleted file mode 100644 index b2598cac01bb..000000000000 --- a/docs/index.rst +++ /dev/null @@ -1,29 +0,0 @@ -.. MXNet.jl documentation master file, created by - sphinx-quickstart on Tue Oct 20 00:09:24 2015. - You can adapt this file completely to your liking, but it should at least - contain the root `toctree` directive. - -Welcome to MXNet.jl's documentation! -==================================== - -Contents: - -.. 
toctree:: - :maxdepth: 2 - -API Documentation ------------------ - -.. toctree:: - :maxdepth: 1 - - api/MXNet - - -Indices and tables -================== - -* :ref:`genindex` -* :ref:`modindex` -* :ref:`search` - diff --git a/docs/make.bat b/docs/make.bat deleted file mode 100644 index e682697a9877..000000000000 --- a/docs/make.bat +++ /dev/null @@ -1,263 +0,0 @@ -@ECHO OFF - -REM Command file for Sphinx documentation - -if "%SPHINXBUILD%" == "" ( - set SPHINXBUILD=sphinx-build -) -set BUILDDIR=_build -set ALLSPHINXOPTS=-d %BUILDDIR%/doctrees %SPHINXOPTS% . -set I18NSPHINXOPTS=%SPHINXOPTS% . -if NOT "%PAPER%" == "" ( - set ALLSPHINXOPTS=-D latex_paper_size=%PAPER% %ALLSPHINXOPTS% - set I18NSPHINXOPTS=-D latex_paper_size=%PAPER% %I18NSPHINXOPTS% -) - -if "%1" == "" goto help - -if "%1" == "help" ( - :help - echo.Please use `make ^` where ^ is one of - echo. html to make standalone HTML files - echo. dirhtml to make HTML files named index.html in directories - echo. singlehtml to make a single large HTML file - echo. pickle to make pickle files - echo. json to make JSON files - echo. htmlhelp to make HTML files and a HTML help project - echo. qthelp to make HTML files and a qthelp project - echo. devhelp to make HTML files and a Devhelp project - echo. epub to make an epub - echo. latex to make LaTeX files, you can set PAPER=a4 or PAPER=letter - echo. text to make text files - echo. man to make manual pages - echo. texinfo to make Texinfo files - echo. gettext to make PO message catalogs - echo. changes to make an overview over all changed/added/deprecated items - echo. xml to make Docutils-native XML files - echo. pseudoxml to make pseudoxml-XML files for display purposes - echo. linkcheck to check all external links for integrity - echo. doctest to run all doctests embedded in the documentation if enabled - echo. 
coverage to run coverage check of the documentation if enabled - goto end -) - -if "%1" == "clean" ( - for /d %%i in (%BUILDDIR%\*) do rmdir /q /s %%i - del /q /s %BUILDDIR%\* - goto end -) - - -REM Check if sphinx-build is available and fallback to Python version if any -%SPHINXBUILD% 2> nul -if errorlevel 9009 goto sphinx_python -goto sphinx_ok - -:sphinx_python - -set SPHINXBUILD=python -m sphinx.__init__ -%SPHINXBUILD% 2> nul -if errorlevel 9009 ( - echo. - echo.The 'sphinx-build' command was not found. Make sure you have Sphinx - echo.installed, then set the SPHINXBUILD environment variable to point - echo.to the full path of the 'sphinx-build' executable. Alternatively you - echo.may add the Sphinx directory to PATH. - echo. - echo.If you don't have Sphinx installed, grab it from - echo.http://sphinx-doc.org/ - exit /b 1 -) - -:sphinx_ok - - -if "%1" == "html" ( - %SPHINXBUILD% -b html %ALLSPHINXOPTS% %BUILDDIR%/html - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The HTML pages are in %BUILDDIR%/html. - goto end -) - -if "%1" == "dirhtml" ( - %SPHINXBUILD% -b dirhtml %ALLSPHINXOPTS% %BUILDDIR%/dirhtml - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The HTML pages are in %BUILDDIR%/dirhtml. - goto end -) - -if "%1" == "singlehtml" ( - %SPHINXBUILD% -b singlehtml %ALLSPHINXOPTS% %BUILDDIR%/singlehtml - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The HTML pages are in %BUILDDIR%/singlehtml. - goto end -) - -if "%1" == "pickle" ( - %SPHINXBUILD% -b pickle %ALLSPHINXOPTS% %BUILDDIR%/pickle - if errorlevel 1 exit /b 1 - echo. - echo.Build finished; now you can process the pickle files. - goto end -) - -if "%1" == "json" ( - %SPHINXBUILD% -b json %ALLSPHINXOPTS% %BUILDDIR%/json - if errorlevel 1 exit /b 1 - echo. - echo.Build finished; now you can process the JSON files. - goto end -) - -if "%1" == "htmlhelp" ( - %SPHINXBUILD% -b htmlhelp %ALLSPHINXOPTS% %BUILDDIR%/htmlhelp - if errorlevel 1 exit /b 1 - echo. 
- echo.Build finished; now you can run HTML Help Workshop with the ^ -.hhp project file in %BUILDDIR%/htmlhelp. - goto end -) - -if "%1" == "qthelp" ( - %SPHINXBUILD% -b qthelp %ALLSPHINXOPTS% %BUILDDIR%/qthelp - if errorlevel 1 exit /b 1 - echo. - echo.Build finished; now you can run "qcollectiongenerator" with the ^ -.qhcp project file in %BUILDDIR%/qthelp, like this: - echo.^> qcollectiongenerator %BUILDDIR%\qthelp\MXNetjl.qhcp - echo.To view the help file: - echo.^> assistant -collectionFile %BUILDDIR%\qthelp\MXNetjl.ghc - goto end -) - -if "%1" == "devhelp" ( - %SPHINXBUILD% -b devhelp %ALLSPHINXOPTS% %BUILDDIR%/devhelp - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. - goto end -) - -if "%1" == "epub" ( - %SPHINXBUILD% -b epub %ALLSPHINXOPTS% %BUILDDIR%/epub - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The epub file is in %BUILDDIR%/epub. - goto end -) - -if "%1" == "latex" ( - %SPHINXBUILD% -b latex %ALLSPHINXOPTS% %BUILDDIR%/latex - if errorlevel 1 exit /b 1 - echo. - echo.Build finished; the LaTeX files are in %BUILDDIR%/latex. - goto end -) - -if "%1" == "latexpdf" ( - %SPHINXBUILD% -b latex %ALLSPHINXOPTS% %BUILDDIR%/latex - cd %BUILDDIR%/latex - make all-pdf - cd %~dp0 - echo. - echo.Build finished; the PDF files are in %BUILDDIR%/latex. - goto end -) - -if "%1" == "latexpdfja" ( - %SPHINXBUILD% -b latex %ALLSPHINXOPTS% %BUILDDIR%/latex - cd %BUILDDIR%/latex - make all-pdf-ja - cd %~dp0 - echo. - echo.Build finished; the PDF files are in %BUILDDIR%/latex. - goto end -) - -if "%1" == "text" ( - %SPHINXBUILD% -b text %ALLSPHINXOPTS% %BUILDDIR%/text - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The text files are in %BUILDDIR%/text. - goto end -) - -if "%1" == "man" ( - %SPHINXBUILD% -b man %ALLSPHINXOPTS% %BUILDDIR%/man - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The manual pages are in %BUILDDIR%/man. 
- goto end -) - -if "%1" == "texinfo" ( - %SPHINXBUILD% -b texinfo %ALLSPHINXOPTS% %BUILDDIR%/texinfo - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The Texinfo files are in %BUILDDIR%/texinfo. - goto end -) - -if "%1" == "gettext" ( - %SPHINXBUILD% -b gettext %I18NSPHINXOPTS% %BUILDDIR%/locale - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The message catalogs are in %BUILDDIR%/locale. - goto end -) - -if "%1" == "changes" ( - %SPHINXBUILD% -b changes %ALLSPHINXOPTS% %BUILDDIR%/changes - if errorlevel 1 exit /b 1 - echo. - echo.The overview file is in %BUILDDIR%/changes. - goto end -) - -if "%1" == "linkcheck" ( - %SPHINXBUILD% -b linkcheck %ALLSPHINXOPTS% %BUILDDIR%/linkcheck - if errorlevel 1 exit /b 1 - echo. - echo.Link check complete; look for any errors in the above output ^ -or in %BUILDDIR%/linkcheck/output.txt. - goto end -) - -if "%1" == "doctest" ( - %SPHINXBUILD% -b doctest %ALLSPHINXOPTS% %BUILDDIR%/doctest - if errorlevel 1 exit /b 1 - echo. - echo.Testing of doctests in the sources finished, look at the ^ -results in %BUILDDIR%/doctest/output.txt. - goto end -) - -if "%1" == "coverage" ( - %SPHINXBUILD% -b coverage %ALLSPHINXOPTS% %BUILDDIR%/coverage - if errorlevel 1 exit /b 1 - echo. - echo.Testing of coverage in the sources finished, look at the ^ -results in %BUILDDIR%/coverage/python.txt. - goto end -) - -if "%1" == "xml" ( - %SPHINXBUILD% -b xml %ALLSPHINXOPTS% %BUILDDIR%/xml - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The XML files are in %BUILDDIR%/xml. - goto end -) - -if "%1" == "pseudoxml" ( - %SPHINXBUILD% -b pseudoxml %ALLSPHINXOPTS% %BUILDDIR%/pseudoxml - if errorlevel 1 exit /b 1 - echo. - echo.Build finished. The pseudo-XML files are in %BUILDDIR%/pseudoxml. 
- goto end -) - -:end diff --git a/mkdocs.yml b/mkdocs.yml new file mode 100644 index 000000000000..4b8b0cbcf6ca --- /dev/null +++ b/mkdocs.yml @@ -0,0 +1,9 @@ +site_name: MXNet.jl +site_author: pluskid +repo_url: https://github.com/dmlc/MXNet.jl +theme: readthedocs +pages: + - Home: index.md + - API Documentation: + - 'ndarray': 'api/ndarray.md' + - 'symbol': 'api/symbol.md' diff --git a/src/ndarray.jl b/src/ndarray.jl index d5a61a173a34..a868495a846b 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -20,14 +20,14 @@ end # NDArray Type ################################################################################ """Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block - of tensor-based computation. - - **Note** since C/C++ use row-major ordering for arrays while Julia follows a - column-major ordering. To keep things consistent, we keep the underlying data - in their original layout, but use *language-native* convention when we talk - about shapes. For example, a mini-batch of 100 MNIST images is a tensor of - C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory - have shape (28,28,1,100). +of tensor-based computation. + +**Note** since C/C++ use row-major ordering for arrays while Julia follows a +column-major ordering. To keep things consistent, we keep the underlying data +in their original layout, but use *language-native* convention when we talk +about shapes. For example, a mini-batch of 100 MNIST images is a tensor of +C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory +have shape (28,28,1,100). """ type NDArray handle :: MX_NDArrayHandle @@ -129,10 +129,10 @@ end import Base: slice """`slice` create a view into a sub-slice of an `NDArray`. Note only slicing at the slowest - changing dimension is supported. In Julia's column-major perspective, this is the last - dimension. 
For example, given an `NDArray` of shape (2,3,4), `sub(array, 2:3)` will create - a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is - used in data parallelization to split mini-batch into sub-batches for different devices. +changing dimension is supported. In Julia's column-major perspective, this is the last +dimension. For example, given an `NDArray` of shape (2,3,4), `sub(array, 2:3)` will create +a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is +used in data parallelization to split mini-batch into sub-batches for different devices. """ function slice(arr :: NDArray, ::Colon) arr @@ -224,19 +224,23 @@ end # Basic arithmetics #------------------------------------------------------------ """ -Julia does not support re-definiton of += operator (like __iadd__ in python), -When one write a += b, it gets translated to a = a+b. a+b will allocate new -memory for the results, and the newly allocated NDArray object is then assigned +Julia does not support re-definition of `+=` operator (like `__iadd__` in python), +When one writes `a += b`, it gets translated to `a = a+b`. `a+b` will allocate new +memory for the results, and the newly allocated `NDArray` object is then assigned back to a, while the original contents in a is discarded. This is very inefficient when we want to do inplace update. This macro is a simple utility to implement this behavior. Write - @mx.inplace a += b +```julia +@mx.inplace a += b +``` will translate into - mx.add_to!(a, b) +```julia +mx.add_to!(a, b) +``` which will do inplace adding of the contents of b into a. """ From 0257055072b7f350963a9b3a19806268d41e7d01 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 Oct 2015 02:03:32 -0400 Subject: [PATCH 077/630] one-sentence readme. 
--- docs/index.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/docs/index.md b/docs/index.md index e69de29bb2d1..f5d55b86aec0 100644 --- a/docs/index.md +++ b/docs/index.md @@ -0,0 +1,3 @@ +# MXNet.jl + +MXNet.jl is a [Julia](http://julialang.org/) package for *efficient* and *flexible* deep learning, built on top of [dmlc/mxnet](https://github.com/dmlc/mxnet). From 1eb7ebcda9aec2b97ec88d208704411890d018c7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 Oct 2015 14:17:01 -0400 Subject: [PATCH 078/630] use osx.mk to simplify travis OSX build --- test/travis/build_mxnet.sh | 13 ++++++------- 1 file changed, 6 insertions(+), 7 deletions(-) diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index 7b7f421d3cdb..5eaa31c03c7b 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -4,19 +4,18 @@ git clone --recursive https://github.com/dmlc/mxnet __mxnet_build cd __mxnet_build if [ ! -f config.mk ]; then - echo "Use the default config.m" - cp make/config.mk config.mk - if [ ${TRAVIS_OS_NAME} == "linux" ]; then + cp make/config.mk config.mk sed -i 's/export CC = gcc/export CC = gcc-4.8/g' config.mk sed -i 's/export CXX = g++/export CXX = g++-4.8/g' config.mk fi if [ ${TRAVIS_OS_NAME} == "osx" ]; then - # add built-in blas header file to path - sed -i -s 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk - # disable openmp - sed -i -s 's%USE_OPENMP = 1%USE_OPENMP = 0%g' config.mk + cp make/osx.mk config.mk + ## add built-in blas header file to path + #sed -i -s 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk + ## disable openmp + #sed -i -s 's%USE_OPENMP = 1%USE_OPENMP = 0%g' config.mk fi fi From 92237212c594440455567ec4d39caec909ddd11e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 20 
Oct 2015 14:50:31 -0400 Subject: [PATCH 079/630] clean up CI build script --- test/travis/build_mxnet.sh | 4 ---- 1 file changed, 4 deletions(-) diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh index 5eaa31c03c7b..6774011f6355 100755 --- a/test/travis/build_mxnet.sh +++ b/test/travis/build_mxnet.sh @@ -12,10 +12,6 @@ if [ ! -f config.mk ]; then if [ ${TRAVIS_OS_NAME} == "osx" ]; then cp make/osx.mk config.mk - ## add built-in blas header file to path - #sed -i -s 's%ADD_CFLAGS =%ADD_CFLAGS = -I/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers/%' config.mk - ## disable openmp - #sed -i -s 's%USE_OPENMP = 1%USE_OPENMP = 0%g' config.mk fi fi From 2c945ea216f3c9431074f7f9466f77f2d22bee20 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Oct 2015 01:03:37 -0400 Subject: [PATCH 080/630] docstring for imported symbols --- docs/api/ndarray.md | 28 ++++++++++++++-------------- docs/api/symbol.md | 8 ++++---- docs/build.jl | 11 ----------- src/symbol.jl | 12 ++++++++++-- src/util.jl | 29 +++++++++++++++++++++++++++++ 5 files changed, 57 insertions(+), 31 deletions(-) diff --git a/docs/api/ndarray.md b/docs/api/ndarray.md index 2ede7ba99e78..c09b80ea0ab2 100644 --- a/docs/api/ndarray.md +++ b/docs/api/ndarray.md @@ -32,7 +32,7 @@ object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs wi *source:* -[MXNet/src/ndarray.jl:380](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L380) +[MXNet/src/ndarray.jl:380](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L380) --- @@ -41,7 +41,7 @@ object (`NDArray`) is returned. 
Otherwise, a tuple containing all the outputs wi Copy data from NDArray to Julia Array *source:* -[MXNet/src/ndarray.jl:187](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L187) +[MXNet/src/ndarray.jl:187](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L187) --- @@ -50,7 +50,7 @@ Copy data from NDArray to Julia Array Copy data between NDArrays *source:* -[MXNet/src/ndarray.jl:175](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L175) +[MXNet/src/ndarray.jl:175](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L175) --- @@ -59,7 +59,7 @@ Copy data between NDArrays Copy data from Julia Array to NDArray *source:* -[MXNet/src/ndarray.jl:195](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L195) +[MXNet/src/ndarray.jl:195](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L195) --- @@ -68,7 +68,7 @@ Copy data from Julia Array to NDArray Create copy: NDArray -> Julia Array *source:* -[MXNet/src/ndarray.jl:205](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L205) +[MXNet/src/ndarray.jl:205](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L205) --- @@ -77,7 +77,7 @@ Create copy: NDArray -> Julia Array Create copy: NDArray -> NDArray in a given context *source:* -[MXNet/src/ndarray.jl:211](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L211) +[MXNet/src/ndarray.jl:211](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L211) --- @@ -86,7 +86,7 @@ Create copy: NDArray -> NDArray in a given context Create copy: Julia Array -> NDArray in a given context *source:* 
-[MXNet/src/ndarray.jl:217](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L217) +[MXNet/src/ndarray.jl:217](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L217) --- @@ -95,7 +95,7 @@ Create copy: Julia Array -> NDArray in a given context Create NDArray and initialize with 1 *source:* -[MXNet/src/ndarray.jl:118](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L118) +[MXNet/src/ndarray.jl:118](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L118) --- @@ -104,7 +104,7 @@ Create NDArray and initialize with 1 Assign all elements of an NDArray to a scalar *source:* -[MXNet/src/ndarray.jl:155](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L155) +[MXNet/src/ndarray.jl:155](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L155) --- @@ -116,7 +116,7 @@ Get the shape of an `NDArray`. Note the shape is converted to Julia convention. 
*source:* -[MXNet/src/ndarray.jl:84](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L84) +[MXNet/src/ndarray.jl:84](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L84) --- @@ -130,7 +130,7 @@ used in data parallelization to split mini-batch into sub-batches for different *source:* -[MXNet/src/ndarray.jl:137](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L137) +[MXNet/src/ndarray.jl:137](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L137) --- @@ -139,7 +139,7 @@ used in data parallelization to split mini-batch into sub-batches for different Create zero-ed NDArray of specific shape *source:* -[MXNet/src/ndarray.jl:105](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L105) +[MXNet/src/ndarray.jl:105](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L105) --- @@ -157,7 +157,7 @@ have shape (28,28,1,100). *source:* -[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L32) +[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L32) --- @@ -185,5 +185,5 @@ which will do inplace adding of the contents of b into a. *source:* -[MXNet/src/ndarray.jl:247](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/ndarray.jl#L247) +[MXNet/src/ndarray.jl:247](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L247) diff --git a/docs/api/symbol.md b/docs/api/symbol.md index 1172f54214df..1ccd875896b9 100644 --- a/docs/api/symbol.md +++ b/docs/api/symbol.md @@ -9,7 +9,7 @@ Get a new grouped symbol whose output contains all the internal outputs of this symbol. 
*source:* -[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/symbol.jl#L63) +[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/symbol.jl#L63) --- @@ -18,7 +18,7 @@ Get a new grouped symbol whose output contains all the internal outputs of this Create a symbol that groups symbols together *source:* -[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/symbol.jl#L77) +[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/symbol.jl#L77) --- @@ -33,7 +33,7 @@ Most operators do not have Auxiliary states. *source:* -[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/symbol.jl#L58) +[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/symbol.jl#L58) --- @@ -42,5 +42,5 @@ Most operators do not have Auxiliary states. 
Create a symbolic variable with the given name *source:* -[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/d13ddc6542bdb00e26b87e721a9b0e79a22bbd66/src/symbol.jl#L70) +[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/symbol.jl#L70) diff --git a/docs/build.jl b/docs/build.jl index 24c380f0f40a..9576e4112c38 100644 --- a/docs/build.jl +++ b/docs/build.jl @@ -3,17 +3,6 @@ using Lexicon config = Config(md_permalink = false, mathjax = true) -function save_meta(file :: AbstractString, docs :: Lexicon.Metadata, order = [:source]) - isfile(file) || mkpath(dirname(file)) - open(file, "w") do io - for (k,v) in Lexicon.EachEntry(docs, order = order) - name = Lexicon.writeobj(k) - println(io, "#### $name") - println(io, v.docs.data) - end - end -end - doc = Lexicon.metadata(MXNet.mx) for mod in [:ndarray, :symbol] save("api/$mod.md", MIME("text/md"), filter(doc, files=["$mod.jl"]), config) diff --git a/src/symbol.jl b/src/symbol.jl index 921671e394e9..013c24d865c5 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -256,6 +256,14 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) kv_nargs_s = bytestring(ref_kv_nargs[]) kv_nargs = symbol(kv_nargs_s) + f_desc = bytestring(ref_desc[]) * "\n\n" + if !isempty(kv_nargs_s) + f_desc *= "This function support variable length positional `Symbol` inputs.\n\n" + end + f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) + f_desc *= "* `name`: Julia Symbol (e.g. `:my_symbol`), optional.\n\n The name of the symbol.\n\n" + f_desc *= "**Returns**\n\n`symbol`: `mx.Symbol`\n\n The constructed symbol." + # function $func_name(args...; kwargs...) 
func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) func_body = quote @@ -324,8 +332,8 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) func_def = Expr(:function, func_head, Expr(:block, func_body)) eval(func_def) - # TODO: add doc string - # eval(:(@doc($doc_str, $func_name))) + # add doc string + eval(:(@doc($f_desc, $func_name))) end function _import_atomic_symbol_creators() diff --git a/src/util.jl b/src/util.jl index 4a331fcbfec1..1c52fdf3f2c3 100644 --- a/src/util.jl +++ b/src/util.jl @@ -1,3 +1,6 @@ +################################################################################ +# Dataset related utilities +################################################################################ function get_data_dir() data_dir = joinpath(Pkg.dir("MXNet"), "data") mkpath(data_dir) @@ -38,3 +41,29 @@ function get_cifar10() filenames[:mean] = joinpath(cifar10_dir, "cifar/cifar_mean.bin") return filenames end + + +################################################################################ +# Internal Utilities +################################################################################ +function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{char_pp}, arg_descs::Ref{char_pp}, remove_dup::Bool=true) + param_keys = Set{AbstractString}() + + arg_names = pointer_to_array(arg_names[], narg) + arg_types = pointer_to_array(arg_types[], narg) + arg_descs = pointer_to_array(arg_descs[], narg) + docstrings = AbstractString[] + + for i = 1:narg + arg_name = bytestring(arg_names[i]) + if arg_name ∈ param_keys && remove_dup + continue + end + push!(param_keys, arg_name) + + arg_type = bytestring(arg_types[i]) + arg_desc = bytestring(arg_descs[i]) + push!(docstrings, "* `$arg_name`: $arg_type\n\n $arg_desc\n\n") + end + return "**Parameters**\n\n$(join(docstrings, "\n"))" +end From 1da331cc08aa7b90b858cdb16c9bd636d978e444 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Oct 2015 09:57:45 
-0400 Subject: [PATCH 081/630] installation guide (or what we wanted to be...) --- docs/index.md | 5 ++++- docs/user-guide/install.md | 20 ++++++++++++++++++++ mkdocs.yml | 2 ++ 3 files changed, 26 insertions(+), 1 deletion(-) create mode 100644 docs/user-guide/install.md diff --git a/docs/index.md b/docs/index.md index f5d55b86aec0..350c3ab52fc9 100644 --- a/docs/index.md +++ b/docs/index.md @@ -1,3 +1,6 @@ # MXNet.jl -MXNet.jl is a [Julia](http://julialang.org/) package for *efficient* and *flexible* deep learning, built on top of [dmlc/mxnet](https://github.com/dmlc/mxnet). +MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of features include: + +* Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. +* Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. diff --git a/docs/user-guide/install.md b/docs/user-guide/install.md new file mode 100644 index 000000000000..ab62c116ed03 --- /dev/null +++ b/docs/user-guide/install.md @@ -0,0 +1,20 @@ +# Automatic Installation + +To install MXNet.jl, simply type +```jl +Pkg.add("MXNet") +``` +in the Julia REPL. MXNet.jl is built on top of [libmxnet](https://github.com/dmlc/mxnet). Upon installation, Julia will try to automatically download and build libmxnet. If the compilation fails due to unresolved dependency, or if you prefer to work with a customized installation of libmxnet, please see [below](#manual-compilation). 
+ +To use the latest git version of MXNet.jl, use the following command instead +```jl +Pkg.checkout("MXNet") +``` + +# Manual Compilation + +It is possible to compile libmxnet separately and point MXNet.jl to the existing library, in case automatic compilation fails due to unresolved dependencies in a non-standard environment, or when one wants to work with a separate, maybe customized libmxnet. + +To build libmxnet, please refer to [the installation guide of libmxnet](http://mxnet.readthedocs.org/en/latest/build.html). After successfully installing libmxnet, set the `MXNET_HOME` environment variable to the location of libmxnet. In other words, the compiled `libmxnet.so` should be found in `$MXNET_HOME/lib`. + +When the `MXNET_HOME` environment variable is detected and the corresponding `libmxnet.so` could be loaded successfully, MXNet.jl will skip automatic building during installation and use the specified libmxnet instead. diff --git a/mkdocs.yml b/mkdocs.yml index 4b8b0cbcf6ca..1dec035a93bd 100644 --- a/mkdocs.yml +++ b/mkdocs.yml @@ -4,6 +4,8 @@ repo_url: https://github.com/dmlc/MXNet.jl theme: readthedocs pages: - Home: index.md + - User Guide: + - 'Installation Guide' : 'user-guide/install.md' - API Documentation: - 'ndarray': 'api/ndarray.md' - 'symbol': 'api/symbol.md' From 684bad20fe7f200556b850b2e2d0405604b02c98 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Oct 2015 10:51:49 -0400 Subject: [PATCH 082/630] part of overview --- docs/user-guide/overview.md | 39 +++++++++++++++++++++++++++++++++++++ mkdocs.yml | 1 + 2 files changed, 40 insertions(+) create mode 100644 docs/user-guide/overview.md diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md new file mode 100644 index 000000000000..7271b9263a32 --- /dev/null +++ b/docs/user-guide/overview.md @@ -0,0 +1,39 @@ +# MXNet.jl Namespace + +Most the functions and types in MXNet.jl are organized in a flat namespace. 
Because many some functions are conflicting with existing names in the Julia Base module, we wrap them all in a `mx` module. The convention of accessing the MXNet.jl interface is the to use the `mx.` prefix explicitly: +```jl +using MXNet + +x = mx.zeros(2,3) # MXNet NDArray +y = zeros(eltype(x), size(x)) # Julia Array +copy!(y, x) # Overloaded function in Julia Base +z = mx.ones(size(x), mx.gpu()) # MXNet NDArray on GPU +mx.copy!(z, y) # Same as copy!(z, y) +``` +Note functions like `size`, `copy!` that is extensively overloaded for various types works out of the box. But functions like `zeros` and `ones` will be ambiguous, so we always use the `mx.` prefix. If you prefer, the `mx.` prefix can be used explicitly for all MXNet.jl functions, including `size` and `copy!` as shown in the last line. + +# High Level Interface + +The way we build deep learning models in MXNet.jl is to use the powerful symbolic composition system. It is like [Theano](http://deeplearning.net/software/theano/), except that we avoided long expression compiliation time by providing *larger* neural network related building blocks to guarantee computation performance. See also [this note](http://mxnet.readthedocs.org/en/latest/program_model.html) for the design and trade-off of the MXNet symbolic composition system. + +The basic type is `mx.Symbol`. The following is a trivial example of composing two symbols with the `+` operation. +```jl +A = mx.variable(:A) +B = mx.variable(:B) +C = A + B +``` +We get a new *symbol* by composing existing *symbols* by some *operations*. A hierarchical architecture of a deep neural network could be realized by recursive composition. For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of 128 units and a ReLU activation function. 
+```jl +net = mx.variable(:data) +net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) +net = mx.Activation(data=net, name=:relu1, act_type=:relu) +net = mx.FullyConnected(data=net, name=:fc2, num_hidden=64) +net = mx.Softmax(data=net, name=:out) +``` +Each time we take the previous symbol, and compose with an operation. Unlike the simple `+` example above, the *operations* here are "bigger" ones, that correspond to common computation layers in deep neural networks. + +Each of those operation takes one or more input symbols for composition, with optional hyper-parameters (e.g. `num_hidden`, `act_type`) to further customize the composition results. + +When applying those operations, we can also specify a `name` for the result symbol. This is convenient if we want to refer to this symbol later on. If not supplied, a name will be automatically generated. + +# Low Level Interface diff --git a/mkdocs.yml b/mkdocs.yml index 1dec035a93bd..c364b2d4f3a6 100644 --- a/mkdocs.yml +++ b/mkdocs.yml @@ -6,6 +6,7 @@ pages: - Home: index.md - User Guide: - 'Installation Guide' : 'user-guide/install.md' + - 'Overview' : 'user-guide/overview.md' - API Documentation: - 'ndarray': 'api/ndarray.md' - 'symbol': 'api/symbol.md' From df6613dfdfd65a33446adae57d7980e5d331408d Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Oct 2015 17:01:57 -0400 Subject: [PATCH 083/630] shape inference doc --- docs/user-guide/overview.md | 81 +++++++++++++++++++++++++++++++++++-- 1 file changed, 78 insertions(+), 3 deletions(-) diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md index 7271b9263a32..86a81a4edf96 100644 --- a/docs/user-guide/overview.md +++ b/docs/user-guide/overview.md @@ -1,7 +1,7 @@ # MXNet.jl Namespace Most the functions and types in MXNet.jl are organized in a flat namespace. Because many some functions are conflicting with existing names in the Julia Base module, we wrap them all in a `mx` module. 
The convention of accessing the MXNet.jl interface is the to use the `mx.` prefix explicitly: -```jl +```julia using MXNet x = mx.zeros(2,3) # MXNet NDArray @@ -14,16 +14,18 @@ Note functions like `size`, `copy!` that is extensively overloaded for various t # High Level Interface +## Symbols and Composition + The way we build deep learning models in MXNet.jl is to use the powerful symbolic composition system. It is like [Theano](http://deeplearning.net/software/theano/), except that we avoided long expression compiliation time by providing *larger* neural network related building blocks to guarantee computation performance. See also [this note](http://mxnet.readthedocs.org/en/latest/program_model.html) for the design and trade-off of the MXNet symbolic composition system. The basic type is `mx.Symbol`. The following is a trivial example of composing two symbols with the `+` operation. -```jl +```julia A = mx.variable(:A) B = mx.variable(:B) C = A + B ``` We get a new *symbol* by composing existing *symbols* by some *operations*. A hierarchical architecture of a deep neural network could be realized by recursive composition. For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of 128 units and a ReLU activation function. -```jl +```julia net = mx.variable(:data) net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) net = mx.Activation(data=net, name=:relu1, act_type=:relu) @@ -36,4 +38,77 @@ Each of those operation takes one or more input symbols for composition, with op When applying those operations, we can also specify a `name` for the result symbol. This is convenient if we want to refer to this symbol later on. If not supplied, a name will be automatically generated. +Each symbol takes some arguments. For example, in the `+` case above, to compute the value of `C`, we will need to know the values of the two inputs `A` and `B`. 
For neural networks, the arguments primarily fall into two categories: *inputs* and *parameters*. *inputs* are data and labels for the networks, while *parameters* are typically trainable *weights*, *bias*, *filters*. + +When composing symbols, their arguments accumulate. We can list all the arguments by +```julia +julia> mx.list_arguments(net) +6-element Array{Symbol,1}: + :data # Input data, name from the first data variable + :fc1_weight # Weights of the fully connected layer named :fc1 + :fc1_bias # Bias of the layer :fc1 + :fc2_weight # Weights of the layer :fc2 + :fc2_bias # Bias of the layer :fc2 + :out_label # Input label, required by the softmax layer named :out +``` +Note the names of the arguments are generated according to the provided name for each layer. We can also specify those names explicitly: +```julia +net = mx.variable(:data) +w = mx.variable(:myweight) +net = mx.FullyConnected(data=net, weight=w, name=:fc1, num_hidden=128) +mx.list_arguments(net) +# => +# 3-element Array{Symbol,1}: +# :data +# :myweight +# :fc1_bias +``` +The simple fact is that a `variable` is just a placeholder `mx.Symbol`. In composition, we can use arbitrary symbols for arguments. For example: +```julia +net = mx.variable(:data) +net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) +net2 = mx.variable(:data2) +net2 = mx.FullyConnected(data=net2, name=:net2, num_hidden=128) +mx.list_arguments(net2) +# => +# 3-element Array{Symbol,1}: +# :data2 +# :net2_weight +# :net2_bias +composed_net = net2(data2=net, name=:composed) +mx.list_arguments(composed_net) +# => +# 5-element Array{Symbol,1}: +# :data +# :fc1_weight +# :fc1_bias +# :net2_weight +# :net2_bias +``` +Note we use a composed symbol, `net` as the argument `data2` for `net2` to get a new symbol, which we named `:composed`. It also shows that a symbol itself is a call-able object, which can be invoked to fill in missing arguments and get more complicated symbol compositions. 
+ +## Shape Inference + +Given enough information, the shapes of all arguments in a composed symbol could be inferred automatically. For example, given the input shape, and some hyper-parameters like `num_hidden`, the shapes for the weights and bias in a neural network could be inferred. +```julia +net = mx.variable(:data) +net = mx.FullyConnected(data=net, name=:fc1, num_hidden=10) +arg_shapes, out_shapes, aux_shapes = mx.infer_shape(net, data=(10, 64)) +``` +The returned shapes corresponds to arguments with the same order as returned by `mx.list_arguments`. The `out_shapes` are shapes for outputs, and `aux_shapes` can be safely ignored for now. +```julia +for (n,s) in zip(mx.list_arguments(net), arg_shapes) + println("$n => $s") +end +# => +# data => (10,64) +# fc1_weight => (10,10) +# fc1_bias => (10,) +for (n,s) in zip(mx.list_outputs(net), out_shapes) + println("$n => $s") +end +# => +# fc1_output => (10,64) +``` + # Low Level Interface From 4ac5e7bcc5e64e40a8f4453b1689dde901853e77 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Oct 2015 17:37:00 -0400 Subject: [PATCH 084/630] allow keyword arguments in bind. --- docs/user-guide/overview.md | 21 +++++++++++++++++++++ src/executor.jl | 32 +++++++++++++++++++++----------- 2 files changed, 42 insertions(+), 11 deletions(-) diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md index 86a81a4edf96..79c8ff6b5d6b 100644 --- a/docs/user-guide/overview.md +++ b/docs/user-guide/overview.md @@ -111,4 +111,25 @@ end # fc1_output => (10,64) ``` +## Binding and Executing + +In order to execute the computation graph specified a composed symbol, we will *bind* the free variables to concrete values, specified as `mx.NDArray`s. This will create an `mx.Executor` on a given `mx.Context`. A context describes the computation devices (CPUs, GPUs, etc.) and an executor will carry out the computation (forward/backward) specified in the corresponding symbolic composition. 
+```julia +A = mx.variable(:A) +B = mx.variable(:B) +C = A .* B +a = mx.ones(3) * 4 +b = mx.ones(3) * 2 +c_exec = mx.bind(C, context=mx.cpu(), args=Dict(:A => a, :B => b)) + +mx.forward(c_exec) +copy(c_exec.outputs[1]) # copy turns NDArray into Julia Array +# => +# 3-element Array{Float32,1}: +# 8.0 +# 8.0 +# 8.0 +``` +**TODO** Provide pointers to further details. + # Low Level Interface diff --git a/src/executor.jl b/src/executor.jl index 94aabba5ddd5..fe83db86a831 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -48,27 +48,26 @@ function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDA end arr end + # help the type inference + if allow_missing + args_vec = Union{NDArray,Void}[args_vec...] + else + args_vec = NDArray[args_vec...] + end args_hdr = MX_handle[(isa(x,Void) ? MX_handle(0) : x) for x in args_vec] return (args_hdr, args_vec) end @enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; - args_grad :: Union{Void,Vector{NDArray},Dict{Base.Symbol,NDArray}} = nothing, - aux_states :: Union{Void,Vector{NDArray},Dict{Base.Symbol,NDArray}} = nothing, + args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), + aux_states :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), grad_req :: Union{GRAD_REQ,Vector{GRAD_REQ},Dict{Base.Symbol,GRAD_REQ}} = GRAD_WRITE) arg_names = list_arguments(self) - args_hdr, args = _get_ndarray_inputs("args", args, arg_names, false) - if isa(args_grad, Void) - args_grad = [nothing for i=1:length(args)] - args_grad_hdr = MX_handle[Ptr{Void}(0) for i=1:length(args)] - else - args_grad_hdr, args_grad = _get_ndarray_inputs("args_grad", args_grad, arg_names, true) - end - - if isa(aux_states, Void); aux_states = NDArray[]; end + args_hdr, args = _get_ndarray_inputs("args", args, arg_names, false) + args_grad_hdr, args_grad = 
_get_ndarray_inputs("args_grad", args_grad, arg_names, true) aux_args_hdr, aux_states = _get_ndarray_inputs("aux_states", aux_states, list_auxiliary_states(self), false) if isa(grad_req, GRAD_REQ) @@ -90,6 +89,17 @@ function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict executor = Executor(MX_ExecutorHandle(ref_hdr[]), self, args, args_grad, aux_states) end +function bind(self :: Symbol; kwargs...) + kwargs = Dict(kwargs) + @assert(haskey(kwargs, :args), "Must specify args") + args = pop!(kwargs, :args) + if haskey(kwargs, :context) + context = pop!(kwargs, :context) + else + context = cpu() + end + bind(self, context, args; kwargs...) +end function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) arg_shapes, out_shapes, aux_shapes = infer_shape(self; kwargs...) From af5645615b8e19265de1088fbf49a7b95f7b030c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Oct 2015 17:56:43 -0400 Subject: [PATCH 085/630] part of the doc on NDArrays --- docs/user-guide/overview.md | 15 ++++++++++++++- 1 file changed, 14 insertions(+), 1 deletion(-) diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md index 79c8ff6b5d6b..b750877ed1bd 100644 --- a/docs/user-guide/overview.md +++ b/docs/user-guide/overview.md @@ -130,6 +130,19 @@ copy(c_exec.outputs[1]) # copy turns NDArray into Julia Array # 8.0 # 8.0 ``` -**TODO** Provide pointers to further details. +For neural networks, it is easier to use `simple_bind`. By providing the shape for input arguments, it will perform a shape inference for the rest of the arguments and create the `NDArray`s automatically. In practice, the binding and executing steps are hidden under the `Estimator` interface. + +**TODO** Provide pointers to estimator tutorial and further details about binding and symbolic API. # Low Level Interface + +## NDArrays + +`NDArray`s are basic building blocks of the actual computations in MXNet. 
It is like a Julia `Array` object, with some important differences listed here: + +* The actual data could live on different `Context` (e.g. GPUs). For some contexts, iterating into the elements one by one is very slow, thus indexing into `NDArray` is not supported in general. The easiest way to inspect the contents of an `NDArray` is to use the `copy` function to copy the contents as a Julia `Array`. +* Operations on `NDArray`s (including basic arithmetics and neural network related operators) are executed in parallel with automatic dependency tracking to ensure correctness. + +While most of the computation is hidden in libmxnet by operators corresponding to various neural network layers. Getting familiar with the `NDArray` API is useful for implementing `Optimizer`s or customized operators in Julia directly. + +## Distributed Key-value Store From cf9a06a0122f21279e844e86cef276611e254b0a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 01:22:54 -0400 Subject: [PATCH 086/630] getindex operator for NDArray --- docs/user-guide/overview.md | 100 ++++++++++++++++++++++++++++++++++++ src/ndarray.jl | 11 ++++ 2 files changed, 111 insertions(+) diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md index b750877ed1bd..40abe770363c 100644 --- a/docs/user-guide/overview.md +++ b/docs/user-guide/overview.md @@ -142,7 +142,107 @@ For neural networks, it is easier to use `simple_bind`. By providing the shape f * The actual data could live on different `Context` (e.g. GPUs). For some contexts, iterating into the elements one by one is very slow, thus indexing into `NDArray` is not supported in general. The easiest way to inspect the contents of an `NDArray` is to use the `copy` function to copy the contents as a Julia `Array`. * Operations on `NDArray`s (including basic arithmetics and neural network related operators) are executed in parallel with automatic dependency tracking to ensure correctness. 
+* There are no generics in `NDArray`; the `eltype` is always `mx.MX_float`, because for applications in machine learning, single precision floating point numbers are typically the best choice, balancing precision, speed and portability. Also since libmxnet is designed to support multiple languages as front-ends, it is much simpler to implement with a fixed data type. While most of the computation is hidden in libmxnet by operators corresponding to various neural network layers. Getting familiar with the `NDArray` API is useful for implementing `Optimizer`s or customized operators in Julia directly. +The following are common ways to create `NDArray` objects: + +* `mx.empty(shape[, context])`: create an uninitialized array of a given shape on a specific device. For example, `mx.empty(2,3)`, `mx.empty((2,3), mx.gpu(2))`. +* `mx.zeros(shape[, context])` and `mx.ones(shape[, context])`: similar to Julia's built-in `zeros` and `ones`. +* `mx.copy(jl_arr, context)`: copy the contents of a Julia `Array` to a specific device. + +Most of the convenient functions like `size`, `length`, `ndims`, `eltype` on array objects should work out-of-the-box. Although indexing is not supported, it is possible to take *slices*: +```julia +a = mx.ones(2,3) +b = mx.slice(a, 1:2) +b[:] = 2 +println(copy(a)) +# => +# Float32[2.0 2.0 1.0 +# 2.0 2.0 1.0] +``` +A slice is a sub-region sharing the same memory with the original `NDArray` object. A slice is always a contiguous piece of memory, so only slicing on the *last* dimension is supported. The example above also shows a way to set the contents of an `NDArray`. 
+```julia +a = mx.empty(2,3) +a[:] = 0.5 # set all elements to a scalar +a[:] = rand(size(a)) # set contents with a Julia Array +copy!(a, rand(size(a))) # set value by copying a Julia Array +b = mx.empty(size(a)) +b[:] = a # copying and assignment between NDArrays +``` +Note that due to an intrinsic design limitation of the Julia language, a normal assignment +```julia +a = b +``` +does **not** mean copying the contents of `b` to `a`. Instead, it just makes the variable `a` point to a new object, which is `b`. Similarly, inplace arithmetic does not work as expected: +```julia +a = mx.ones(2) +r = a # keep a reference to a +b = mx.ones(2) +a += b # translates to a = a + b +println(copy(a)) +# => Float32[2.0f0,2.0f0] +println(copy(r)) +# => Float32[1.0f0,1.0f0] +``` +As we can see, `a` has the expected value, but instead of inplace updating, a new `NDArray` is created and `a` is set to point to this new object. If we look at `r`, which still refers to the old `a`, its content has not changed. There is currently no way in Julia to overload the operators like `+=` to get customized behavior. + +Instead, you will need to write `a[:] = a+b`, or if you want *real* inplace `+=` operation, MXNet.jl provides a simple macro `@mx.inplace`: +```julia +@mx.inplace a += b +macroexpand(:(@mx.inplace a += b)) +# => :(MXNet.mx.add_to!(a,b)) +``` +As we can see, it translate the `+=` operator to an explicit `add_to!` function call, which invokes into libmxnet to add the contents of `b` into `a` directly. For example, the following is the update rule in the SGD `Optimizer` (both `grad` and `weight` are `NDArray` objects): +```julia +@inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) +``` +Note there is no much magic in `mx.inplace`: it only does a shallow translation. In the SGD update rule example above, the computation like scaling the gradient by `grad_scale` and adding the weight decay all create temporary `NDArray` objects. 
However, libmxnet has a customized memory allocator designed specifically to handle this kind of situations. So typically creating temp intermediate arrays is not a problem. The following snippet does a simple benchmark on allocating temp `NDArray`s vs. pre-allocating: +```julia +using Benchmark +using MXNet + +N_REP = 1000 +SHAPE = (128, 64) +CTX = mx.cpu() +LR = 0.1 + +function inplace_op() + weight = mx.zeros(SHAPE, CTX) + grad = mx.ones(SHAPE, CTX) + + # pre-allocate temp objects + grad_lr = mx.empty(SHAPE, CTX) + + for i = 1:N_REP + copy!(grad_lr, grad) + @mx.inplace grad_lr .*= LR + @mx.inplace weight -= grad_lr + end + return weight +end + +function normal_op() + weight = mx.zeros(SHAPE, CTX) + grad = mx.ones(SHAPE, CTX) + + for i = 1:N_REP + weight[:] -= LR * grad + end + return weight +end + +# make sure the results are the same +@assert(maximum(abs(copy(normal_op() - inplace_op()))) < 1e-6) + +println(compare([inplace_op, normal_op], 100)) +``` +The comparison on my laptop shows that + +| Row | Function | Average | Relative | Replications | +|-----|--------------|-----------|----------|--------------| +| 1 | "inplace_op" | 0.0074854 | 1.0 | 100 | +| 2 | "normal_op" | 0.0174202 | 2.32723 | 100 | + ## Distributed Key-value Store diff --git a/src/ndarray.jl b/src/ndarray.jl index a868495a846b..30b08b8ff1e9 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -167,6 +167,17 @@ function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, id copy!(slice(arr, idx), val) end +import Base: getindex +"""Shortcut for `slice`. **NOTE** the behavior for Julia's built-in index slicing is to create a +copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. 
+""" +function getindex(arr :: NDArray, ::Colon) + return arr +end +function getindex(arr :: NDArray, idx::UnitRange{Int}) + slice(arr, idx) +end + #------------------------------------------------------------ # Copying functions #------------------------------------------------------------ From 3a265442b4b2e612df576815b19c3506fff05c31 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 01:54:05 -0400 Subject: [PATCH 087/630] ndarray doc --- docs/user-guide/overview.md | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md index 40abe770363c..e09b3ec4d002 100644 --- a/docs/user-guide/overview.md +++ b/docs/user-guide/overview.md @@ -238,11 +238,13 @@ end println(compare([inplace_op, normal_op], 100)) ``` -The comparison on my laptop shows that +The comparison on my laptop shows that `normal_op` while allocating a lot of temp `NDArray`s in the loop (the performance gets worse when increasing `N_REP`), is only about twice slower than the pre-allocated one. | Row | Function | Average | Relative | Replications | |-----|--------------|-----------|----------|--------------| | 1 | "inplace_op" | 0.0074854 | 1.0 | 100 | | 2 | "normal_op" | 0.0174202 | 2.32723 | 100 | +So it will typically not be a problem unless you are at the bottleneck of the computation (e.g. implementing some neural network layers in Julia). 
+ ## Distributed Key-value Store From 0c3d0668df8c908c56da93b48597a6504b35ff75 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 12:22:40 -0400 Subject: [PATCH 088/630] API variable -> Variable; group -> Group --- examples/cifar10/cifar10.jl | 2 +- examples/mnist/lenet.jl | 2 +- examples/mnist/mlp.jl | 2 +- src/ndarray.jl | 3 +++ src/symbol.jl | 4 ++-- test/common.jl | 2 +- test/unittest/bind.jl | 4 ++-- test/unittest/symbol.jl | 6 +++--- 8 files changed, 14 insertions(+), 11 deletions(-) diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index 9d627b0471c2..50d399e32d5e 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -36,7 +36,7 @@ end #-------------------------------------------------------------------------------- # Actual architecture -data = mx.variable(:data) +data = mx.Variable(:data) conv1 = conv_factory(data, 96, (3,3); pad=(1,1), act_type=:relu) in3a = simple_factory(conv1, 32, 32) in3b = simple_factory(in3a, 32, 48) diff --git a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl index 7efe4c42eedc..d8e8c9fea0ee 100644 --- a/examples/mnist/lenet.jl +++ b/examples/mnist/lenet.jl @@ -4,7 +4,7 @@ using MXNet # define lenet # input -data = mx.variable(:data) +data = mx.Variable(:data) # first conv conv1 = mx.Convolution(data=data, kernel=(5,5), num_filter=20) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index c2d30235e0f6..e8c095a613fe 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -1,7 +1,7 @@ using MXNet # define MLP -data = mx.variable(:data) +data = mx.Variable(:data) fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) diff --git a/src/ndarray.jl b/src/ndarray.jl index 30b08b8ff1e9..c3207b8aa963 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -325,6 +325,9 @@ function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) 
ret = copy(arg0, context(arg0)) mul_to!(ret, arg) end +function .*(arg0 :: Real, arg :: NDArray) + .*(arg, arg0) +end # unlike *, we only allow type Real in arguments, because array-array * operator # means matrix multiplication in Julia function *(arg0 :: NDArray, arg :: Real) diff --git a/src/symbol.jl b/src/symbol.jl index 013c24d865c5..e0daf53e36c3 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -67,14 +67,14 @@ function get_internals(self :: Symbol) end "Create a symbolic variable with the given name" -function variable(name :: Union{Base.Symbol, AbstractString}) +function Variable(name :: Union{Base.Symbol, AbstractString}) hdr_ref = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) Symbol(MX_SymbolHandle(hdr_ref[])) end "Create a symbol that groups symbols together" -function group(symbols :: Symbol...) +function Group(symbols :: Symbol...) handles = MX_handle[symbols...] ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateGroup, (MX_uint, Ptr{MX_handle}, Ref{MX_handle}), diff --git a/test/common.jl b/test/common.jl index 51dc1ed43ec4..fc4c4f63649e 100644 --- a/test/common.jl +++ b/test/common.jl @@ -12,7 +12,7 @@ function rand_dims(max_ndim=6) end function mlp2() - data = mx.variable(:data) + data = mx.Variable(:data) out = mx.FullyConnected(data=data, name=:fc1, num_hidden=1000) out = mx.Activation(data=out, act_type=:relu) out = mx.FullyConnected(data=out, name=:fc2, num_hidden=10) diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index 9f480f3f20f3..760e261fe581 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -11,8 +11,8 @@ function test_arithmetic(uf, gf) shape = rand_dims() info("Bind::arithmetic::$uf::dims = $shape") - lhs = mx.variable(:lhs) - rhs = mx.variable(:rhs) + lhs = mx.Variable(:lhs) + rhs = mx.Variable(:rhs) ret = uf(lhs, rhs) @test mx.list_arguments(ret) == [:lhs, :rhs] diff --git a/test/unittest/symbol.jl b/test/unittest/symbol.jl index b62496d20fbc..fecb25c159a8 100644 
--- a/test/unittest/symbol.jl +++ b/test/unittest/symbol.jl @@ -19,7 +19,7 @@ end function test_internal() info("Symbol::internal") - data = mx.variable(:data) + data = mx.Variable(:data) oldfc = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) net1 = mx.FullyConnected(data=oldfc, name=:fc2, num_hidden=100) @@ -33,7 +33,7 @@ end function test_compose() info("Symbol::compose") - data = mx.variable(:data) + data = mx.Variable(:data) net1 = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) net1 = mx.FullyConnected(data=net1, name=:fc2, num_hidden=100) @@ -42,7 +42,7 @@ function test_compose() net2 = mx.FullyConnected(data=net2, name=:fc4, num_hidden=20) composed = net2(fc3_data=net1, name=:composed) - multi_out = mx.group(composed, net1) + multi_out = mx.Group(composed, net1) @test mx.list_outputs(multi_out) == [:composed_output, :fc2_output] end From 9665cb1cb7112683cd8728b228aa1be487101d5e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 12:25:03 -0400 Subject: [PATCH 089/630] update doc: variable -> Variable --- docs/user-guide/overview.md | 40 +++++++++++++++++++++++++------------ 1 file changed, 27 insertions(+), 13 deletions(-) diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md index e09b3ec4d002..33567bd7817d 100644 --- a/docs/user-guide/overview.md +++ b/docs/user-guide/overview.md @@ -20,13 +20,13 @@ The way we build deep learning models in MXNet.jl is to use the powerful symboli The basic type is `mx.Symbol`. The following is a trivial example of composing two symbols with the `+` operation. ```julia -A = mx.variable(:A) -B = mx.variable(:B) +A = mx.Variable(:A) +B = mx.Variable(:B) C = A + B ``` We get a new *symbol* by composing existing *symbols* by some *operations*. A hierarchical architecture of a deep neural network could be realized by recursive composition. 
For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of 128 units and a ReLU activation function. ```julia -net = mx.variable(:data) +net = mx.Variable(:data) net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) net = mx.Activation(data=net, name=:relu1, act_type=:relu) net = mx.FullyConnected(data=net, name=:fc2, num_hidden=64) @@ -53,8 +53,8 @@ julia> mx.list_arguments(net) ``` Note the names of the arguments are generated according to the provided name for each layer. We can also specify those names explicitly: ```julia -net = mx.variable(:data) -w = mx.variable(:myweight) +net = mx.Variable(:data) +w = mx.Variable(:myweight) net = mx.FullyConnected(data=data, weight=w, name=:fc1, num_hidden=128) mx.list_arguments(net) # => @@ -63,11 +63,11 @@ mx.list_arguments(net) # :myweight # :fc1_bias ``` -The simple fact is that a `variable` is just a placeholder `mx.Symbol`. In composition, we can use arbitrary symbols for arguments. For example: +The simple fact is that a `Variable` is just a placeholder `mx.Symbol`. In composition, we can use arbitrary symbols for arguments. For example: ```julia -net = mx.variable(:data) +net = mx.Variable(:data) net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) -net2 = mx.variable(:data2) +net2 = mx.Variable(:data2) net2 = mx.FullyConnected(data=net2, name=:net2, num_hidden=128) mx.list_arguments(net2) # => @@ -91,7 +91,7 @@ Note we use a composed symbol, `net` as the argument `data2` for `net2` to get a Given enough information, the shapes of all arguments in a composed symbol could be inferred automatically. For example, given the input shape, and some hyper-parameters like `num_hidden`, the shapes for the weights and bias in a neural network could be inferred. 
```julia -net = mx.variable(:data) +net = mx.Variable(:data) net = mx.FullyConnected(data=net, name=:fc1, num_hidden=10) arg_shapes, out_shapes, aux_shapes = mx.infer_shape(net, data=(10, 64)) ``` @@ -115,8 +115,8 @@ end In order to execute the computation graph specified a composed symbol, we will *bind* the free variables to concrete values, specified as `mx.NDArray`s. This will create an `mx.Executor` on a given `mx.Context`. A context describes the computation devices (CPUs, GPUs, etc.) and an executor will carry out the computation (forward/backward) specified in the corresponding symbolic composition. ```julia -A = mx.variable(:A) -B = mx.variable(:B) +A = mx.Variable(:A) +B = mx.Variable(:B) C = A .* B a = mx.ones(3) * 4 b = mx.ones(3) * 2 @@ -198,7 +198,7 @@ As we can see, it translate the `+=` operator to an explicit `add_to!` function ```julia @inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) ``` -Note there is no much magic in `mx.inplace`: it only does a shallow translation. In the SGD update rule example above, the computation like scaling the gradient by `grad_scale` and adding the weight decay all create temporary `NDArray` objects. However, libmxnet has a customized memory allocator designed specifically to handle this kind of situations. So typically creating temp intermediate arrays is not a problem. The following snippet does a simple benchmark on allocating temp `NDArray`s vs. pre-allocating: +Note there is no much magic in `mx.inplace`: it only does a shallow translation. In the SGD update rule example above, the computation like scaling the gradient by `grad_scale` and adding the weight decay all create temporary `NDArray` objects. To mitigate this issue, libmxnet has a customized memory allocator designed specifically to handle this kind of situations. The following snippet does a simple benchmark on allocating temp `NDArray`s vs. 
pre-allocating: ```julia using Benchmark using MXNet @@ -245,6 +245,20 @@ The comparison on my laptop shows that `normal_op` while allocating a lot of tem | 1 | "inplace_op" | 0.0074854 | 1.0 | 100 | | 2 | "normal_op" | 0.0174202 | 2.32723 | 100 | -So it will typically not be a problem unless you are at the bottleneck of the computation (e.g. implementing some neural network layers in Julia). +So it will usually not be a big problem unless you are at the bottleneck of the computation. ## Distributed Key-value Store + +The type `KVStore` and related methods are used for data sharing across different devices or machines. It provides a simple and efficient integer-`NDArray` key-value storage system that each device can pull or push. + +The following example shows how to create a `local` `KVStore`, initialize a value and then pull it back. +```julia +kv = mx.KVStore(:local) +shape = (2,3) +key = 3 + +mx.init!(kv, key, mx.ones(shape)*2) +a = mx.empty(shape) +mx.pull!(kv, key, a) # pull value into a +println(copy(a)) +``` From 210aba8530931aa97f2fc1d8c7985c1350dc6ce0 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 12:26:08 -0400 Subject: [PATCH 090/630] add libmxnet.dll into library search list --- src/init.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/init.jl b/src/init.jl index 2c4239ce8d25..eae4cd8995b9 100644 --- a/src/init.jl +++ b/src/init.jl @@ -16,7 +16,7 @@ typealias char_pp Ptr{char_p} ################################################################################ # Initialization and library API entrance ################################################################################ -const MXNET_LIB = Libdl.find_library(["libmxnet.so"], ["$(get(ENV,"MXNET_HOME",""))/lib"]) +const MXNET_LIB = Libdl.find_library(["libmxnet.so","libmxnet.dll"], ["$(get(ENV,"MXNET_HOME",""))/lib"]) function __init__() _import_ndarray_functions() From 478568c9cbabc24c062da9599334e0fd287210ab Mon Sep 17 00:00:00 2001 From: Chiyuan 
Zhang Date: Thu, 22 Oct 2015 13:03:52 -0400 Subject: [PATCH 091/630] doc for mnist --- docs/tutorials/mnist.md | 72 +++++++++++++++++++++++++++++++++++++++++ examples/mnist/mlp.jl | 2 +- mkdocs.yml | 2 ++ 3 files changed, 75 insertions(+), 1 deletion(-) create mode 100644 docs/tutorials/mnist.md diff --git a/docs/tutorials/mnist.md b/docs/tutorials/mnist.md new file mode 100644 index 000000000000..dfddf7408e6a --- /dev/null +++ b/docs/tutorials/mnist.md @@ -0,0 +1,72 @@ +In this tutorial, we will work through examples of training a simple multi-layer perceptron and then a convolutional neural network (the LeNet architecture) on the [MNIST handwritten digit dataset](http://yann.lecun.com/exdb/mnist/). The code for this tutorial can be found in [`Pkg.dir("MXNet")`/examples/mnist/](https://github.com/dmlc/MXNet.jl/tree/master/examples/mnist). + +# Simple 3-layer MLP + +This is a tiny 3-layer MLP that could be easily trained on CPU. The script starts with +```julia +using MXNet +``` +to load the `MXNet` module. Then we are ready to define the network architecture via the [symbolic API](../user-guide/overview.md#symbols-and-composition). We start with a placeholder `data` symbol, +```julia +data = mx.Variable(:data) +``` +and then cascade fully-connected layers and activation functions: +```julia +fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) +act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) +fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) +act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) +fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) +``` +Note that in each composition we take the previous symbol as the `data` argument, forming a feedforward chain. The architecture looks like +``` +Input --> 128 units (ReLU) --> 64 units (ReLU) --> 10 units +``` +where the last 10 units correspond to the 10 output classes (digits 0,...,9). 
We then add a final `Softmax` operation to turn the 10-dimensional prediction to proper probability values for the 10 classes: +```julia +mlp = mx.Softmax(data = fc3, name=:softmax) +``` + +After defining the architecture, we are ready to load the MNIST data. MXNet.jl provide built-in data providers for the MNIST dataset, which could automatically download the dataset into `Pkg.dir("MXNet")/data/mnist` if necessary. We wrap the code to construct the data provider into `mnist-data.jl` so that it could be shared by both the MLP example and the LeNet ConvNets example. +```julia +batch_size = 100 +include("mnist-data.jl") +train_provider, eval_provider = get_mnist_providers(batch_size) +``` +If you need to write your own data providers for customized data format, please refer to **TODO**: pointer to data provider API. + +Given the architecture and data, we can instantiate an *estimator* to do the actual training. `mx.FeedForward` is the built-in estimator that is suitable for most feed-forward architectures. When constructing the estimator, we also specify the *context* on which the computation should be carried out. Because this is a really tiny MLP, we will just run on a single CPU device. +```julia +estimator = mx.FeedForward(mlp, context=mx.cpu()) +``` +You can use a `mx.gpu()` or if a list of devices (e.g. `[mx.gpu(0), mx.gpu(1)]`) is provided, data-parallelization will be used automatically. But for this tiny example, using a GPU device might not help. + +The last thing we need to specify is the optimization algorithm (a.k.a. *optimizer*) to use. We use the basic SGD with a fixed learning rate 0.1 and momentum 0.9: +```julia +optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.1), + mom_scheduler=mx.FixedMomentumScheduler(0.9), + weight_decay=0.00001) +``` +Now we can do the training. Here the `epoch_stop` parameter specifies that we want to train for 20 epochs. We also supply a `eval_data` to monitor validation accuracy on the validation set. 
+```julia +mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) +``` +Here is a sample output +``` +INFO: Start training on [CPU0] +INFO: Initializing parameters... +INFO: Creating KVStore... +INFO: == Epoch 001 ========== +INFO: ## Training summary +INFO: :accuracy = 0.7554 +INFO: time = 1.3165 seconds +INFO: ## Validation summary +INFO: :accuracy = 0.9502 +... +INFO: == Epoch 020 ========== +INFO: ## Training summary +INFO: :accuracy = 0.9949 +INFO: time = 0.9287 seconds +INFO: ## Validation summary +INFO: :accuracy = 0.9775 +``` diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index e8c095a613fe..a30e876ae708 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -15,7 +15,7 @@ include("mnist-data.jl") train_provider, eval_provider = get_mnist_providers(batch_size) # setup estimator -estimator = mx.FeedForward(mlp, context=mx.Context(mx.CPU)) +estimator = mx.FeedForward(mlp, context=mx.cpu()) # optimizer optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.1), diff --git a/mkdocs.yml b/mkdocs.yml index c364b2d4f3a6..78822e3ada5a 100644 --- a/mkdocs.yml +++ b/mkdocs.yml @@ -7,6 +7,8 @@ pages: - User Guide: - 'Installation Guide' : 'user-guide/install.md' - 'Overview' : 'user-guide/overview.md' + - Tutorials: + - 'MNIST': 'tutorials/mnist.md' - API Documentation: - 'ndarray': 'api/ndarray.md' - 'symbol': 'api/symbol.md' From d15bc779ab829327f2162ea9525e2cf22e66f819 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 17:17:42 -0400 Subject: [PATCH 092/630] add mx.chain macro --- README.md | 10 ++++++++++ examples/mnist/mlp.jl | 27 ++++++++++++++++++++------- src/symbol.jl | 29 +++++++++++++++++++++++++++++ 3 files changed, 59 insertions(+), 7 deletions(-) diff --git a/README.md b/README.md index 4852bcd52161..2df461d4993c 100644 --- a/README.md +++ b/README.md @@ -6,3 +6,13 @@ Julia wrapper of [MXNet](https://github.com/dmlc/mxnet). 
+ +```julia +mlp = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=128) => + mx.Activation(name=:relu1, act_type=:relu) => + mx.FullyConnected(name=:fc2, num_hidden=64) => + mx.Activation(name=:relu2, act_type=:relu) => + mx.FullyConnected(name=:fc3, num_hidden=10) => + mx.Softmax(name=:softmax) +``` diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index a30e876ae708..8fab150ad7a7 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -1,13 +1,26 @@ using MXNet +#-------------------------------------------------------------------------------- # define MLP -data = mx.Variable(:data) -fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) -act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) -fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) -act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) -fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) -mlp = mx.Softmax(data = fc3, name=:softmax) +# the following two ways are equivalent + +#-- Option 1: explicit composition +# data = mx.Variable(:data) +# fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) +# act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) +# fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) +# act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) +# fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) +# mlp = mx.Softmax(data = fc3, name=:softmax) + +#-- Option 2: using the mx.chain macro +mlp = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=128) => + mx.Activation(name=:relu1, act_type=:relu) => + mx.FullyConnected(name=:fc2, num_hidden=64) => + mx.Activation(name=:relu2, act_type=:relu) => + mx.FullyConnected(name=:fc3, num_hidden=10) => + mx.Softmax(name=:softmax) # data provider batch_size = 100 diff --git a/src/symbol.jl b/src/symbol.jl index e0daf53e36c3..b69dfd37f226 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ 
-349,3 +349,32 @@ function _import_atomic_symbol_creators() _define_atomic_symbol_creator(creator_hdr) end end + +################################################################################ +# Utility macros to chain up symbols +################################################################################ +macro chain(layers) + exprs = [] + last_layer = nothing + function _chain_layer(layer, last_layer) + if isa(last_layer, Void) + layer + else + @assert(isa(layer, Expr) && layer.head == :call, "Do not know how to chain up $layer") + return Expr(:call, layer.args[1], last_layer, layer.args[2:end]...) + end + end + while true + if layers.head == :(=>) + new_layer = gensym() + push!(exprs, :($new_layer = $(_chain_layer(layers.args[1], last_layer)))) + last_layer = new_layer + layers = layers.args[2] + else + push!(exprs, _chain_layer(layers, last_layer)) + break + end + end + return Expr(:block, exprs...) +end + From e9088f5d64ced63ac988bf7fa60eb74403f2168a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 18:22:38 -0400 Subject: [PATCH 093/630] rename init.jl -> base.jl --- src/{init.jl => base.jl} | 66 ++++++++++++++++++++++++++++++++++++++++ 1 file changed, 66 insertions(+) rename src/{init.jl => base.jl} (69%) diff --git a/src/init.jl b/src/base.jl similarity index 69% rename from src/init.jl rename to src/base.jl index eae4cd8995b9..b3c6cee026dc 100644 --- a/src/init.jl +++ b/src/base.jl @@ -129,3 +129,69 @@ end function dump_mx_param{N,T<:Integer}(shape :: NTuple{N, T}) string(tuple(flipdim([shape...],1)...)) end + +"""A convenient macro copied from Mocha.jl that could be used to define structs +with default values and type checks. 
For example +```julia +@defstruct MyStruct Any ( + field1 :: Int = 0, + (field2 :: AbstractString = "", !isempty(field2)) +) +``` +where each field could be either +```julia +field_name :: field_type = default_value +``` +or put within a tuple, with the second element +specifying a validation check on the field value. +In the example above, the default value for +field2 does not satisfy the assertion, this +could be used to force user to provide a +valid value when no meaningful default value +is available. + +The macro will define a constructor that could accept +the keyword arguments. +""" +macro defstruct(name, super_name, fields) + @assert fields.head == :tuple + fields = fields.args + @assert length(fields) > 0 + name = esc(name) + + field_defs = Array(Expr, length(fields)) # :(field2 :: Int) + field_names = Array(Base.Symbol, length(fields)) # :field2 + field_defaults = Array(Expr, length(fields)) # :(field2 :: Int = 0) + field_asserts = Array(Expr, length(fields)) # :(field2 >= 0) + + for i = 1:length(fields) + field = fields[i] + if field.head == :tuple + field_asserts[i] = field.args[2] + field = field.args[1] + end + field_defs[i] = esc(field.args[1]) + field_names[i] = field.args[1].args[1] + field_defaults[i] = Expr(:kw, field.args...) + end + + # body of layer type, defining fields + type_body = Expr(:block, field_defs...) + + # constructor + asserts = map(filter(i -> isdefined(field_asserts,i), 1:length(fields))) do i + :(@assert($(field_asserts[i]))) + end + construct = Expr(:call, name, field_names...) 
+ ctor_body = Expr(:block, asserts..., construct) + ctor_def = Expr(:call, name, Expr(:parameters, field_defaults...)) + ctor = Expr(:(=), ctor_def, ctor_body) + + quote + type $(name) <: $super_name + $type_body + end + + $ctor + end +end From bed3a02d7b1ef58aab2db80e620433965af5514c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 18:22:55 -0400 Subject: [PATCH 094/630] refactor optimizer options --- src/MXNet.jl | 2 +- src/estimator.jl | 2 +- src/optimizer.jl | 50 +++---------------------------------- src/optimizers/sgd.jl | 57 +++++++++++++++++++++++++++++++++++++++++++ 4 files changed, 62 insertions(+), 49 deletions(-) create mode 100644 src/optimizers/sgd.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index cfa56b21d292..0e56b743d5d5 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -8,7 +8,7 @@ export mx module mx using Formatting -include("init.jl") +include("base.jl") include("context.jl") include("ndarray.jl") diff --git a/src/estimator.jl b/src/estimator.jl index e349ec952115..42402d0a2bdf 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -138,7 +138,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra param_arrays = [NDArray[exec.arg_arrays[i] for exec in train_execs] for i in param_idx] grad_arrays = [NDArray[exec.grad_arrays[i] for exec in train_execs] for i in param_idx] - optimizer.inv_batch_size = 1.0/batch_size + optimizer.batch_size = batch_size if !update_on_kvstore updater = get_updater(optimizer) diff --git a/src/optimizer.jl b/src/optimizer.jl index 191fc6a855c2..d01f92e7d735 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -17,53 +17,6 @@ type FixedMomentumScheduler <: AbstractMomentumScheduler end get_momentum(self :: FixedMomentumScheduler, iter :: Int) = self.momentum -type SGD <: AbstractOptimizer - iter :: Int - - lr_scheduler :: AbstractLearningRateScheduler - mom_scheduler :: AbstractMomentumScheduler - weight_decay :: Float64 - grad_scale :: Float64 - grad_clip :: Float64 - 
inv_batch_size:: Float64 - - function SGD(;lr_scheduler::AbstractLearningRateScheduler=FixedLearningRateScheduler(0.01), - mom_scheduler::AbstractMomentumScheduler=NullMomentumScheduler(), - weight_decay::Float64=0.0001, - grad_scale::Float64=1.0, - grad_clip::Float64=0.0) - new(0, lr_scheduler, mom_scheduler, weight_decay, grad_scale, grad_clip, 1.0) - end -end - -function create_state(self :: SGD, index :: Int, weight :: NDArray) - if isa(self.mom_scheduler, NullMomentumScheduler) - return nothing - else - return zeros(size(weight), context(weight)) - end -end - -function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Union{Void, NDArray}) - lr = get_learning_rate(self.lr_scheduler, self.iter) - grad_scale = self.grad_scale * self.inv_batch_size - - if isa(state, Void) - @inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) - else - mom = state :: NDArray - coef = get_momentum(self.mom_scheduler, self.iter) - @inplace mom .*= coef - if self.grad_clip > 0 - # TODO: - else - @inplace mom += -lr * (grad_scale * grad + self.weight_decay * weight) - end - @inplace weight += mom - end -end - - function get_updater(optimizer :: AbstractOptimizer) states = Dict{Int,Any}() function updater(index :: Int, grad :: NDArray, weight :: NDArray) @@ -74,3 +27,6 @@ function get_updater(optimizer :: AbstractOptimizer) end return updater end + + +include("optimizers/sgd.jl") diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl new file mode 100644 index 000000000000..4e6a6757fb67 --- /dev/null +++ b/src/optimizers/sgd.jl @@ -0,0 +1,57 @@ +@defstruct SGDOptions Any ( + (lr :: Real = 0.01, lr > 0), + (momentum :: Real = 0.0, momentum >= 0), + (weight_decay :: Real = 0.0001, weight_decay >= 0), + (grad_scale :: Real = 1.0, grad_scale >= 0), + (grad_clip :: Real = 0, grad_clip >= 0), + lr_scheduler :: Any = nothing, + mom_scheduler :: Any = nothing +) + + +type SGD <: AbstractOptimizer + iter :: Int + batch_size :: Int + opts :: 
SGDOptions + + function SGD(; kwargs...) + opts = SGDOptions(;kwargs...) + if !isa(opts.lr_scheduler, AbstractLearningRateScheduler) + opts.lr_scheduler = FixedLearningRateScheduler(opts.lr) + end + if !isa(opts.mom_scheduler, AbstractMomentumScheduler) + opts.mom_scheduler = opts.momentum > 0 ? + FixedMomentumScheduler(opts.momentum) : + NullMomentumScheduler() + end + + new(0, 0, opts) + end +end + +function create_state(self :: SGD, index :: Int, weight :: NDArray) + if isa(self.opts.mom_scheduler, NullMomentumScheduler) + return nothing + else + return zeros(size(weight), context(weight)) + end +end + +function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Union{Void, NDArray}) + lr = get_learning_rate(self.opts.lr_scheduler, self.iter) + grad_scale = self.opts.grad_scale / self.batch_size + + if isa(state, Void) + @inplace weight += -lr * (grad_scale * grad + self.opts.weight_decay * weight) + else + mom = state :: NDArray + coef = get_momentum(self.opts.mom_scheduler, self.iter) + @inplace mom .*= coef + if self.opts.grad_clip > 0 + # TODO: + else + @inplace mom += -lr * (grad_scale * grad + self.opts.weight_decay * weight) + end + @inplace weight += mom + end +end From a75a8efedc7f2944d4cad0515661a95643a2c5c5 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 18:24:06 -0400 Subject: [PATCH 095/630] simplify mnist mlp example --- examples/mnist/mlp.jl | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 8fab150ad7a7..66e1bdac49a8 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -31,9 +31,7 @@ train_provider, eval_provider = get_mnist_providers(batch_size) estimator = mx.FeedForward(mlp, context=mx.cpu()) # optimizer -optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.1), - mom_scheduler=mx.FixedMomentumScheduler(0.9), - weight_decay=0.00001) +optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit 
parameters mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) From 43b2486578509996a73bab93609a4cdaa9d6bff6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 18:29:44 -0400 Subject: [PATCH 096/630] clean up lenet example --- docs/tutorials/mnist.md | 14 +++++++++++--- examples/mnist/lenet.jl | 7 ++----- 2 files changed, 13 insertions(+), 8 deletions(-) diff --git a/docs/tutorials/mnist.md b/docs/tutorials/mnist.md index dfddf7408e6a..15b651d4b69c 100644 --- a/docs/tutorials/mnist.md +++ b/docs/tutorials/mnist.md @@ -26,6 +26,16 @@ where the last 10 units correspond to the 10 output classes (digits 0,...,9). We ```julia mlp = mx.Softmax(data = fc3, name=:softmax) ``` +As we can see, the MLP is just a chain of layers. For this case, we can also use the `mx.chain` macro. The same architecture above can be defined as +```julia +mlp = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=128) => + mx.Activation(name=:relu1, act_type=:relu) => + mx.FullyConnected(name=:fc2, num_hidden=64) => + mx.Activation(name=:relu2, act_type=:relu) => + mx.FullyConnected(name=:fc3, num_hidden=10) => + mx.Softmax(name=:softmax) +``` After defining the architecture, we are ready to load the MNIST data. MXNet.jl provide built-in data providers for the MNIST dataset, which could automatically download the dataset into `Pkg.dir("MXNet")/data/mnist` if necessary. We wrap the code to construct the data provider into `mnist-data.jl` so that it could be shared by both the MLP example and the LeNet ConvNets example. ```julia @@ -43,9 +53,7 @@ You can use a `mx.gpu()` or if a list of devices (e.g. `[mx.gpu(0), mx.gpu(1)]`) The last thing we need to specify is the optimization algorithm (a.k.a. *optimizer*) to use. 
We use the basic SGD with a fixed learning rate 0.1 and momentum 0.9: ```julia -optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.1), - mom_scheduler=mx.FixedMomentumScheduler(0.9), - weight_decay=0.00001) +optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) ``` Now we can do the training. Here the `epoch_stop` parameter specifies that we want to train for 20 epochs. We also supply a `eval_data` to monitor validation accuracy on the validation set. ```julia diff --git a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl index d8e8c9fea0ee..bcf0b02893b5 100644 --- a/examples/mnist/lenet.jl +++ b/examples/mnist/lenet.jl @@ -36,13 +36,10 @@ train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) #-------------------------------------------------------------------------------- # fit model -dev = mx.Context(mx.GPU) -estimator = mx.FeedForward(lenet, context=dev) +estimator = mx.FeedForward(lenet, context=mx.gpu()) # optimizer -optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), - mom_scheduler=mx.FixedMomentumScheduler(0.9), - weight_decay=0.00001) +optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) # fit parameters mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) From 02e4af36114fd5a18c4b97fc2ccd5a4884b9ecb5 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 20:55:07 -0400 Subject: [PATCH 097/630] hygiene in chain macro --- src/symbol.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/symbol.jl b/src/symbol.jl index b69dfd37f226..097fe1d5b20a 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -358,10 +358,10 @@ macro chain(layers) last_layer = nothing function _chain_layer(layer, last_layer) if isa(last_layer, Void) - layer + esc(layer) else @assert(isa(layer, Expr) && layer.head == :call, "Do not know how to chain up $layer") - return Expr(:call, layer.args[1], last_layer, layer.args[2:end]...) 
+ return Expr(:call, esc(layer.args[1]), last_layer, map(esc, layer.args[2:end])...) end end while true From 1fb4946797084a63f15558225732115cc479bff3 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 21:02:03 -0400 Subject: [PATCH 098/630] use @chain in lenet example. --- examples/mnist/lenet.jl | 20 ++++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl index bcf0b02893b5..af631e44c3bc 100644 --- a/examples/mnist/lenet.jl +++ b/examples/mnist/lenet.jl @@ -7,22 +7,22 @@ using MXNet data = mx.Variable(:data) # first conv -conv1 = mx.Convolution(data=data, kernel=(5,5), num_filter=20) -tanh1 = mx.Activation(data=conv1, act_type=:tanh) -pool1 = mx.Pooling(data=tanh1, pool_type=:max, kernel=(2,2), stride=(2,2)) +conv1 = @mx.chain mx.Convolution(data=data, kernel=(5,5), num_filter=20) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) # second conv -conv2 = mx.Convolution(data=pool1, kernel=(5,5), num_filter=50) -tanh2 = mx.Activation(data=conv2, act_type=:tanh) -pool2 = mx.Pooling(data=tanh2, pool_type=:max, kernel=(2,2), stride=(2,2)) +conv2 = @mx.chain mx.Convolution(data=conv1, kernel=(5,5), num_filter=50) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) # first fully-connected -flat = mx.Flatten(data=pool2) -fc1 = mx.FullyConnected(data=flat, num_hidden=500) -tanh3 = mx.Activation(data=fc1, act_type=:tanh) +fc1 = @mx.chain mx.Flatten(data=conv2) => + mx.FullyConnected(num_hidden=500) => + mx.Activation(act_type=:tanh) # second fully-connected -fc2 = mx.FullyConnected(data=tanh3, num_hidden=10) +fc2 = mx.FullyConnected(data=fc1, num_hidden=10) # softmax loss lenet = mx.Softmax(data=fc2, name=:softmax) From 3548a5ffa15064dcf223022a10ddaf6aacdc558f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 21:29:17 -0400 Subject: [PATCH 099/630] lenet tutorial --- README.md | 
15 +++++++++ docs/tutorials/mnist.md | 70 +++++++++++++++++++++++++++++++++++++++++ 2 files changed, 85 insertions(+) diff --git a/README.md b/README.md index 2df461d4993c..559d630473a2 100644 --- a/README.md +++ b/README.md @@ -8,6 +8,8 @@ Julia wrapper of [MXNet](https://github.com/dmlc/mxnet). ```julia +using MXNet + mlp = @mx.chain mx.Variable(:data) => mx.FullyConnected(name=:fc1, num_hidden=128) => mx.Activation(name=:relu1, act_type=:relu) => @@ -15,4 +17,17 @@ mlp = @mx.chain mx.Variable(:data) => mx.Activation(name=:relu2, act_type=:relu) => mx.FullyConnected(name=:fc3, num_hidden=10) => mx.Softmax(name=:softmax) + +# data provider +batch_size = 100 +train_provider, eval_provider = get_mnist_providers(batch_size) + +# setup estimator +estimator = mx.FeedForward(mlp, context=mx.cpu()) + +# optimizer +optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) + +# fit parameters +mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) ``` diff --git a/docs/tutorials/mnist.md b/docs/tutorials/mnist.md index 15b651d4b69c..219d8936f686 100644 --- a/docs/tutorials/mnist.md +++ b/docs/tutorials/mnist.md @@ -78,3 +78,73 @@ INFO: time = 0.9287 seconds INFO: ## Validation summary INFO: :accuracy = 0.9775 ``` + +# Convolutional Neural Networks + +In the second example, we show a slightly more complicated architecture that involves convolution and pooling. This architecture for the MNIST is usually called the *LeNet*. The first part of the architecture is listed below: +```julia +# input +data = mx.Variable(:data) + +# first conv +conv1 = @mx.chain mx.Convolution(data=data, kernel=(5,5), num_filter=20) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) + +# second conv +conv2 = @mx.chain mx.Convolution(data=conv1, kernel=(5,5), num_filter=50) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) +``` +We basically defined two convolution modules. 
Each convolution module is actually a chain of `Convolution`, `tanh` activation and then max `Pooling` operations. + +Each sample in the MNIST dataset is a 28x28 single-channel grayscale image. In the tensor format used by `NDArray`, a batch of 100 samples is a tensor of shape `(28,28,1,100)`. The convolution and pooling operates in the spatial axis, so `kernel=(5,5)` indicate a square region of 5-width and 5-height. +The rest of the architecture follows as: +```julia +# first fully-connected +fc1 = @mx.chain mx.Flatten(data=conv2) => + mx.FullyConnected(num_hidden=500) => + mx.Activation(act_type=:tanh) + +# second fully-connected +fc2 = mx.FullyConnected(data=fc1, num_hidden=10) + +# softmax loss +lenet = mx.Softmax(data=fc2, name=:softmax) +``` +Note a fully-connected operator expects the input to be a matrix. However, the results from spatial convolution and pooling are 4D tensors. So we explicitly used a `Flatten` operator to flat the tensor, before connecting it to the `FullyConnected` operator. + +The rest of the network is the same as the previous MLP example. As before, we can now load the MNIST dataset: +```julia +batch_size = 100 +include("mnist-data.jl") +train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) +``` +Note we specified `flat=false` to tell the data provider to provide 4D tensors instead of 2D matrices because the convolution operators needs correct spatial shape information. We then construct a feedforward model on GPU, and train it. 
+```julia +#-------------------------------------------------------------------------------- +# fit model +estimator = mx.FeedForward(lenet, context=mx.gpu()) + +# optimizer +optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) + +# fit parameters +mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) +``` +And here is a sample of running outputs: +``` +INFO: == Epoch 001 ========== +INFO: ## Training summary +INFO: :accuracy = 0.6750 +INFO: time = 4.9814 seconds +INFO: ## Validation summary +INFO: :accuracy = 0.9712 +... +INFO: == Epoch 020 ========== +INFO: ## Training summary +INFO: :accuracy = 1.0000 +INFO: time = 4.0086 seconds +INFO: ## Validation summary +INFO: :accuracy = 0.9915 +``` From 7c43f2cae15261d25d4b682dabcb730b44601fc5 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 21:37:33 -0400 Subject: [PATCH 100/630] update readme. --- README.md | 8 +++++++- docs/index.md | 2 ++ 2 files changed, 9 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 559d630473a2..acf0fca121fb 100644 --- a/README.md +++ b/README.md @@ -4,8 +4,12 @@ [![Documentation Status](https://readthedocs.org/projects/mxnetjl/badge/?version=latest)](http://mxnetjl.readthedocs.org/en/latest/?badge=latest) [![License](http://dmlc.github.io/img/apache2.svg)](LICENSE.md) +MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of features include: -Julia wrapper of [MXNet](https://github.com/dmlc/mxnet). +* Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. +* Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. 
+ +Here is an exmple of how training a simple 3-layer MLP on MNIST looks like: ```julia using MXNet @@ -31,3 +35,5 @@ optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit parameters mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) ``` + +For more details, please refer to the [document](http://mxnetjl.readthedocs.org/) and [examples](examples). diff --git a/docs/index.md b/docs/index.md index 350c3ab52fc9..c411cc86fd95 100644 --- a/docs/index.md +++ b/docs/index.md @@ -4,3 +4,5 @@ MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julia * Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. * Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. + +To install MXNet.jl, please follow the [installaton guide](user-guide/install.md). See the navigation menu in the sidebar for an [overview](user-guide/overview.md) of MXNet.jl and tutorials on training neural networks in MXNet.jl. 
From 3b43bcbd23c7db40f18d92ab4b794ceb3002dfe4 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 23:30:09 -0400 Subject: [PATCH 101/630] first version of deps/build.jl that is not working b/c opencv --- REQUIRE | 1 + deps/build.jl | 82 +++++++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 83 insertions(+) create mode 100644 deps/build.jl diff --git a/REQUIRE b/REQUIRE index 76fa30ce5f54..a0f5c9865565 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,2 +1,3 @@ julia 0.4 Formatting +BinDeps diff --git a/deps/build.jl b/deps/build.jl new file mode 100644 index 000000000000..00d088d4bc17 --- /dev/null +++ b/deps/build.jl @@ -0,0 +1,82 @@ +################################################################################ +# First try to detect and load existing libmxnet +################################################################################ +# if haskey(ENV, "MXNET_HOME") +# info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") +# info("Trying to load existing libmxnet...") +# lib = Libdl.find_library(["libmxnet.so","libmxnet.dll"], ["$(ENV["MXNET_HOME"])/lib"]) +# if !isempty(lib) +# info("Existing libmxnet detected at $lib") +# exit(0) +# else +# info("Failed to load existing libmxnet, trying to build from source...") +# end +# end + + +################################################################################ +# If not found, try to build automatically using BinDeps +################################################################################ +@windows_only begin + info("Automatic building libxmnet on Windows is currently not supported.") + info("Please follow the libmxnet documentation on how to build manually") + info("or to install pre-build packages:") + info("http://mxnet.readthedocs.org/en/latest/build.html#building-on-windows") + exit(-1) +end + +using BinDeps +@BinDeps.setup + +#-------------------------------------------------------------------------------- +# Install dependencies, opencv and blas +opencv_core 
= library_dependency("opencv_core", aliases=["libopencv_core"]) + +@linux_only begin + provides(AptGet, "libopencv-dev", opencv_core) + provides(Pacman, "opencv", opencv_core) + provides(Yum, "opencv", opencv_core) + + blas = library_dependency("blas", aliases=["libblas","libblas.so.3"]) + provides(AptGet, "libblas-dev", blas) + provides(Pacman, "blas", blas) + provides(Yum, "blas-devel", blas) +end + +@osx_only begin + using Homebrew + provides(Homebrew.HB, "opencv", opencv_core, os = :Darwin) + + # OSX has built-in BLAS we could use +end + +@BinDeps.install Dict(:opencv_core => :opencv_core) +@linux_only begin + @BinDeps.install Dict(:blas => :blas) +end + +#-------------------------------------------------------------------------------- +# Build libmxnet +mxnet = library_dependency("mxnet", aliases=["libmxnet"]) + +prefix = joinpath(BinDeps.depsdir(mxnet), "usr") +srcdir = joinpath(BinDeps.depsdir(mxnet),"src", "libmxnet") +libdir = joinpath(prefix, "lib") +provides(BuildProcess, + (@build_steps begin + CreateDirectory(srcdir) + CreateDirectory(libdir) + @build_steps begin + ChangeDirectory(srcdir) + `git clone --recursive https://github.com/dmlc/mxnet` + FileRule(joinpath(libdir, "libmxnet.so"), @build_steps begin + ChangeDirectory("mxnet") + @osx_only `cp make/osx.mk config.mk` + @osx_only `echo hahahahahahahaha=================` + `make` + `cp lib/libmxnet.so $libdir` + end) + end + end), mxnet) + + @BinDeps.install Dict(:mxnet => :mxnet) From e77fdd0f234858943606a61c90a506f92e7a9cf1 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Oct 2015 23:56:31 -0400 Subject: [PATCH 102/630] default building without opencv. 
--- .gitignore | 4 +++- deps/build.jl | 29 ++++++++--------------------- src/base.jl | 4 +++- 3 files changed, 14 insertions(+), 23 deletions(-) diff --git a/.gitignore b/.gitignore index 1b5cdca45b40..5660a75bb89b 100644 --- a/.gitignore +++ b/.gitignore @@ -2,4 +2,6 @@ *.jl.*.cov *.jl.mem data -docs/_build +deps/src +deps/usr +deps/deps.jl diff --git a/deps/build.jl b/deps/build.jl index 00d088d4bc17..6959325c86ea 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -29,38 +29,23 @@ using BinDeps @BinDeps.setup #-------------------------------------------------------------------------------- -# Install dependencies, opencv and blas -opencv_core = library_dependency("opencv_core", aliases=["libopencv_core"]) - +# Install dependencies, blas @linux_only begin - provides(AptGet, "libopencv-dev", opencv_core) - provides(Pacman, "opencv", opencv_core) - provides(Yum, "opencv", opencv_core) - blas = library_dependency("blas", aliases=["libblas","libblas.so.3"]) provides(AptGet, "libblas-dev", blas) provides(Pacman, "blas", blas) provides(Yum, "blas-devel", blas) -end - -@osx_only begin - using Homebrew - provides(Homebrew.HB, "opencv", opencv_core, os = :Darwin) - # OSX has built-in BLAS we could use -end - -@BinDeps.install Dict(:opencv_core => :opencv_core) -@linux_only begin @BinDeps.install Dict(:blas => :blas) end #-------------------------------------------------------------------------------- # Build libmxnet -mxnet = library_dependency("mxnet", aliases=["libmxnet"]) +mxnet = library_dependency("mxnet", aliases=["libmxnet.so"]) prefix = joinpath(BinDeps.depsdir(mxnet), "usr") -srcdir = joinpath(BinDeps.depsdir(mxnet),"src", "libmxnet") +srcdir = joinpath(BinDeps.depsdir(mxnet),"src") +mxdir = joinpath(srcdir, "mxnet") libdir = joinpath(prefix, "lib") provides(BuildProcess, (@build_steps begin @@ -68,11 +53,13 @@ provides(BuildProcess, CreateDirectory(libdir) @build_steps begin ChangeDirectory(srcdir) + `rm -rf mxnet` `git clone --recursive 
https://github.com/dmlc/mxnet` FileRule(joinpath(libdir, "libmxnet.so"), @build_steps begin - ChangeDirectory("mxnet") + ChangeDirectory("$mxdir") + `cp make/config.mk config.mk` @osx_only `cp make/osx.mk config.mk` - @osx_only `echo hahahahahahahaha=================` + `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` `make` `cp lib/libmxnet.so $libdir` end) diff --git a/src/base.jl b/src/base.jl index b3c6cee026dc..cf940c9ef232 100644 --- a/src/base.jl +++ b/src/base.jl @@ -16,7 +16,9 @@ typealias char_pp Ptr{char_p} ################################################################################ # Initialization and library API entrance ################################################################################ -const MXNET_LIB = Libdl.find_library(["libmxnet.so","libmxnet.dll"], ["$(get(ENV,"MXNET_HOME",""))/lib"]) +const MXNET_LIB = Libdl.find_library(["libmxnet.so","libmxnet.dll"], + [joinpath("$(get(ENV,"MXNET_HOME",""))","lib"), + joinpath(Pkg.dir("MXNet"),"deps/usr/lib")]) function __init__() _import_ndarray_functions() From 263e60211d18fe85e4555facba1c798a07173e42 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 23 Oct 2015 00:07:59 -0400 Subject: [PATCH 103/630] update install guide --- docs/user-guide/install.md | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/docs/user-guide/install.md b/docs/user-guide/install.md index ab62c116ed03..eb4e1ecec80d 100644 --- a/docs/user-guide/install.md +++ b/docs/user-guide/install.md @@ -4,7 +4,10 @@ To install MXNet.jl, simply type ```jl Pkg.add("MXNet") ``` -in the Julia REPL. MXNet.jl is built on top of [libmxnet](https://github.com/dmlc/mxnet). Upon installation, Julia will try to automatically download and build libmxnet. If the compilation fails due to unresolved dependency, or if you prefer to work with a customized installation of libmxnet, please see [below](#manual-compilation). +in the Julia REPL. 
MXNet.jl is built on top of [libmxnet](https://github.com/dmlc/mxnet). Upon installation, Julia will try to automatically download and build libmxnet. + +The libmxnet source is downloaded to `Pkg.dir("MXNet")/deps/src/mxnet`. The automatic build is using default configurations, with OpenCV, CUDA disabled. +If the compilation failed due to unresolved dependency, or if you want to customize the build, it is recommended to compile and install libmxnet manually. Please see [below](#manual-compilation) for more details. To use the latest git version of MXNet.jl, use the following command instead ```jl @@ -18,3 +21,9 @@ It is possible to compile libmxnet separately and point MXNet.jl to a the existi To build libmxnet, please refer to [the installation guide of libmxnet](http://mxnet.readthedocs.org/en/latest/build.html). After successfully installing libmxnet, set the `MXNET_HOME` environment variable to the location of libmxnet. In other words, the compiled `libmxnet.so` should be found in `$MXNET_HOME/lib`. When the `MXNET_HOME` environment variable is detected and the corresponding `libmxnet.so` could be loaded successfully, MXNet.jl will skip automatic building during installation and use the specified libmxnet instead. + +Basically, MXNet.jl will search `libmxnet.so` or `libmxnet.dll` in the following paths (and in that order): + +* `$MXNET_HOME/lib`: customized libmxnet builds +* `Pkg.dir("MXNet")/deps/usr/lib`: automatic builds +* Any system wide library search path From 7934f672e2449a6c221bb3088ed40c2c6256a134 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 23 Oct 2015 01:09:49 -0400 Subject: [PATCH 104/630] add release notes for v0.0.1 --- NEWS.md | 8 ++++++++ 1 file changed, 8 insertions(+) create mode 100644 NEWS.md diff --git a/NEWS.md b/NEWS.md new file mode 100644 index 000000000000..6a43caddce02 --- /dev/null +++ b/NEWS.md @@ -0,0 +1,8 @@ +# v0.0.1 (2015.10.23) + +Initial release. + +* Basic libmxnet API. 
+* Basic documentation, overview and MNIST tutorial. +* Working MNIST and cifar-10 examples, with multi-GPU training. +* Automatic building of libmxnet with BinDeps.jl. From 0a32996d656a755f416b3daf4321b5de6b9f7f0f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 23 Oct 2015 07:24:23 -0400 Subject: [PATCH 105/630] fix build script (don't exit Julia) --- deps/build.jl | 111 +++++++++++++++++++++++++------------------------- 1 file changed, 56 insertions(+), 55 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 6959325c86ea..5c0dd2bb749f 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -1,69 +1,70 @@ ################################################################################ # First try to detect and load existing libmxnet ################################################################################ -# if haskey(ENV, "MXNET_HOME") -# info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") -# info("Trying to load existing libmxnet...") -# lib = Libdl.find_library(["libmxnet.so","libmxnet.dll"], ["$(ENV["MXNET_HOME"])/lib"]) -# if !isempty(lib) -# info("Existing libmxnet detected at $lib") -# exit(0) -# else -# info("Failed to load existing libmxnet, trying to build from source...") -# end -# end +libmxnet_detected = false - -################################################################################ -# If not found, try to build automatically using BinDeps -################################################################################ -@windows_only begin - info("Automatic building libxmnet on Windows is currently not supported.") - info("Please follow the libmxnet documentation on how to build manually") - info("or to install pre-build packages:") - info("http://mxnet.readthedocs.org/en/latest/build.html#building-on-windows") - exit(-1) +if haskey(ENV, "MXNET_HOME") + info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") + info("Trying to load existing libmxnet...") + lib = 
Libdl.find_library(["libmxnet.so","libmxnet.dll"], ["$(ENV["MXNET_HOME"])/lib"]) + if !isempty(lib) + info("Existing libmxnet detected at $lib, skip building...") + libmxnet_detected = true + else + info("Failed to load existing libmxnet, trying to build from source...") + end end using BinDeps @BinDeps.setup +if !libmxnet_detected + ################################################################################ + # If not found, try to build automatically using BinDeps + ################################################################################ + @windows_only begin + info("Please follow the libmxnet documentation on how to build manually") + info("or to install pre-build packages:") + info("http://mxnet.readthedocs.org/en/latest/build.html#building-on-windows") + error("Automatic building libxmnet on Windows is currently not supported yet.") + end -#-------------------------------------------------------------------------------- -# Install dependencies, blas -@linux_only begin - blas = library_dependency("blas", aliases=["libblas","libblas.so.3"]) - provides(AptGet, "libblas-dev", blas) - provides(Pacman, "blas", blas) - provides(Yum, "blas-devel", blas) + #-------------------------------------------------------------------------------- + # Install dependencies, blas + @linux_only begin + blas = library_dependency("blas", aliases=["libblas","libblas.so.3"]) + provides(AptGet, "libblas-dev", blas) + provides(Pacman, "blas", blas) + provides(Yum, "blas-devel", blas) - @BinDeps.install Dict(:blas => :blas) -end + @BinDeps.install Dict(:blas => :blas) + end -#-------------------------------------------------------------------------------- -# Build libmxnet -mxnet = library_dependency("mxnet", aliases=["libmxnet.so"]) + #-------------------------------------------------------------------------------- + # Build libmxnet + mxnet = library_dependency("mxnet", aliases=["libmxnet.so"]) -prefix = joinpath(BinDeps.depsdir(mxnet), "usr") -srcdir = 
joinpath(BinDeps.depsdir(mxnet),"src") -mxdir = joinpath(srcdir, "mxnet") -libdir = joinpath(prefix, "lib") -provides(BuildProcess, - (@build_steps begin - CreateDirectory(srcdir) - CreateDirectory(libdir) - @build_steps begin - ChangeDirectory(srcdir) - `rm -rf mxnet` - `git clone --recursive https://github.com/dmlc/mxnet` - FileRule(joinpath(libdir, "libmxnet.so"), @build_steps begin - ChangeDirectory("$mxdir") - `cp make/config.mk config.mk` - @osx_only `cp make/osx.mk config.mk` - `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` - `make` - `cp lib/libmxnet.so $libdir` - end) - end - end), mxnet) + _prefix = joinpath(BinDeps.depsdir(mxnet), "usr") + _srcdir = joinpath(BinDeps.depsdir(mxnet),"src") + _mxdir = joinpath(_srcdir, "mxnet") + _libdir = joinpath(_prefix, "lib") + provides(BuildProcess, + (@build_steps begin + CreateDirectory(_srcdir) + CreateDirectory(_libdir) + @build_steps begin + ChangeDirectory(_srcdir) + `rm -rf mxnet` + `git clone --recursive https://github.com/dmlc/mxnet` + FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin + ChangeDirectory("$_mxdir") + `cp make/config.mk config.mk` + @osx_only `cp make/osx.mk config.mk` + `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` + `make` + `cp lib/libmxnet.so $_libdir` + end) + end + end), mxnet) @BinDeps.install Dict(:mxnet => :mxnet) +end From 48f423017989d720ed8af3d88b3eb08a9a3272a6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 23 Oct 2015 07:52:47 -0400 Subject: [PATCH 106/630] update news for bugfix v0.0.2 --- NEWS.md | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/NEWS.md b/NEWS.md index 6a43caddce02..53c3f2e5418d 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,7 @@ +# v0.0.2 (2015.10.23) + +* Fix a bug in build script that causes Julia REPL to exit. + # v0.0.1 (2015.10.23) Initial release. @@ -6,3 +10,4 @@ Initial release. * Basic documentation, overview and MNIST tutorial. * Working MNIST and cifar-10 examples, with multi-GPU training. 
* Automatic building of libmxnet with BinDeps.jl. + From 119fac1eddccb052e327b4ab88e2a6828ffa9d8a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 24 Oct 2015 20:39:15 -0400 Subject: [PATCH 107/630] update kvstore doc. --- docs/user-guide/overview.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md index 33567bd7817d..3155b281245d 100644 --- a/docs/user-guide/overview.md +++ b/docs/user-guide/overview.md @@ -261,4 +261,7 @@ mx.init!(kv, key, mx.ones(shape)*2) a = mx.empty(shape) mx.pull!(kv, key, a) # pull value into a println(copy(a)) +# => +# Float32[2.0 2.0 2.0 +# 2.0 2.0 2.0] ``` From d738fba18ebf731bf4f7306d81056fc63357810a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 24 Oct 2015 21:31:13 -0400 Subject: [PATCH 108/630] NDArray save and load API --- src/ndarray.jl | 59 ++++++++++++++++++++++++++++++++++++++++ test/unittest/ndarray.jl | 41 ++++++++++++++++++++++++++++ 2 files changed, 100 insertions(+) diff --git a/src/ndarray.jl b/src/ndarray.jl index c3207b8aa963..2ae28b3a48a4 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -352,6 +352,65 @@ function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) div_from!(ret, arg) end +#------------------------------------------------------------ +# IO +#------------------------------------------------------------ +"""Load NDArrays from binary file. + +**Parameters**: + +* `filename`: the path of the file to load. It could be S3 or HDFS address + if the `libmxnet` is built with the corresponding component enabled. Examples + + * `s3://my-bucket/path/my-s3-ndarray` + * `hdfs://my-bucket/path/my-hdfs-ndarray` + * `/path-to/my-local-ndarray` + +**Returns**: + + Either `Dict{Base.Symbol, NDArray}` or `Vector{NDArray}`. 
+""" +function load_ndarrays(filename::AbstractString) + out_size = Ref{MX_uint}(0) + out_hdrs = Ref{Ptr{MX_handle}}(0) + out_name_size = Ref{MX_uint}(0) + out_names = Ref{char_pp}(0) + @mxcall(:MXNDArrayLoad, (char_p, Ref{MX_uint}, Ref{Ptr{MX_handle}}, Ref{MX_uint}, Ref{char_pp}), + filename, out_size, out_hdrs, out_name_size, out_names) + out_name_size = out_name_size[] + out_size = out_size[] + if out_name_size == 0 + return [NDArray(MX_NDArrayHandle(hdr)) for hdr in pointer_to_array(out_hdrs[], out_size)] + else + @assert out_size == out_name_size + return Dict([(symbol(bytestring(k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in + zip(pointer_to_array(out_names[], out_size), pointer_to_array(out_hdrs[], out_size))]) + end +end + +"""Save NDarrays to binary file. + +**Parameters**: + +* `filename`: path to the binary file to write to. +* `data`: an `NDArray`, or a `Vector{NDArray}` or a `Dict{Base.Symbol, NDArray}`. +""" +function save_ndarrays(filename::AbstractString, data::NDArray) + save_ndarrays(filename, [data]) +end +function save_ndarrays(filename::AbstractString, data::Vector{NDArray}) + @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), + filename, length(data), MX_handle[data...], char_pp(0)) +end +function save_ndarrays(filename::AbstractString, data::Dict{Base.Symbol,NDArray}) + names = [k for k in keys(data)] + arrays = MX_handle[data[k] for k in names] + names = AbstractString[string(k) for k in names] + + @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), + filename, length(names), arrays, names) +end + ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 7d5df826f32b..565846154b0b 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -176,6 +176,46 @@ function 
test_gd() end +function test_saveload() + n_arrays = 5 + info("NDArray::saveload::n_arrays = $n_arrays") + fname = tempname() + + # save and load a single array + dims = rand_dims() + j_array, nd_array = rand_tensors(dims) + mx.save_ndarrays(fname, nd_array) + data = mx.load_ndarrays(fname) + @test isa(data, Vector{mx.NDArray}) + @test length(data) == 1 + @test reldiff(copy(data[1]), j_array) < 1e-6 + + # save and load N arrays of different shape + arrays = [rand_tensors(rand_dims()) for i = 1:n_arrays] + nd_arrays = [x[2] for x in arrays] + mx.save_ndarrays(fname, nd_arrays) + data = mx.load_ndarrays(fname) + @test isa(data, Vector{mx.NDArray}) + @test length(data) == n_arrays + for i = 1:n_arrays + @test reldiff(copy(data[i]), arrays[i][1]) < 1e-6 + end + + # save and load dictionary of ndarrays + names = [symbol("array$i") for i = 1:n_arrays] + dict = Dict([n => v for (n,v) in zip(names, nd_arrays)]) + mx.save_ndarrays(fname, dict) + data = mx.load_ndarrays(fname) + @test isa(data, Dict{Symbol, mx.NDArray}) + @test length(data) == n_arrays + for i = 1:n_arrays + @test reldiff(copy(data[names[i]]), arrays[i][1]) < 1e-6 + end + + rm(fname) +end + + ################################################################################ # Run tests ################################################################################ @@ -187,5 +227,6 @@ test_minus() test_mul() test_div() test_gd() +test_saveload() end From 4e5e152cccf0176cf5e9be5674ddcc01ab4ef9cb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 24 Oct 2015 21:42:40 -0400 Subject: [PATCH 109/630] gradient clipping --- docs/api/ndarray.md | 77 ++++++++++++++++++++++++++++++++-------- docs/api/symbol.md | 36 +++++++++---------- src/optimizers/sgd.jl | 17 ++++----- test/unittest/ndarray.jl | 16 +++++++++ 4 files changed, 106 insertions(+), 40 deletions(-) diff --git a/docs/api/ndarray.md b/docs/api/ndarray.md index c09b80ea0ab2..87e664ffb0cc 100644 --- a/docs/api/ndarray.md +++ b/docs/api/ndarray.md @@ -32,7 
+32,7 @@ object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs wi *source:* -[MXNet/src/ndarray.jl:380](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L380) +[MXNet/src/ndarray.jl:453](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L453) --- @@ -41,7 +41,7 @@ object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs wi Copy data from NDArray to Julia Array *source:* -[MXNet/src/ndarray.jl:187](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L187) +[MXNet/src/ndarray.jl:198](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L198) --- @@ -50,7 +50,7 @@ Copy data from NDArray to Julia Array Copy data between NDArrays *source:* -[MXNet/src/ndarray.jl:175](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L175) +[MXNet/src/ndarray.jl:186](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L186) --- @@ -59,7 +59,7 @@ Copy data between NDArrays Copy data from Julia Array to NDArray *source:* -[MXNet/src/ndarray.jl:195](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L195) +[MXNet/src/ndarray.jl:206](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L206) --- @@ -68,7 +68,7 @@ Copy data from Julia Array to NDArray Create copy: NDArray -> Julia Array *source:* -[MXNet/src/ndarray.jl:205](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L205) +[MXNet/src/ndarray.jl:216](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L216) --- @@ -77,7 +77,7 @@ Create copy: NDArray -> Julia Array Create copy: NDArray -> NDArray in a given context *source:* 
-[MXNet/src/ndarray.jl:211](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L211) +[MXNet/src/ndarray.jl:222](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L222) --- @@ -86,7 +86,41 @@ Create copy: NDArray -> NDArray in a given context Create copy: Julia Array -> NDArray in a given context *source:* -[MXNet/src/ndarray.jl:217](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L217) +[MXNet/src/ndarray.jl:228](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L228) + +--- + + +#### getindex(arr::MXNet.mx.NDArray, ::Colon) +Shortcut for `slice`. **NOTE** the behavior for Julia's built-in index slicing is to create a +copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. + + +*source:* +[MXNet/src/ndarray.jl:174](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L174) + +--- + + +#### load_ndarrays(filename::AbstractString) +Load NDArrays from binary file. + +**Parameters**: + +* `filename`: the path of the file to load. It could be S3 or HDFS address + if the `libmxnet` is built with the corresponding component enabled. Examples + + * `s3://my-bucket/path/my-s3-ndarray` + * `hdfs://my-bucket/path/my-hdfs-ndarray` + * `/path-to/my-local-ndarray` + +**Returns**: + + Either `Dict{Base.Symbol, NDArray}` or `Vector{NDArray}`. 
+ + +*source:* +[MXNet/src/ndarray.jl:373](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L373) --- @@ -95,7 +129,22 @@ Create copy: Julia Array -> NDArray in a given context Create NDArray and initialize with 1 *source:* -[MXNet/src/ndarray.jl:118](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L118) +[MXNet/src/ndarray.jl:118](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L118) + +--- + + +#### save_ndarrays(filename::AbstractString, data::MXNet.mx.NDArray) +Save NDarrays to binary file. + +**Parameters**: + +* `filename`: path to the binary file to write to. +* `data`: an `NDArray`, or a `Vector{NDArray}` or a `Dict{Base.Symbol, NDArray}`. + + +*source:* +[MXNet/src/ndarray.jl:398](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L398) --- @@ -104,7 +153,7 @@ Create NDArray and initialize with 1 Assign all elements of an NDArray to a scalar *source:* -[MXNet/src/ndarray.jl:155](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L155) +[MXNet/src/ndarray.jl:155](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L155) --- @@ -116,7 +165,7 @@ Get the shape of an `NDArray`. Note the shape is converted to Julia convention. 
*source:* -[MXNet/src/ndarray.jl:84](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L84) +[MXNet/src/ndarray.jl:84](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L84) --- @@ -130,7 +179,7 @@ used in data parallelization to split mini-batch into sub-batches for different *source:* -[MXNet/src/ndarray.jl:137](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L137) +[MXNet/src/ndarray.jl:137](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L137) --- @@ -139,7 +188,7 @@ used in data parallelization to split mini-batch into sub-batches for different Create zero-ed NDArray of specific shape *source:* -[MXNet/src/ndarray.jl:105](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L105) +[MXNet/src/ndarray.jl:105](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L105) --- @@ -157,7 +206,7 @@ have shape (28,28,1,100). *source:* -[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L32) +[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L32) --- @@ -185,5 +234,5 @@ which will do inplace adding of the contents of b into a. 
*source:* -[MXNet/src/ndarray.jl:247](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/ndarray.jl#L247) +[MXNet/src/ndarray.jl:258](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L258) diff --git a/docs/api/symbol.md b/docs/api/symbol.md index 1ccd875896b9..d263bb4fcbc2 100644 --- a/docs/api/symbol.md +++ b/docs/api/symbol.md @@ -4,21 +4,30 @@ --- - -#### get_internals(self::MXNet.mx.Symbol) -Get a new grouped symbol whose output contains all the internal outputs of this symbol. + +#### Group(symbols::MXNet.mx.Symbol...) +Create a symbol that groups symbols together *source:* -[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/symbol.jl#L63) +[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/symbol.jl#L77) --- - -#### group(symbols::MXNet.mx.Symbol...) -Create a symbol that groups symbols together + +#### Variable(name::Union{AbstractString, Symbol}) +Create a symbolic variable with the given name + +*source:* +[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/symbol.jl#L70) + +--- + + +#### get_internals(self::MXNet.mx.Symbol) +Get a new grouped symbol whose output contains all the internal outputs of this symbol. *source:* -[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/symbol.jl#L77) +[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/symbol.jl#L63) --- @@ -33,14 +42,5 @@ Most operators do not have Auxiliary states. 
*source:* -[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/symbol.jl#L58) - ---- - - -#### variable(name::Union{AbstractString, Symbol}) -Create a symbolic variable with the given name - -*source:* -[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/92237212c594440455567ec4d39caec909ddd11e/src/symbol.jl#L70) +[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/symbol.jl#L58) diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index 4e6a6757fb67..b910e2c3d6b6 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -41,17 +41,18 @@ function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, s lr = get_learning_rate(self.opts.lr_scheduler, self.iter) grad_scale = self.opts.grad_scale / self.batch_size + grad = grad_scale * grad + if self.opts.grad_clip > 0 + grad = clip(grad, -self.opts.grad_clip, self.opts.grad_clip) + end + if isa(state, Void) - @inplace weight += -lr * (grad_scale * grad + self.opts.weight_decay * weight) + @inplace weight += -lr * (grad + self.opts.weight_decay * weight) else mom = state :: NDArray coef = get_momentum(self.opts.mom_scheduler, self.iter) - @inplace mom .*= coef - if self.opts.grad_clip > 0 - # TODO: - else - @inplace mom += -lr * (grad_scale * grad + self.opts.weight_decay * weight) - end - @inplace weight += mom + @inplace mom .*= coef + @inplace mom .+= -lr * (grad + self.opts.weight_decay * weight) + @inplace weight .+= mom end end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 565846154b0b..9a6f916ab556 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -215,6 +215,21 @@ function test_saveload() rm(fname) end +function test_clip() + dims = rand_dims() + info("NDArray::clip::dims = $dims") + + j_array, nd_array = rand_tensors(dims) + clip_up = maximum(abs(j_array)) / 2 + clip_down = 0 + clipped = mx.clip(nd_array, 
clip_down, clip_up) + + # make sure the original array is not modified + @test reldiff(copy(nd_array), j_array) < 1e-6 + + @test all(clip_down .<= copy(clipped) .<= clip_up) +end + ################################################################################ # Run tests @@ -228,5 +243,6 @@ test_mul() test_div() test_gd() test_saveload() +test_clip() end From 9d138da15de27ff86b72c3156770e9e0cba141fa Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 24 Oct 2015 22:10:19 -0400 Subject: [PATCH 110/630] save and load for symbol --- src/ndarray.jl | 14 +++++++++----- src/symbol.jl | 18 ++++++++++++++++++ test/unittest/ndarray.jl | 22 ++++++++++++++++------ 3 files changed, 43 insertions(+), 11 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 2ae28b3a48a4..00edc6c7c671 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -370,7 +370,7 @@ end Either `Dict{Base.Symbol, NDArray}` or `Vector{NDArray}`. """ -function load_ndarrays(filename::AbstractString) +function load(filename::AbstractString, ::Type{NDArray}) out_size = Ref{MX_uint}(0) out_hdrs = Ref{Ptr{MX_handle}}(0) out_name_size = Ref{MX_uint}(0) @@ -395,14 +395,14 @@ end * `filename`: path to the binary file to write to. * `data`: an `NDArray`, or a `Vector{NDArray}` or a `Dict{Base.Symbol, NDArray}`. 
""" -function save_ndarrays(filename::AbstractString, data::NDArray) - save_ndarrays(filename, [data]) +function save(filename::AbstractString, data::NDArray) + save(filename, [data]) end -function save_ndarrays(filename::AbstractString, data::Vector{NDArray}) +function save(filename::AbstractString, data::Vector{NDArray}) @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), filename, length(data), MX_handle[data...], char_pp(0)) end -function save_ndarrays(filename::AbstractString, data::Dict{Base.Symbol,NDArray}) +function save(filename::AbstractString, data::Dict{Base.Symbol,NDArray}) names = [k for k in keys(data)] arrays = MX_handle[data[k] for k in names] names = AbstractString[string(k) for k in names] @@ -425,6 +425,10 @@ end ACCEPT_EMPTY_MUTATE_TARGET = (1 << 2) ) +# Import corresponding math functions from base so the automatically defined libmxnet +# functions can overload them +import Base: sqrt + """ Import dynamic functions for NDArrays. The arguments to the functions are typically ordered as diff --git a/src/symbol.jl b/src/symbol.jl index 097fe1d5b20a..a1f008c29cd3 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -229,12 +229,30 @@ function _compose!(sym :: Symbol, name :: Union{Base.Symbol, char_p}, args::Symb return sym end +"""Save Symbol into a JSON string""" function to_json(self :: Symbol) ref_json = Ref{char_p}(0) @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json) return bytestring(ref_json[]) end +"""Load Symbol from a JSON string representation.""" +function from_json(repr :: AbstractString, ::Type{Symbol}) + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXSymbolCreateFromJSON, (char_p, Ref{MX_handle}), repr, ref_hdr) + return Symbol(MX_SymbolHandle(ref_hdr[])) +end + +"""Load Symbol from a JSON file.""" +function load(filename :: AbstractString, ::Type{Symbol}) + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXSymbolCreateFromFile, (char_p, Ref{MX_handle}), filename, ref_hdr) + return 
Symbol(MX_SymbolHandle(ref_hdr[])) +end +function save(filename :: AbstractString, sym :: Symbol) + @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), sym, filename) +end + ################################################################################ # Atomic Symbol functions dynamically imported from libmxnet ################################################################################ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 9a6f916ab556..cfab1dea0d86 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -184,8 +184,8 @@ function test_saveload() # save and load a single array dims = rand_dims() j_array, nd_array = rand_tensors(dims) - mx.save_ndarrays(fname, nd_array) - data = mx.load_ndarrays(fname) + mx.save(fname, nd_array) + data = mx.load(fname, mx.NDArray) @test isa(data, Vector{mx.NDArray}) @test length(data) == 1 @test reldiff(copy(data[1]), j_array) < 1e-6 @@ -193,8 +193,8 @@ function test_saveload() # save and load N arrays of different shape arrays = [rand_tensors(rand_dims()) for i = 1:n_arrays] nd_arrays = [x[2] for x in arrays] - mx.save_ndarrays(fname, nd_arrays) - data = mx.load_ndarrays(fname) + mx.save(fname, nd_arrays) + data = mx.load(fname, mx.NDArray) @test isa(data, Vector{mx.NDArray}) @test length(data) == n_arrays for i = 1:n_arrays @@ -204,8 +204,8 @@ function test_saveload() # save and load dictionary of ndarrays names = [symbol("array$i") for i = 1:n_arrays] dict = Dict([n => v for (n,v) in zip(names, nd_arrays)]) - mx.save_ndarrays(fname, dict) - data = mx.load_ndarrays(fname) + mx.save(fname, dict) + data = mx.load(fname, mx.NDArray) @test isa(data, Dict{Symbol, mx.NDArray}) @test length(data) == n_arrays for i = 1:n_arrays @@ -230,6 +230,15 @@ function test_clip() @test all(clip_down .<= copy(clipped) .<= clip_up) end +function test_sqrt() + dims = rand_dims() + info("NDArray::sqrt::dims = $dims") + + j_array, nd_array = rand_tensors(dims) + sqrt_ed = sqrt(nd_array) + @test 
reldiff(copy(sqrt_ed), sqrt(j_array)) < 1e-6 +end + ################################################################################ # Run tests @@ -244,5 +253,6 @@ test_div() test_gd() test_saveload() test_clip() +test_sqrt() end From 30f89a8efa4b30d96a97245cbc51a66bff48707e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 24 Oct 2015 22:13:25 -0400 Subject: [PATCH 111/630] unit test for symbol save and load --- test/unittest/symbol.jl | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/test/unittest/symbol.jl b/test/unittest/symbol.jl index fecb25c159a8..3397b7eaf70d 100644 --- a/test/unittest/symbol.jl +++ b/test/unittest/symbol.jl @@ -69,6 +69,18 @@ function test_infer_shape_error() @test_throws mx.MXError mx.infer_shape(model, data=data_shape, fc1_weight=weight_shape) end +function test_saveload() + info("Symbol::saveload::mlp2") + + model = mlp2() + fname = tempname() + mx.save(fname, model) + model2 = mx.load(fname, mx.Symbol) + @test mx.to_json(model) == mx.to_json(model2) + + rm(fname) +end + ################################################################################ # Run tests @@ -78,5 +90,6 @@ test_internal() test_compose() test_infer_shape() test_infer_shape_error() +test_saveload() end From 7e86c8f7f001977f5429762112824b0a7d50e32f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 00:09:46 -0400 Subject: [PATCH 112/630] improve defstruct macro --- src/base.jl | 25 ++++++++++++++++--------- 1 file changed, 16 insertions(+), 9 deletions(-) diff --git a/src/base.jl b/src/base.jl index cf940c9ef232..5e547de727c1 100644 --- a/src/base.jl +++ b/src/base.jl @@ -157,35 +157,42 @@ the keyword arguments. 
""" macro defstruct(name, super_name, fields) @assert fields.head == :tuple - fields = fields.args + fields = fields.args @assert length(fields) > 0 - name = esc(name) + name = esc(name) + super_name = esc(super_name) field_defs = Array(Expr, length(fields)) # :(field2 :: Int) - field_names = Array(Base.Symbol, length(fields)) # :field2 - field_defaults = Array(Expr, length(fields)) # :(field2 :: Int = 0) + field_names = Array(Expr, length(fields)) # :field2 + field_defaults = Array(Expr, length(fields)) # :(field2 = 0) + field_types = Array(Expr, length(fields)) # Int field_asserts = Array(Expr, length(fields)) # :(field2 >= 0) for i = 1:length(fields) field = fields[i] if field.head == :tuple - field_asserts[i] = field.args[2] + field_asserts[i] = esc(field.args[2]) field = field.args[1] end - field_defs[i] = esc(field.args[1]) - field_names[i] = field.args[1].args[1] - field_defaults[i] = Expr(:kw, field.args...) + field_defs[i] = esc(field.args[1]) + field_names[i] = esc(field.args[1].args[1]) + field_types[i] = esc(field.args[1].args[2]) + field_defaults[i] = Expr(:kw, field.args[1].args[1], esc(field.args[2])) end # body of layer type, defining fields type_body = Expr(:block, field_defs...) # constructor + converts = map(zip(field_names, field_types)) do param + f_name, f_type = param + :($f_name = convert($f_type, $f_name)) + end asserts = map(filter(i -> isdefined(field_asserts,i), 1:length(fields))) do i :(@assert($(field_asserts[i]))) end construct = Expr(:call, name, field_names...) 
- ctor_body = Expr(:block, asserts..., construct) + ctor_body = Expr(:block, converts..., asserts..., construct) ctor_def = Expr(:call, name, Expr(:parameters, field_defaults...)) ctor = Expr(:(=), ctor_def, ctor_body) From 00bd457366d3e7bc12ca7507bbeb3eeba87df872 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 00:10:15 -0400 Subject: [PATCH 113/630] callback interface --- src/MXNet.jl | 1 + src/callback.jl | 48 ++++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 49 insertions(+) create mode 100644 src/callback.jl diff --git a/src/MXNet.jl b/src/MXNet.jl index 0e56b743d5d5..9f404a077aed 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -25,6 +25,7 @@ include("initializer.jl") include("io.jl") include("kvstore.jl") +include("callback.jl") include("estimator.jl") include("util.jl") diff --git a/src/callback.jl b/src/callback.jl new file mode 100644 index 000000000000..c9e5a39c3693 --- /dev/null +++ b/src/callback.jl @@ -0,0 +1,48 @@ +"Abstract type of callback functions used in training" +abstract AbstractCallback + +"Abstract type of callbacks to be called every mini-batch" +abstract AbstractIterationCallback + +"Abstract type of callbacks to be called every epoch" +abstract AbstractEpochCallback + +type CallbackParams + batch_size :: Int + curr_epoch :: Int + curr_iter :: Int +end +CallbackParams(batch_size::Int) = CallbackParams(batch_size, 0, 0) + +type IterationCallback + frequency :: Int + call_on_0 :: Bool + callback :: Function +end + +function every_n_iter(callback :: Function, n :: Int, call_on_0 :: Bool = false) + IterationCallback(n, call_on_0, callback) +end +function Base.call(cb :: IterationCallback, param :: CallbackParams) + if param.curr_iter == 0 + if cb.call_on_0 + cb.callback(param) + end + elseif param.curr_iter % cb.frequency == 0 + cb.callback(param) + end +end + +function speedometer(frequency::Int=50) + cl_tic = 0 + every_n_iter(frequency, true) do params :: CallbackParams + if param.curr_iter == 0 + # reset 
counter + cl_tic = time() + else + speed = frequency * params.batch_size / (time() - cl_tic) + info("Speed: {1:>6.2} samples/sec", speed) + cl_tic = time() + end + end +end From 06879c6ab6233529e42fcc96a1c01cecbd006d40 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 00:28:06 -0400 Subject: [PATCH 114/630] fix estimator API --- README.md | 2 +- docs/tutorials/mnist.md | 6 ++-- examples/cifar10/cifar10.jl | 2 +- examples/mnist/lenet.jl | 2 +- examples/mnist/mlp.jl | 2 +- src/callback.jl | 22 ++++++++++++- src/estimator.jl | 63 ++++++++++++++++++++++++++----------- 7 files changed, 72 insertions(+), 27 deletions(-) diff --git a/README.md b/README.md index acf0fca121fb..c184eac57178 100644 --- a/README.md +++ b/README.md @@ -33,7 +33,7 @@ estimator = mx.FeedForward(mlp, context=mx.cpu()) optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) +mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) ``` For more details, please refer to the [document](http://mxnetjl.readthedocs.org/) and [examples](examples). diff --git a/docs/tutorials/mnist.md b/docs/tutorials/mnist.md index 219d8936f686..97a12e8aadeb 100644 --- a/docs/tutorials/mnist.md +++ b/docs/tutorials/mnist.md @@ -55,9 +55,9 @@ The last thing we need to specify is the optimization algorithm (a.k.a. *optimiz ```julia optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) ``` -Now we can do the training. Here the `epoch_stop` parameter specifies that we want to train for 20 epochs. We also supply a `eval_data` to monitor validation accuracy on the validation set. +Now we can do the training. Here the `n_epoch` parameter specifies that we want to train for 20 epochs. We also supply a `eval_data` to monitor validation accuracy on the validation set. 
```julia -mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) +mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) ``` Here is a sample output ``` @@ -130,7 +130,7 @@ estimator = mx.FeedForward(lenet, context=mx.gpu()) optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) +mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) ``` And here is a sample of running outputs: ``` diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index 50d399e32d5e..968781a5257c 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -82,5 +82,5 @@ optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), weight_decay=0.0001) # fit parameters -mx.fit(estimator, optimizer, train_provider, epoch_stop=num_epoch, eval_data=test_provider, +mx.fit(estimator, optimizer, train_provider, n_epoch=num_epoch, eval_data=test_provider, initializer=mx.UniformInitializer(0.07)) diff --git a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl index af631e44c3bc..92f41e88aeb6 100644 --- a/examples/mnist/lenet.jl +++ b/examples/mnist/lenet.jl @@ -42,4 +42,4 @@ estimator = mx.FeedForward(lenet, context=mx.gpu()) optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) +mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 66e1bdac49a8..26aa4ecfda49 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -34,4 +34,4 @@ estimator = mx.FeedForward(mlp, context=mx.cpu()) optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(estimator, optimizer, train_provider, epoch_stop=20, eval_data=eval_provider) +mx.fit(estimator, 
optimizer, train_provider, n_epoch=20, eval_data=eval_provider) diff --git a/src/callback.jl b/src/callback.jl index c9e5a39c3693..9a2af79ded42 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -14,7 +14,7 @@ type CallbackParams end CallbackParams(batch_size::Int) = CallbackParams(batch_size, 0, 0) -type IterationCallback +type IterationCallback <: AbstractIterationCallback frequency :: Int call_on_0 :: Bool callback :: Function @@ -46,3 +46,23 @@ function speedometer(frequency::Int=50) end end end + + +type EpochCallback <: AbstractEpochCallback + frequency :: Int + call_on_0 :: Bool + callback :: Function +end + +function every_n_epoch(callback :: Function, n :: Int, call_on_0 :: Bool = false) + EpochCallback(n, call_on_0, callback) +end +function Base.call(cb :: EpochCallback, param :: CallbackParams) + if param.curr_epoch == 0 + if cb.call_on_0 + cb.callback(param) + end + elseif param.curr_epoch % cb.frequency == 0 + cb.callback(param) + end +end diff --git a/src/estimator.jl b/src/estimator.jl index 42402d0a2bdf..fc0e55af052a 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -92,12 +92,25 @@ function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params : return (kv, update_on_kvstore) end -function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; - initializer :: AbstractInitializer = UniformInitializer(0.01), - epoch_stop :: Int = 10, epoch_start :: Int = 1, - eval_data :: Union{Void, AbstractDataProvider} = nothing, - eval_metric :: AbstractEvalMetric = Accuracy(), - kvstore :: Union{Base.Symbol, KVStore} = :local) +@defstruct TrainingOptions Any ( + initializer :: AbstractInitializer = UniformInitializer(0.01), + n_epoch :: Int = 10, + eval_data :: Union{Void, AbstractDataProvider} = nothing, + eval_metric :: AbstractEvalMetric = Accuracy(), + kvstore :: Union{Base.Symbol, KVStore} = :local, + callbacks :: Vector{AbstractCallback} = AbstractCallback[], +) + +function 
_invoke_callbacks(callbacks::Vector{AbstractCallback}, param::CallbackParams, type_filter::Type) + map(callbacks) do cb + if isa(cb, type_filter) + cb(param) + end + end +end + +function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) + opts = TrainingOptions(; kwargs...) info("Start training on $(self.ctx)") @@ -107,9 +120,10 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # initialize parameters info("Initializing parameters...") - arg_names, param_names, aux_names = _init_params(self, data, initializer) + arg_names, param_names, aux_names = _init_params(self, data, opts.initializer) # setup kvstore + kvstore = opts.kvstore if isa(kvstore, Base.Symbol) info("Creating KVStore...") kvstore, update_on_kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params) @@ -139,6 +153,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra grad_arrays = [NDArray[exec.grad_arrays[i] for exec in train_execs] for i in param_idx] optimizer.batch_size = batch_size + cb_param = CallbackParams(batch_size) if !update_on_kvstore updater = get_updater(optimizer) @@ -169,11 +184,19 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra cpu_label_arrays = [empty(shape, cpu_dev) for (name,shape) in provide_label(data)] cpu_label_arrays_full_slice = [SlicedNDArray[(1:batch_size, x)] for x in cpu_label_arrays] + # invoke callbacks on epoch 0 + _invoke_callbacks(opts.callbacks, cb_param, AbstractEpochCallback) + # now start training... 
- for i_epoch = epoch_start:epoch_stop + for i_epoch = 1:opts.n_epoch time_start = time() - reset!(eval_metric) - n_batch = 0 + reset!(opts.eval_metric) + + cb_param.curr_epoch = i_epoch + cb_param.curr_iter = 0 + + # invoke callbacks on iteration 0 + _invoke_callbacks(opts.callbacks, cb_param, AbstractIterationCallback) for batch in data load_data!(batch, data_arrays) @@ -218,30 +241,32 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end end - n_batch += 1 + # invoke callbacks after finishing each iteration + _invoke_callbacks(opts.callbacks, cb_param, AbstractIterationCallback) + cb_param.curr_iter += 1 # update evaluation metric on training set load_label!(batch, cpu_label_arrays_full_slice) - update!(eval_metric, cpu_label_arrays, cpu_output_arrays) + update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) end # end of one epoch time_stop = time() info(format("== Epoch {1:0>3d} ==========", i_epoch)) info("## Training summary") - for (name, value) in get(eval_metric) + for (name, value) in get(opts.eval_metric) info(format("{1:>15s} = {2:.4f}", name, value)) end info(format("{1:>15s} = {2:.4f} seconds", "time", time_stop-time_start)) # evaluation on validation set - if !isa(eval_data, Void) + if !isa(opts.eval_data, Void) # because we are re-using the memory allocated for the training network, # the batch_size of the validation dataset must be the same as the training # batch_size - @assert(get_batch_size(eval_data) == batch_size) + @assert(get_batch_size(opts.eval_data) == batch_size) - reset!(eval_metric) - for batch in eval_data + reset!(opts.eval_metric) + for batch in opts.eval_data load_data!(batch, data_arrays) # forward and backward @@ -254,11 +279,11 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end end load_label!(batch, cpu_label_arrays_full_slice) - update!(eval_metric, cpu_label_arrays, cpu_output_arrays) + update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) 
end info("## Validation summary") - for (name, value) in get(eval_metric) + for (name, value) in get(opts.eval_metric) info(format("{1:>15s} = {2:.4f}", name, value)) end end From f551c91cd5ea3eb59ea11630fbdb48ca485cbf20 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 00:29:00 -0400 Subject: [PATCH 115/630] add speedometer to cifar10 --- examples/cifar10/cifar10.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index 968781a5257c..7b335d3b1219 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -83,4 +83,4 @@ optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), # fit parameters mx.fit(estimator, optimizer, train_provider, n_epoch=num_epoch, eval_data=test_provider, - initializer=mx.UniformInitializer(0.07)) + initializer=mx.UniformInitializer(0.07), callbacks=[mx.speedometer()]) From cb067c34dd5ad73c9435cd30ece24416a2969f03 Mon Sep 17 00:00:00 2001 From: pluskid Date: Sun, 25 Oct 2015 00:36:32 -0400 Subject: [PATCH 116/630] fix speedometer --- src/callback.jl | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/src/callback.jl b/src/callback.jl index 9a2af79ded42..f2a3ef93058f 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -2,10 +2,10 @@ abstract AbstractCallback "Abstract type of callbacks to be called every mini-batch" -abstract AbstractIterationCallback +abstract AbstractIterationCallback <: AbstractCallback "Abstract type of callbacks to be called every epoch" -abstract AbstractEpochCallback +abstract AbstractEpochCallback <: AbstractCallback type CallbackParams batch_size :: Int @@ -35,13 +35,13 @@ end function speedometer(frequency::Int=50) cl_tic = 0 - every_n_iter(frequency, true) do params :: CallbackParams + every_n_iter(frequency, true) do param :: CallbackParams if param.curr_iter == 0 # reset counter cl_tic = time() else - speed = frequency * params.batch_size / (time() - cl_tic) - 
info("Speed: {1:>6.2} samples/sec", speed) + speed = frequency * param.batch_size / (time() - cl_tic) + info(format("Speed: {1:>6.2f} samples/sec", speed)) cl_tic = time() end end From f7d7ce3a107d7884e03f77410e60a57ace8f6b52 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 01:16:47 -0400 Subject: [PATCH 117/630] save checkpoints in callbacks --- src/callback.jl | 21 ++++++++++++++------- src/estimator.jl | 44 +++++++++++++++++++++++++++++++++++++++----- src/ndarray.jl | 5 ++++- 3 files changed, 57 insertions(+), 13 deletions(-) diff --git a/src/callback.jl b/src/callback.jl index f2a3ef93058f..c124c9b9357c 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -20,7 +20,7 @@ type IterationCallback <: AbstractIterationCallback callback :: Function end -function every_n_iter(callback :: Function, n :: Int, call_on_0 :: Bool = false) +function every_n_iter(callback :: Function, n :: Int; call_on_0 :: Bool = false) IterationCallback(n, call_on_0, callback) end function Base.call(cb :: IterationCallback, param :: CallbackParams) @@ -33,9 +33,9 @@ function Base.call(cb :: IterationCallback, param :: CallbackParams) end end -function speedometer(frequency::Int=50) +function speedometer(;frequency::Int=50) cl_tic = 0 - every_n_iter(frequency, true) do param :: CallbackParams + every_n_iter(frequency, call_on_0=true) do param :: CallbackParams if param.curr_iter == 0 # reset counter cl_tic = time() @@ -54,15 +54,22 @@ type EpochCallback <: AbstractEpochCallback callback :: Function end -function every_n_epoch(callback :: Function, n :: Int, call_on_0 :: Bool = false) +function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end -function Base.call(cb :: EpochCallback, param :: CallbackParams) +function Base.call(cb :: EpochCallback, estimator :: Any, param :: CallbackParams) if param.curr_epoch == 0 if cb.call_on_0 - cb.callback(param) + cb.callback(estimator, param) end elseif 
param.curr_epoch % cb.frequency == 0 - cb.callback(param) + cb.callback(estimator, param) + end +end + +function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) + mkpath(dirname(prefix)) + every_n_epoch(frequency, call_on_0=save_epoch_0) do estimator, param + save_checkpoint(estimator, prefix, param) end end diff --git a/src/estimator.jl b/src/estimator.jl index fc0e55af052a..ad436ef359bf 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -101,10 +101,15 @@ end callbacks :: Vector{AbstractCallback} = AbstractCallback[], ) -function _invoke_callbacks(callbacks::Vector{AbstractCallback}, param::CallbackParams, type_filter::Type) +function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, param::CallbackParams, type_filter::Type) map(callbacks) do cb if isa(cb, type_filter) - cb(param) + if type_filter == AbstractEpochCallback + # epoch callback have extra access to the estimator object + cb(self, param) + else + cb(param) + end end end end @@ -151,6 +156,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra param_arrays = [NDArray[exec.arg_arrays[i] for exec in train_execs] for i in param_idx] grad_arrays = [NDArray[exec.grad_arrays[i] for exec in train_execs] for i in param_idx] + aux_arrays = [NDArray[exec.aux_arrays[i] for exec in train_execs] for i = 1:length(aux_names)] optimizer.batch_size = batch_size cb_param = CallbackParams(batch_size) @@ -185,7 +191,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra cpu_label_arrays_full_slice = [SlicedNDArray[(1:batch_size, x)] for x in cpu_label_arrays] # invoke callbacks on epoch 0 - _invoke_callbacks(opts.callbacks, cb_param, AbstractEpochCallback) + _invoke_callbacks(self, opts.callbacks, cb_param, AbstractEpochCallback) # now start training... 
for i_epoch = 1:opts.n_epoch @@ -196,7 +202,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra cb_param.curr_iter = 0 # invoke callbacks on iteration 0 - _invoke_callbacks(opts.callbacks, cb_param, AbstractIterationCallback) + _invoke_callbacks(self, opts.callbacks, cb_param, AbstractIterationCallback) for batch in data load_data!(batch, data_arrays) @@ -242,7 +248,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end # invoke callbacks after finishing each iteration - _invoke_callbacks(opts.callbacks, cb_param, AbstractIterationCallback) + _invoke_callbacks(self, opts.callbacks, cb_param, AbstractIterationCallback) cb_param.curr_iter += 1 # update evaluation metric on training set @@ -287,5 +293,33 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra info(format("{1:>15s} = {2:.4f}", name, value)) end end + + if i_epoch == opts.n_epoch || any(map(x->isa(x, AbstractEpochCallback), opts.callbacks)) + # copy data back to cpu + for (name, weights) in zip(param_names, param_arrays) + # average parameters across devices + weight = +([copy(w, cpu()) for w in weights]...) / length(weights) + copy!(self.arg_params[name], weight) + end + for (name, aux_devs) in zip(aux_names, aux_arrays) + aux_avg = +([copy(aux, cpu()) for aux in aux_devs]...) 
/ length(aux_devs) + copy!(self.aux_params[name], aux_avg) + end + end + _invoke_callbacks(self, opts.callbacks, cb_param, AbstractEpochCallback) end # end of all epochs end + +function save_checkpoint(self :: FeedForward, prefix :: AbstractString, param :: CallbackParams) + save_checkpoint(self.arch, self.arg_params, self.aux_params, prefix, param.curr_epoch) +end +function save_checkpoint(sym :: Symbol, arg_params :: Dict{Base.Symbol, NDArray}, + aux_params :: Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) + save("$prefix-symbol.json", sym) + save_dict = merge(Dict([symbol("arg:$k") => v for (k,v) in arg_params]), + Dict([symbol("aux:$k") => v for (k,v) in aux_params])) + save_filename = format("{1}-{2:04d}.params", prefix, epoch) + save(save_filename, save_dict) + info("Saved checkpoint to '$save_filename'") +end + diff --git a/src/ndarray.jl b/src/ndarray.jl index 00edc6c7c671..40d4c233e2e0 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -346,11 +346,14 @@ function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) _div(dst, arg, dst) end end -import Base: ./ +import Base: ./, / function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) div_from!(ret, arg) end +function /(arg0 :: NDArray, arg :: Real) + ./(arg0, arg) +end #------------------------------------------------------------ # IO From 5ea6b8cf46fb47e606e4c2409d7d974cd30cfaeb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 12:27:32 -0400 Subject: [PATCH 118/630] array iterator and (part of) the unittest --- src/estimator.jl | 5 ++ src/io.jl | 121 +++++++++++++++++++++++++++++++++++++++++++- src/ndarray.jl | 7 ++- test/unittest/io.jl | 33 ++++++++++++ 4 files changed, 163 insertions(+), 3 deletions(-) diff --git a/src/estimator.jl b/src/estimator.jl index ad436ef359bf..c18eb5f3a6d4 100644 --- a/src/estimator.jl +++ b/src/estimator.jl @@ -7,6 +7,8 @@ type FeedForward <: AbstractEstimator arg_params :: Dict{Base.Symbol, NDArray} 
aux_params :: Dict{Base.Symbol, NDArray} + pred_exec :: Executor + # leave the rest fields undefined FeedForward(arch :: Symbol, ctx :: Vector{Context}) = new(arch, ctx) end @@ -114,6 +116,9 @@ function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback end end +function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) + fit(self, optimizer, data; kwargs...) +end function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) opts = TrainingOptions(; kwargs...) diff --git a/src/io.jl b/src/io.jl index 78fb7cefc22c..389b5a954fe4 100644 --- a/src/io.jl +++ b/src/io.jl @@ -32,8 +32,8 @@ which translates into ```julia state = Base.start(provider) -while !done(provider, state) - (batch, state) = next(provider, state) +while !Base.done(provider, state) + (batch, state) = Base.next(provider, state) # ... load_data!(batch, targets) end @@ -110,6 +110,123 @@ Return the number of *dummy samples* in this mini-batch. 
abstract AbstractDataBatch +################################################################################ +# ArrayDataProvider +################################################################################ +"A convenient tool to iterate `NDArray` or Julia `Array`" +type ArrayDataProvider <: AbstractDataProvider + data_arrays :: Vector{Array{MX_float}} + data_names :: Vector{Base.Symbol} + label_arrays:: Vector{Array{MX_float}} + label_names :: Vector{Base.Symbol} + batch_size :: Int + sample_count:: Int + shuffle :: Bool +end + +function ArrayDataProvider{T<:Real}(data::Union{NDArray,Array{T}}; batch_size::Int=1, shuffle::Bool=false) + ArrayDataProvider(:data => data, batch_size=batch_size, shuffle=shuffle) +end +function ArrayDataProvider(data::Pair; batch_size=1, shuffle::Bool=false) + ArrayDataProvider(Pair[data], Pair[], batch_size=batch_size, shuffle=shuffle) +end +function ArrayDataProvider{T<:Real}(data::Union{NDArray,Array{T}}, label::Union{NDArray,Array{T}}; + batch_size::Int=1, shuffle::Bool=false) + ArrayDataProvider(:data => data, :softmax_label => label, batch_size=batch_size, shuffle=shuffle) +end +function ArrayDataProvider(data::Pair, label::Pair; batch_size=1, shuffle::Bool=false) + ArrayDataProvider([data], [label], batch_size=batch_size, shuffle=shuffle) +end +function ArrayDataProvider(data::Vector{Pair}, label::Vector{Pair}; batch_size::Int=1, shuffle::Bool=false) + + data_names = Base.Symbol[x[1] for x in data] + data_arrays = Array{MX_float}[x[2] for x in data] + + label_names = Base.Symbol[x[1] for x in label] + label_arrays= Array{MX_float}[x[2] for x in label] + + @assert length(data) > 0 + sample_count = size(data_arrays[1])[end] + for i = 1:length(data_names) + @assert(size(data_arrays[i])[end] == sample_count, + "Number of samples in $(data_names[i]) is mismatch with $(data_names[1])") + end + for i = 1:length(label_names) + @assert(size(label_arrays[i])[end] == sample_count, + "Number of samples in $(label_names[i]) is mismatch 
with $(label_names[1])") + end + + ArrayDataProvider(data_arrays, data_names, label_arrays, label_names, batch_size, sample_count, shuffle) +end + +function provide_data(provider::ArrayDataProvider) + return collect(zip(provider.data_names, map(size, provider.data_arrays))) +end +function provide_label(provider::ArrayDataProvider) + return collect(zip(provider.label_names, map(size, provider.label_arrays))) +end +get_batch_size(provider::ArrayDataProvider) = provider.batch_size + +immutable ArrayDataProviderState <: AbstractDataProviderState + curr_idx :: Int +end + +function Base.eltype(provider :: ArrayDataProvider) + ArrayDataProviderState +end + +function _shuffle_array(arr::Array, idx::Vector{Int}) + shape = size(arr) + colons = [Colon() for c = 1:length(shape)-1] + getindex(arr, colons..., idx) +end +function Base.start(provider :: ArrayDataProvider) + if provider.shuffle + # re-shuffle all data + idx_perm = randperm(provider.sample_count) + provider.data_arrays = map(x->_shuffle_array(x,idx_perm), provider.data_arrays) + provider.label_arrays = map(x->_shuffle_array(x,idx_perm), provider.label_arrays) + end + + return ArrayDataProviderState(1) +end + +function Base.done(provider::ArrayDataProvider, state :: ArrayDataProviderState) + return state.curr_idx > provider.sample_count +end + +immutable ArrayDataBatch <: AbstractDataBatch + provider :: ArrayDataProvider + idx :: UnitRange{Int} +end +function Base.next(provider :: ArrayDataProvider, state :: ArrayDataProviderState) + idx = state.curr_idx:min(state.curr_idx+provider.batch_size, provider.sample_count) + return (ArrayDataBatch(provider, idx), ArrayDataProviderState(idx.stop+1)) +end + +function get_pad(batch :: ArrayDataBatch) + return batch.provider.batch_size - length(batch.idx) +end + +function _load_general!(batch :: ArrayDataBatch, sources :: Vector{Array{MX_float}}, + targets :: Vector{Vector{SlicedNDArray}}) + @assert length(sources) == length(targets) + for (src, tgt) in zip(sources, targets) + 
src_colons = [Colon() for i = 1:ndims(src)-1] + for (slice_idx, dst) in tgt + copy!(dst, getindex(src, src_colons..., batch.idx[slice_idx])) + end + end +end +function load_data!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) + _load_general!(batch, batch.provider.data_arrays, targets) +end +function load_label!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) + _load_general!(batch, batch.provider.label_arrays, targets) +end + + + ################################################################################ # MXDataProvider ################################################################################ diff --git a/src/ndarray.jl b/src/ndarray.jl index 40d4c233e2e0..133ebb2a8991 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -181,7 +181,7 @@ end #------------------------------------------------------------ # Copying functions #------------------------------------------------------------ -import Base: copy!, copy +import Base: copy!, copy, convert "Copy data between NDArrays" function copy!(dst :: NDArray, src :: NDArray) @assert(dst.writable) @@ -230,6 +230,11 @@ function copy{T<:Real}(arr :: Array{T}, ctx :: Context) copy!(dst, arr) end +"Convert copy: NDArray -> Julia Array" +function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) + convert(t, copy(arr)) +end + #------------------------------------------------------------ # Basic arithmetics diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 0e9e33f12244..07e3b29a324a 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -2,6 +2,8 @@ module TestIO using MXNet using Base.Test +using ..Main: rand_dims, reldiff + function test_mnist() info("IO::MNIST") filenames = mx.get_mnist_ubyte() @@ -39,6 +41,37 @@ function test_mnist() @test n_batch == 60000 / batch_size end +function test_arrays_impl(data::Vector, label::Vector, provider::mx.ArrayDataProvider) + data = convert(Vector{Array{Float64}}, data) + label = convert(Vector{Array{Float64}}, label) + 
+ sample_count = size(data[1])[end] + batch_size = mx.get_batch_size(provider) + idx_all = 1:batch_size:sample_count + + info("IO::Array::#data=$(length(data)),#label=$(length(label)),batch_size=$batch_size") + for (idx, batch) in zip(idx_all, provider) + data_batch = [x[[Colon() for i=1:ndims(x)-1]..., idx:min(idx+batch_size,sample_count)] for x in data] + data_get = [mx.empty(size(x)[1:end-1]..., batch_size) for x in data] + mx.load_data!(batch, [[(1:batch_size, x)] for x in data_get]) + + for (d_real, d_get) in zip(data_batch, data_batch) + @test reldiff(d_real, copy(d_get)[[1:n for n in size(d_real)]...]) < 1e-6 + @test mx.get_pad(batch) == batch_size - size(d_get)[end] + end + end +end + +function test_arrays() + sample_count = 15 + batch_size = 4 + dims_data = [rand_dims()..., sample_count] + data = rand(dims_data...) + provider = mx.ArrayDataProvider(data, batch_size=batch_size) + test_arrays_impl(Array[data], [], provider) +end + +test_arrays() test_mnist() end From b4cc05cf829a22468caad45eafa65a32770ab4d9 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 20:49:45 -0400 Subject: [PATCH 119/630] more test on array data iterator --- src/io.jl | 60 +++++++++++++++++++++++++++++++-------------- test/unittest/io.jl | 5 ++++ 2 files changed, 47 insertions(+), 18 deletions(-) diff --git a/src/io.jl b/src/io.jl index 389b5a954fe4..5e6cc8b6a449 100644 --- a/src/io.jl +++ b/src/io.jl @@ -124,26 +124,50 @@ type ArrayDataProvider <: AbstractDataProvider shuffle :: Bool end -function ArrayDataProvider{T<:Real}(data::Union{NDArray,Array{T}}; batch_size::Int=1, shuffle::Bool=false) - ArrayDataProvider(:data => data, batch_size=batch_size, shuffle=shuffle) -end -function ArrayDataProvider(data::Pair; batch_size=1, shuffle::Bool=false) - ArrayDataProvider(Pair[data], Pair[], batch_size=batch_size, shuffle=shuffle) -end -function ArrayDataProvider{T<:Real}(data::Union{NDArray,Array{T}}, label::Union{NDArray,Array{T}}; - batch_size::Int=1, 
shuffle::Bool=false) - ArrayDataProvider(:data => data, :softmax_label => label, batch_size=batch_size, shuffle=shuffle) -end -function ArrayDataProvider(data::Pair, label::Pair; batch_size=1, shuffle::Bool=false) - ArrayDataProvider([data], [label], batch_size=batch_size, shuffle=shuffle) -end -function ArrayDataProvider(data::Vector{Pair}, label::Vector{Pair}; batch_size::Int=1, shuffle::Bool=false) - data_names = Base.Symbol[x[1] for x in data] - data_arrays = Array{MX_float}[x[2] for x in data] +# Julia's type system is sometimes very frustrating. You cannot specify a function +# with argument Vector{Pair} to expect to be matched when calling with the parameter +# [:foo => zeros(2,3), :bar => zeros(3)] because the type inference gives very specific +# results, about the parametric type in the Pair{T1,T2} type, thus does not match the +# generic Pair type. In general, Int <: Number but Vector{Int} <: Vector{Number} is not +# true. So let us just use Any here... +function ArrayDataProvider(data::Any; batch_size::Int=1, shuffle::Bool=false) + ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle) +end +function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bool=false) + if isa(data, Union{NDArray, Array}) + data_names = [:data] + data_arrays = Array{MX_float}[data] + elseif isa(data, Pair) + @assert isa(data.first, Base.Symbol) && isa(data.second, Union{NDArray, Array}) + data_names = [data.first] + data_arrays = Array{MX_float}[data.second] + elseif isa(data, Vector) + map(data) do d + @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) + end + data_names = Base.Symbol[d.first for d in data] + data_arrays = Array{MX_float}[d.second for d in data] + else + error("Invalid data argument type") + end - label_names = Base.Symbol[x[1] for x in label] - label_arrays= Array{MX_float}[x[2] for x in label] + if isa(label, Union{NDArray, Array}) + label_names = [:softmax_label] + label_arrays = 
Array{MX_float}[data] + elseif isa(label, Pair) + @assert isa(label.first, Base.Symbol) && isa(label.second, Union{NDArray, Array}) + label_names = [label.first] + label_arrays = Array{MX_float}[label.second] + elseif isa(label, Vector) + map(label) do d + @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) + end + label_names = Base.Symbol[d.first for d in label] + label_arrays = Array{MX_float}[d.second for d in label] + else + error("Invalid label argument type") + end @assert length(data) > 0 sample_count = size(data_arrays[1])[end] diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 07e3b29a324a..9eb0581b5eb3 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -69,6 +69,11 @@ function test_arrays() data = rand(dims_data...) provider = mx.ArrayDataProvider(data, batch_size=batch_size) test_arrays_impl(Array[data], [], provider) + + dims_label = [rand_dims()..., sample_count] + label = rand(dims_label...) + provider = mx.ArrayDataProvider(data, label, batch_size=batch_size) + test_arrays_impl(Array[data], Array[label], provider) end test_arrays() From 2c9d9aef77fbf6e8e2061066ba7723e8be0f48e6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 20:59:27 -0400 Subject: [PATCH 120/630] more tests on array data provider --- src/io.jl | 14 +++++++------- test/unittest/io.jl | 16 ++++++++++++---- 2 files changed, 19 insertions(+), 11 deletions(-) diff --git a/src/io.jl b/src/io.jl index 5e6cc8b6a449..efdd4687bff1 100644 --- a/src/io.jl +++ b/src/io.jl @@ -135,14 +135,14 @@ function ArrayDataProvider(data::Any; batch_size::Int=1, shuffle::Bool=false) ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle) end function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bool=false) - if isa(data, Union{NDArray, Array}) + if isa(data, Union{NDArray, Array}) && eltype(data) <: Real data_names = [:data] data_arrays = Array{MX_float}[data] elseif isa(data, Pair) @assert 
isa(data.first, Base.Symbol) && isa(data.second, Union{NDArray, Array}) data_names = [data.first] data_arrays = Array{MX_float}[data.second] - elseif isa(data, Vector) + elseif isa(data, Vector) || isa(data, Tuple) map(data) do d @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) end @@ -152,14 +152,14 @@ function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bo error("Invalid data argument type") end - if isa(label, Union{NDArray, Array}) + if isa(label, Union{NDArray, Array}) && eltype(label) <: Real label_names = [:softmax_label] - label_arrays = Array{MX_float}[data] + label_arrays = Array{MX_float}[label] elseif isa(label, Pair) @assert isa(label.first, Base.Symbol) && isa(label.second, Union{NDArray, Array}) label_names = [label.first] label_arrays = Array{MX_float}[label.second] - elseif isa(label, Vector) + elseif isa(label, Vector) || isa(label, Tuple) map(label) do d @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) end @@ -169,7 +169,7 @@ function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bo error("Invalid label argument type") end - @assert length(data) > 0 + @assert length(data_arrays) > 0 sample_count = size(data_arrays[1])[end] for i = 1:length(data_names) @assert(size(data_arrays[i])[end] == sample_count, @@ -177,7 +177,7 @@ function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bo end for i = 1:length(label_names) @assert(size(label_arrays[i])[end] == sample_count, - "Number of samples in $(label_names[i]) is mismatch with $(label_names[1])") + "Number of samples in $(label_names[i]) is mismatch with $(data_names[1])") end ArrayDataProvider(data_arrays, data_names, label_arrays, label_names, batch_size, sample_count, shuffle) diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 9eb0581b5eb3..cb7f9edbf7fd 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -66,14 +66,22 @@ function 
test_arrays() sample_count = 15 batch_size = 4 dims_data = [rand_dims()..., sample_count] - data = rand(dims_data...) - provider = mx.ArrayDataProvider(data, batch_size=batch_size) + data = rand(dims_data...) + provider = mx.ArrayDataProvider(data, batch_size=batch_size) test_arrays_impl(Array[data], [], provider) dims_label = [rand_dims()..., sample_count] - label = rand(dims_label...) - provider = mx.ArrayDataProvider(data, label, batch_size=batch_size) + label = rand(dims_label...) + provider = mx.ArrayDataProvider(data, label, batch_size=batch_size) test_arrays_impl(Array[data], Array[label], provider) + + provider = mx.ArrayDataProvider(:data=>data, :my_label=>label, batch_size=batch_size) + test_arrays_impl(Array[data], Array[label], provider) + + dims_data2 = [rand_dims()..., sample_count] + data2 = rand(dims_data2...) + provider = mx.ArrayDataProvider((:data=>data, :data2=>data2), label, batch_size=batch_size) + test_arrays_impl(Array[data,data2], Array[label], provider) end test_arrays() From dc8ca183623ff2ff84ee8b441110e38bd731ea01 Mon Sep 17 00:00:00 2001 From: Yeesian Ng Date: Sun, 25 Oct 2015 21:31:28 -0400 Subject: [PATCH 121/630] fix README example --- README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/README.md b/README.md index c184eac57178..d856165308eb 100644 --- a/README.md +++ b/README.md @@ -24,6 +24,7 @@ mlp = @mx.chain mx.Variable(:data) => # data provider batch_size = 100 +include(Pkg.dir("MXNet") * "/examples/mnist/mnist-data.jl") train_provider, eval_provider = get_mnist_providers(batch_size) # setup estimator From eb8440215fa75470d06dda5ff9f9c69346a075fe Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 21:49:56 -0400 Subject: [PATCH 122/630] test shuffling of array data provider --- src/io.jl | 44 ++++++++++++++++++++++++++++---------------- src/ndarray.jl | 5 ++++- test/unittest/io.jl | 33 ++++++++++++++++++++++++++++++--- 3 files changed, 62 insertions(+), 20 deletions(-) diff --git a/src/io.jl b/src/io.jl 
index efdd4687bff1..5ffcf95f0bef 100644 --- a/src/io.jl +++ b/src/io.jl @@ -115,13 +115,15 @@ abstract AbstractDataBatch ################################################################################ "A convenient tool to iterate `NDArray` or Julia `Array`" type ArrayDataProvider <: AbstractDataProvider - data_arrays :: Vector{Array{MX_float}} - data_names :: Vector{Base.Symbol} - label_arrays:: Vector{Array{MX_float}} - label_names :: Vector{Base.Symbol} - batch_size :: Int - sample_count:: Int - shuffle :: Bool + data_arrays :: Vector{Array{MX_float}} + data_names :: Vector{Base.Symbol} + label_arrays :: Vector{Array{MX_float}} + label_names :: Vector{Base.Symbol} + batch_size :: Int + sample_count :: Int + shuffle :: Bool + data_padding :: MX_float + label_padding :: MX_float end @@ -131,10 +133,10 @@ end # results, about the parametric type in the Pair{T1,T2} type, thus does not match the # generic Pair type. In general, Int <: Number but Vector{Int} <: Vector{Number} is not # true. So let us just use Any here... 
-function ArrayDataProvider(data::Any; batch_size::Int=1, shuffle::Bool=false) - ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle) +function ArrayDataProvider(data::Any; batch_size::Int=1, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) + ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle, data_padding=data_padding, label_padding=label_padding) end -function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bool=false) +function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) if isa(data, Union{NDArray, Array}) && eltype(data) <: Real data_names = [:data] data_arrays = Array{MX_float}[data] @@ -180,7 +182,8 @@ function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bo "Number of samples in $(label_names[i]) is mismatch with $(data_names[1])") end - ArrayDataProvider(data_arrays, data_names, label_arrays, label_names, batch_size, sample_count, shuffle) + ArrayDataProvider(data_arrays, data_names, label_arrays, label_names, batch_size, + sample_count, shuffle, data_padding, label_padding) end function provide_data(provider::ArrayDataProvider) @@ -224,7 +227,7 @@ immutable ArrayDataBatch <: AbstractDataBatch idx :: UnitRange{Int} end function Base.next(provider :: ArrayDataProvider, state :: ArrayDataProviderState) - idx = state.curr_idx:min(state.curr_idx+provider.batch_size, provider.sample_count) + idx = state.curr_idx:min(state.curr_idx+provider.batch_size-1, provider.sample_count) return (ArrayDataBatch(provider, idx), ArrayDataProviderState(idx.stop+1)) end @@ -233,20 +236,29 @@ function get_pad(batch :: ArrayDataBatch) end function _load_general!(batch :: ArrayDataBatch, sources :: Vector{Array{MX_float}}, - targets :: Vector{Vector{SlicedNDArray}}) + targets :: Vector{Vector{SlicedNDArray}}, pad_val::Real) @assert length(sources) == length(targets) for (src, tgt) in zip(sources, targets) 
src_colons = [Colon() for i = 1:ndims(src)-1] for (slice_idx, dst) in tgt - copy!(dst, getindex(src, src_colons..., batch.idx[slice_idx])) + if slice_idx.start > length(batch.idx) + dst[:] = pad_val + else + slice_idx0 = slice_idx.start:min(slice_idx.stop, length(batch.idx)) + copy!(dst[1:length(slice_idx0)], getindex(src, src_colons..., batch.idx[slice_idx0])) + if length(slice_idx0) < length(slice_idx) + # need padding + dst[length(slice_idx0)+1:length(slice_idx)] = pad_val + end + end end end end function load_data!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - _load_general!(batch, batch.provider.data_arrays, targets) + _load_general!(batch, batch.provider.data_arrays, targets, batch.provider.data_padding) end function load_label!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - _load_general!(batch, batch.provider.label_arrays, targets) + _load_general!(batch, batch.provider.label_arrays, targets, batch.provider.label_padding) end diff --git a/src/ndarray.jl b/src/ndarray.jl index 133ebb2a8991..2156ce76be14 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -140,6 +140,9 @@ end function slice(arr :: NDArray, slice::UnitRange{Int}) dim1 = size(arr)[end] @assert(1 <= slice.start <= slice.stop <= dim1) + if slice.start == 1 && slice.stop == dim1 + return arr + end hdr_ref = Ref{MX_handle}(0) # note Julia is 1-based, inclusive-inclusive indexing, while C++ is @@ -164,7 +167,7 @@ function setindex!(arr :: NDArray, val :: NDArray, ::Colon) copy!(arr, val) end function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, idx::UnitRange{Int}) - copy!(slice(arr, idx), val) + setindex!(slice(arr, idx), val, Colon()) end import Base: getindex diff --git a/test/unittest/io.jl b/test/unittest/io.jl index cb7f9edbf7fd..cffb00417a57 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -51,13 +51,13 @@ function test_arrays_impl(data::Vector, label::Vector, provider::mx.ArrayDataPro 
info("IO::Array::#data=$(length(data)),#label=$(length(label)),batch_size=$batch_size") for (idx, batch) in zip(idx_all, provider) - data_batch = [x[[Colon() for i=1:ndims(x)-1]..., idx:min(idx+batch_size,sample_count)] for x in data] + data_batch = [x[[Colon() for i=1:ndims(x)-1]..., idx:min(idx+batch_size-1,sample_count)] for x in data] data_get = [mx.empty(size(x)[1:end-1]..., batch_size) for x in data] mx.load_data!(batch, [[(1:batch_size, x)] for x in data_get]) - for (d_real, d_get) in zip(data_batch, data_batch) + for (d_real, d_get) in zip(data_batch, data_get) @test reldiff(d_real, copy(d_get)[[1:n for n in size(d_real)]...]) < 1e-6 - @test mx.get_pad(batch) == batch_size - size(d_get)[end] + @test mx.get_pad(batch) == batch_size - size(d_real)[end] end end end @@ -84,6 +84,33 @@ function test_arrays() test_arrays_impl(Array[data,data2], Array[label], provider) end +function test_arrays_shuffle() + info("IO::Array::shuffle") + + sample_count = 15 + batch_size = 4 + data = rand(1, sample_count) + label = collect(1:sample_count) + provider = mx.ArrayDataProvider(data, :index => label, batch_size=batch_size, shuffle=true) + + idx_all = 1:batch_size:sample_count + data_got = similar(data) + label_got = similar(label) + for (idx, batch) in zip(idx_all, provider) + data_batch = [(1:batch_size, mx.empty(1,batch_size))] + label_batch = [(1:batch_size, mx.empty(batch_size))] + mx.load_data!(batch, typeof(data_batch)[data_batch]) + mx.load_label!(batch, typeof(label_batch)[label_batch]) + data_got[idx:min(idx+batch_size-1,sample_count)] = copy(data_batch[1][2])[1:batch_size-mx.get_pad(batch)] + label_got[idx:min(idx+batch_size-1,sample_count)] = copy(label_batch[1][2])[1:batch_size-mx.get_pad(batch)] + end + + @test label_got != label + @test sort(label_got) == label + @test reldiff(data_got, data[:,Int[label_got...]]) < 1e-6 +end + +test_arrays_shuffle() test_arrays() test_mnist() From 1538340e3a6874c4380e7b0b5d44aab3ee992f53 Mon Sep 17 00:00:00 2001 From: Chiyuan 
Zhang Date: Sun, 25 Oct 2015 22:03:56 -0400 Subject: [PATCH 123/630] rename estimator -> model --- README.md | 6 +++--- docs/tutorials/mnist.md | 10 +++++----- docs/user-guide/overview.md | 4 ++-- examples/cifar10/cifar10.jl | 4 ++-- examples/mnist/lenet.jl | 4 ++-- examples/mnist/mlp.jl | 6 +++--- src/MXNet.jl | 2 +- src/callback.jl | 10 +++++----- src/{estimator.jl => model.jl} | 6 +++--- 9 files changed, 26 insertions(+), 26 deletions(-) rename src/{estimator.jl => model.jl} (98%) diff --git a/README.md b/README.md index c184eac57178..33a347ceeb78 100644 --- a/README.md +++ b/README.md @@ -26,14 +26,14 @@ mlp = @mx.chain mx.Variable(:data) => batch_size = 100 train_provider, eval_provider = get_mnist_providers(batch_size) -# setup estimator -estimator = mx.FeedForward(mlp, context=mx.cpu()) +# setup model +model = mx.FeedForward(mlp, context=mx.cpu()) # optimizer optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) ``` For more details, please refer to the [document](http://mxnetjl.readthedocs.org/) and [examples](examples). diff --git a/docs/tutorials/mnist.md b/docs/tutorials/mnist.md index 97a12e8aadeb..ecf7bab8f631 100644 --- a/docs/tutorials/mnist.md +++ b/docs/tutorials/mnist.md @@ -45,9 +45,9 @@ train_provider, eval_provider = get_mnist_providers(batch_size) ``` If you need to write your own data providers for customized data format, please refer to **TODO**: pointer to data provider API. -Given the architecture and data, we can instantiate an *estimator* to do the actual training. `mx.FeedForward` is the built-in estimator that is suitable for most feed-forward architectures. When constructing the estimator, we also specify the *context* on which the computation should be carried out. Because this is a really tiny MLP, we will just run on a single CPU device. 
+Given the architecture and data, we can instantiate an *model* to do the actual training. `mx.FeedForward` is the built-in model that is suitable for most feed-forward architectures. When constructing the model, we also specify the *context* on which the computation should be carried out. Because this is a really tiny MLP, we will just run on a single CPU device. ```julia -estimator = mx.FeedForward(mlp, context=mx.cpu()) +model = mx.FeedForward(mlp, context=mx.cpu()) ``` You can use a `mx.gpu()` or if a list of devices (e.g. `[mx.gpu(0), mx.gpu(1)]`) is provided, data-parallelization will be used automatically. But for this tiny example, using a GPU device might not help. @@ -57,7 +57,7 @@ optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) ``` Now we can do the training. Here the `n_epoch` parameter specifies that we want to train for 20 epochs. We also supply a `eval_data` to monitor validation accuracy on the validation set. ```julia -mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) ``` Here is a sample output ``` @@ -124,13 +124,13 @@ Note we specified `flat=false` to tell the data provider to provide 4D tensors i ```julia #-------------------------------------------------------------------------------- # fit model -estimator = mx.FeedForward(lenet, context=mx.gpu()) +model = mx.FeedForward(lenet, context=mx.gpu()) # optimizer optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) ``` And here is a sample of running outputs: ``` diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md index 3155b281245d..7689b3fba921 100644 --- a/docs/user-guide/overview.md +++ b/docs/user-guide/overview.md @@ -130,9 +130,9 @@ copy(c_exec.outputs[1]) # copy 
turns NDArray into Julia Array # 8.0 # 8.0 ``` -For neural networks, it is easier to use `simple_bind`. By providing the shape for input arguments, it will perform a shape inference for the rest of the arguments and create the `NDArray`s automatically. In practice, the binding and executing steps are hidden under the `Estimator` interface. +For neural networks, it is easier to use `simple_bind`. By providing the shape for input arguments, it will perform a shape inference for the rest of the arguments and create the `NDArray`s automatically. In practice, the binding and executing steps are hidden under the `Model` interface. -**TODO** Provide pointers to estimator tutorial and further details about binding and symbolic API. +**TODO** Provide pointers to model tutorial and further details about binding and symbolic API. # Low Level Interface diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index 7b335d3b1219..c46e2b3bf15c 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -74,7 +74,7 @@ test_provider = mx.ImageRecordProvider(label_name=:loss_label, #-------------------------------------------------------------------------------- # Training model gpus = [mx.Context(mx.GPU, i) for i = 0:num_gpus-1] -estimator = mx.FeedForward(softmax, context=gpus) +model = mx.FeedForward(softmax, context=gpus) # optimizer optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), @@ -82,5 +82,5 @@ optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), weight_decay=0.0001) # fit parameters -mx.fit(estimator, optimizer, train_provider, n_epoch=num_epoch, eval_data=test_provider, +mx.fit(model, optimizer, train_provider, n_epoch=num_epoch, eval_data=test_provider, initializer=mx.UniformInitializer(0.07), callbacks=[mx.speedometer()]) diff --git a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl index 92f41e88aeb6..804fc1ea5312 100644 --- a/examples/mnist/lenet.jl +++ b/examples/mnist/lenet.jl @@ -36,10 +36,10 @@ 
train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) #-------------------------------------------------------------------------------- # fit model -estimator = mx.FeedForward(lenet, context=mx.gpu()) +model = mx.FeedForward(lenet, context=mx.gpu()) # optimizer optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 26aa4ecfda49..2dbae9790c3f 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -27,11 +27,11 @@ batch_size = 100 include("mnist-data.jl") train_provider, eval_provider = get_mnist_providers(batch_size) -# setup estimator -estimator = mx.FeedForward(mlp, context=mx.cpu()) +# setup model +model = mx.FeedForward(mlp, context=mx.cpu()) # optimizer optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(estimator, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) diff --git a/src/MXNet.jl b/src/MXNet.jl index 9f404a077aed..53553d417941 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -26,7 +26,7 @@ include("io.jl") include("kvstore.jl") include("callback.jl") -include("estimator.jl") +include("model.jl") include("util.jl") diff --git a/src/callback.jl b/src/callback.jl index c124c9b9357c..049f19432981 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -57,19 +57,19 @@ end function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end -function Base.call(cb :: EpochCallback, estimator :: Any, param :: CallbackParams) +function Base.call(cb :: EpochCallback, model :: Any, param :: CallbackParams) if param.curr_epoch == 0 if cb.call_on_0 - cb.callback(estimator, param) + cb.callback(model, 
param) end elseif param.curr_epoch % cb.frequency == 0 - cb.callback(estimator, param) + cb.callback(model, param) end end function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) mkpath(dirname(prefix)) - every_n_epoch(frequency, call_on_0=save_epoch_0) do estimator, param - save_checkpoint(estimator, prefix, param) + every_n_epoch(frequency, call_on_0=save_epoch_0) do model, param + save_checkpoint(model, prefix, param) end end diff --git a/src/estimator.jl b/src/model.jl similarity index 98% rename from src/estimator.jl rename to src/model.jl index c18eb5f3a6d4..77b435dd829c 100644 --- a/src/estimator.jl +++ b/src/model.jl @@ -1,6 +1,6 @@ -abstract AbstractEstimator +abstract AbstractModel -type FeedForward <: AbstractEstimator +type FeedForward <: AbstractModel arch :: Symbol ctx :: Vector{Context} @@ -107,7 +107,7 @@ function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback map(callbacks) do cb if isa(cb, type_filter) if type_filter == AbstractEpochCallback - # epoch callback have extra access to the estimator object + # epoch callback have extra access to the model object cb(self, param) else cb(param) From 28791db37922d16a466be6a2ed9ae4726623acf6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 22:05:59 -0400 Subject: [PATCH 124/630] use joinpath in README --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 4e2d849e035e..8e148c2d7529 100644 --- a/README.md +++ b/README.md @@ -24,7 +24,7 @@ mlp = @mx.chain mx.Variable(:data) => # data provider batch_size = 100 -include(Pkg.dir("MXNet") * "/examples/mnist/mnist-data.jl") +include(joinpath(Pkg.dir("MXNet"), "/examples/mnist/mnist-data.jl")) train_provider, eval_provider = get_mnist_providers(batch_size) # setup model From 1baeabc4eaae8f75da6884b1d9cd5ee638163fed Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 22:36:07 -0400 Subject: [PATCH 125/630] expose init_model 
API --- src/model.jl | 50 ++++++++++++++++++++++++++++++++++++++++---------- 1 file changed, 40 insertions(+), 10 deletions(-) diff --git a/src/model.jl b/src/model.jl index 77b435dd829c..df364bef3410 100644 --- a/src/model.jl +++ b/src/model.jl @@ -7,7 +7,7 @@ type FeedForward <: AbstractModel arg_params :: Dict{Base.Symbol, NDArray} aux_params :: Dict{Base.Symbol, NDArray} - pred_exec :: Executor + pred_exec :: Union{Executor, Void} # leave the rest fields undefined FeedForward(arch :: Symbol, ctx :: Vector{Context}) = new(arch, ctx) @@ -38,19 +38,28 @@ function FeedForward(arch :: Symbol; context :: Union{Context, Vector{Context}, FeedForward(arch, context) end -function _init_params(self :: FeedForward, data :: AbstractDataProvider, initializer) +"""Initialize the weights in the model. + +This method will be called automatically when training a model. So there is usually no +need to call this method unless one needs to inspect a model with only randomly initialized +weights. + +**Parameters** + +* `self`: the model to be initialized +* `initializer`: an `AbstractInitializer` +* `input_shapes`: the shape of all data and label inputs to this model, given as keyword arguments. +""" +function init_model(self :: FeedForward, initializer :: AbstractInitializer; input_shapes...) # all arg names, including data, label, and parameters arg_names = list_arguments(self.arch) - data_shapes = provide_data(data) - label_shapes = provide_label(data) - data_names = [x[1] for x in data_shapes] - label_names = [x[1] for x in label_shapes] + input_names = [x[1] for x in input_shapes] - param_names = setdiff(arg_names, data_names ∪ label_names) + param_names = setdiff(arg_names, input_names) aux_names = list_auxiliary_states(self.arch) - arg_shapes, out_shapes, aux_shapes = infer_shape(self.arch; data_shapes...) + arg_shapes, out_shapes, aux_shapes = infer_shape(self.arch; input_shapes...) 
if !isdefined(self, :arg_params) param_name_shapes = filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) self.arg_params = Dict([name => empty(shape) for (name,shape) in param_name_shapes]) @@ -70,6 +79,10 @@ function _init_params(self :: FeedForward, data :: AbstractDataProvider, initial return (arg_names, param_names, aux_names) end +function _init_model(self :: FeedForward, data :: AbstractDataProvider, initializer :: AbstractInitializer) + init_model(self, initializer; [provide_data(data)..., provide_label(data)...]...) +end + function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) if num_device == 1 && !ismatch(r"dist", string(kv_type)) kv = nothing @@ -116,6 +129,23 @@ function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback end end +function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_shapes...) + if !isdefined(self, :pred_exec) || isa(self.pred_exec, Void) || overwrite + if !isdefined(self, :arg_params) || !isdefined(self, :aux_params) + @assert(false, "Model weights not defined, please init or train the model, or load from file") + end + else + # make sure the new setup is compatible with the existing one + for (d_name, d_shape) in data_shapes + @assert(d_shape == size(self.pred_exec.arg_dict[d_name]), + "Shape of $d_name mismatch with existing predictor, use overwrite=true overwrite existing predictor") + end + end +end + +function predict(self :: FeedForward, data :: AbstractDataProvider) +end + function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) fit(self, optimizer, data; kwargs...) 
end @@ -130,7 +160,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # initialize parameters info("Initializing parameters...") - arg_names, param_names, aux_names = _init_params(self, data, opts.initializer) + arg_names, param_names, aux_names = _init_model(self, data, opts.initializer) # setup kvstore kvstore = opts.kvstore @@ -299,7 +329,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end end - if i_epoch == opts.n_epoch || any(map(x->isa(x, AbstractEpochCallback), opts.callbacks)) + if i_epoch == opts.n_epoch || any(x->isa(x, AbstractEpochCallback), opts.callbacks) # copy data back to cpu for (name, weights) in zip(param_names, param_arrays) # average parameters across devices From 7fa151104fb51d7134da60a5084dfa0d240515f0 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 25 Oct 2015 23:22:05 -0400 Subject: [PATCH 126/630] model predict API and demo --- examples/mnist/mlp.jl | 22 ++++++++++++++++++++++ src/executor.jl | 2 +- src/io.jl | 17 +++++++++++++++++ src/model.jl | 32 +++++++++++++++++++++++++++++++- 4 files changed, 71 insertions(+), 2 deletions(-) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 2dbae9790c3f..0834739467e9 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -35,3 +35,25 @@ optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit parameters mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) + +#-------------------------------------------------------------------------------- +# Optional, demonstration of the predict API +outputs = mx.predict(model, eval_provider) +probs = outputs[1] + +# collect all labels from eval data +labels = Array[] +for batch in eval_provider + push!(labels, copy(mx.get_label(batch)[1])) +end +labels = cat(1, labels...) 
+ +# Now we use compute the accuracy +correct = 0 +for i = 1:length(labels) + # labels are 0...9 + if indmax(probs[:,i]) == labels[i]+1 + correct += 1 + end +end +println(mx.format("Accuracy on eval set: {1:.2f}%", 100correct/length(labels))) diff --git a/src/executor.jl b/src/executor.jl index fe83db86a831..4d57c1da7b7c 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -108,7 +108,7 @@ function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_W arg_arrays = NDArray[zeros(shape, ctx) for shape in arg_shapes] arg_names = list_arguments(self) if grad_req == GRAD_NOP - grad_arrays = nothing + grad_arrays = Dict{Base.Symbol,NDArray}() else provided_data_names = [x[1] for x in kwargs] grad_arrays = Dict{Base.Symbol,NDArray}() diff --git a/src/io.jl b/src/io.jl index 5ffcf95f0bef..dcbefb145859 100644 --- a/src/io.jl +++ b/src/io.jl @@ -106,9 +106,26 @@ get_pad(batch :: AbstractDataBatch) ``` Return the number of *dummy samples* in this mini-batch. + +The Batch type should have a field named `provider` pointing to the underlying provider. Helper functions +`get_data` and `get_label` (mainly for debug purpose) will be able to use this. """ abstract AbstractDataBatch +function _get_data_or_label(batch::AbstractDataBatch, provide_func::Function, loader::Function) + data_shapes = provide_func(batch.provider) + data_arrays = [mx.empty(x[2]) for x in data_shapes] + batch_size = get_batch_size(batch.provider) + data_arrays_fake_slice = [SlicedNDArray[(1:batch_size, x)] for x in data_arrays] + loader(batch, data_arrays_fake_slice) + return data_arrays +end +function get_data(batch :: AbstractDataBatch) + _get_data_or_label(batch, provide_data, load_data!) +end +function get_label(batch :: AbstractDataBatch) + _get_data_or_label(batch, provide_label, load_label!) 
+end ################################################################################ # ArrayDataProvider diff --git a/src/model.jl b/src/model.jl index df364bef3410..6cc7097b28ce 100644 --- a/src/model.jl +++ b/src/model.jl @@ -134,6 +134,10 @@ function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_sha if !isdefined(self, :arg_params) || !isdefined(self, :aux_params) @assert(false, "Model weights not defined, please init or train the model, or load from file") end + + # the predictor use only the first device + self.pred_exec = simple_bind(self.arch, self.ctx[1]; grad_req=GRAD_NOP, data_shapes...) + copy_params_from(self.pred_exec, self.arg_params, self.aux_params) else # make sure the new setup is compatible with the existing one for (d_name, d_shape) in data_shapes @@ -143,7 +147,33 @@ function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_sha end end -function predict(self :: FeedForward, data :: AbstractDataProvider) +function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=false) + data_shapes = provide_data(data) + data_names = [x[1] for x in data_shapes] + _setup_predictor(self, overwrite; data_shapes...) + + batch_size = get_batch_size(data) + data_arrays = [SlicedNDArray[(1:batch_size, self.pred_exec.arg_dict[name])] for name in data_names] + output_list = [Array{MX_float}[] for i=1:length(self.pred_exec.outputs)] + for batch in data + load_data!(batch, data_arrays) + forward(self.pred_exec, is_train=false) + for (o_list, o_nd) in zip(output_list, self.pred_exec.outputs) + push!(o_list, copy(slice(o_nd, 1:batch_size-get_pad(batch)))) + end + end + + if isempty(output_list) + # maybe model does not have outputs + return Array{MX_float}[] + end + if isempty(output_list[1]) + # model has outputs, but maybe data provider is empty + return output_list + end + # concatenate along mini-batches + output_arrays = [cat(ndims(x[1]), x...) 
for x in output_list] + return output_arrays end function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) From bb4620e6bc228a7b124f038ac7cbe5de939c5d0b Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Oct 2015 16:35:33 -0400 Subject: [PATCH 127/630] model checkpoint loading --- docs/api/ndarray.md | 51 ++++++++++++++++++++-------------- docs/api/symbol.md | 35 ++++++++++++++++++++--- src/model.jl | 67 +++++++++++++++++++++++++++++++++++++++------ 3 files changed, 120 insertions(+), 33 deletions(-) diff --git a/docs/api/ndarray.md b/docs/api/ndarray.md index 87e664ffb0cc..fae68df32c2b 100644 --- a/docs/api/ndarray.md +++ b/docs/api/ndarray.md @@ -32,7 +32,16 @@ object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs wi *source:* -[MXNet/src/ndarray.jl:453](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L453) +[MXNet/src/ndarray.jl:468](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L468) + +--- + + +#### convert{T<:Real}(t::Type{Array{T<:Real, N}}, arr::MXNet.mx.NDArray) +Convert copy: NDArray -> Julia Array + +*source:* +[MXNet/src/ndarray.jl:237](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L237) --- @@ -41,7 +50,7 @@ object (`NDArray`) is returned. 
Otherwise, a tuple containing all the outputs wi Copy data from NDArray to Julia Array *source:* -[MXNet/src/ndarray.jl:198](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L198) +[MXNet/src/ndarray.jl:201](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L201) --- @@ -50,7 +59,7 @@ Copy data from NDArray to Julia Array Copy data between NDArrays *source:* -[MXNet/src/ndarray.jl:186](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L186) +[MXNet/src/ndarray.jl:189](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L189) --- @@ -59,7 +68,7 @@ Copy data between NDArrays Copy data from Julia Array to NDArray *source:* -[MXNet/src/ndarray.jl:206](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L206) +[MXNet/src/ndarray.jl:209](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L209) --- @@ -68,7 +77,7 @@ Copy data from Julia Array to NDArray Create copy: NDArray -> Julia Array *source:* -[MXNet/src/ndarray.jl:216](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L216) +[MXNet/src/ndarray.jl:219](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L219) --- @@ -77,7 +86,7 @@ Create copy: NDArray -> Julia Array Create copy: NDArray -> NDArray in a given context *source:* -[MXNet/src/ndarray.jl:222](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L222) +[MXNet/src/ndarray.jl:225](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L225) --- @@ -86,7 +95,7 @@ Create copy: NDArray -> NDArray in a given context Create copy: Julia Array -> NDArray in a given context *source:* 
-[MXNet/src/ndarray.jl:228](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L228) +[MXNet/src/ndarray.jl:231](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L231) --- @@ -97,12 +106,12 @@ copy of the sub-array, while here we simply call `slice`, which shares the under *source:* -[MXNet/src/ndarray.jl:174](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L174) +[MXNet/src/ndarray.jl:177](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L177) --- - -#### load_ndarrays(filename::AbstractString) + +#### load(filename::AbstractString, ::Type{MXNet.mx.NDArray}) Load NDArrays from binary file. **Parameters**: @@ -120,7 +129,7 @@ Load NDArrays from binary file. *source:* -[MXNet/src/ndarray.jl:373](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L373) +[MXNet/src/ndarray.jl:384](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L384) --- @@ -129,12 +138,12 @@ Load NDArrays from binary file. Create NDArray and initialize with 1 *source:* -[MXNet/src/ndarray.jl:118](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L118) +[MXNet/src/ndarray.jl:118](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L118) --- - -#### save_ndarrays(filename::AbstractString, data::MXNet.mx.NDArray) + +#### save(filename::AbstractString, data::MXNet.mx.NDArray) Save NDarrays to binary file. **Parameters**: @@ -144,7 +153,7 @@ Save NDarrays to binary file. 
*source:* -[MXNet/src/ndarray.jl:398](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L398) +[MXNet/src/ndarray.jl:409](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L409) --- @@ -153,7 +162,7 @@ Save NDarrays to binary file. Assign all elements of an NDArray to a scalar *source:* -[MXNet/src/ndarray.jl:155](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L155) +[MXNet/src/ndarray.jl:158](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L158) --- @@ -165,7 +174,7 @@ Get the shape of an `NDArray`. Note the shape is converted to Julia convention. *source:* -[MXNet/src/ndarray.jl:84](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L84) +[MXNet/src/ndarray.jl:84](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L84) --- @@ -179,7 +188,7 @@ used in data parallelization to split mini-batch into sub-batches for different *source:* -[MXNet/src/ndarray.jl:137](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L137) +[MXNet/src/ndarray.jl:137](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L137) --- @@ -188,7 +197,7 @@ used in data parallelization to split mini-batch into sub-batches for different Create zero-ed NDArray of specific shape *source:* -[MXNet/src/ndarray.jl:105](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L105) +[MXNet/src/ndarray.jl:105](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L105) --- @@ -206,7 +215,7 @@ have shape (28,28,1,100). 
*source:* -[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L32) +[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L32) --- @@ -234,5 +243,5 @@ which will do inplace adding of the contents of b into a. *source:* -[MXNet/src/ndarray.jl:258](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/ndarray.jl#L258) +[MXNet/src/ndarray.jl:266](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L266) diff --git a/docs/api/symbol.md b/docs/api/symbol.md index d263bb4fcbc2..a17f0c261fa2 100644 --- a/docs/api/symbol.md +++ b/docs/api/symbol.md @@ -9,7 +9,7 @@ Create a symbol that groups symbols together *source:* -[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/symbol.jl#L77) +[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L77) --- @@ -18,7 +18,16 @@ Create a symbol that groups symbols together Create a symbolic variable with the given name *source:* -[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/symbol.jl#L70) +[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L70) + +--- + + +#### from_json(repr::AbstractString, ::Type{MXNet.mx.Symbol}) +Load Symbol from a JSON string representation. + +*source:* +[MXNet/src/symbol.jl:240](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L240) --- @@ -27,7 +36,7 @@ Create a symbolic variable with the given name Get a new grouped symbol whose output contains all the internal outputs of this symbol. 
*source:* -[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/symbol.jl#L63) +[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L63) --- @@ -42,5 +51,23 @@ Most operators do not have Auxiliary states. *source:* -[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/d738fba18ebf731bf4f7306d81056fc63357810a/src/symbol.jl#L58) +[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L58) + +--- + + +#### load(filename::AbstractString, ::Type{MXNet.mx.Symbol}) +Load Symbol from a JSON file. + +*source:* +[MXNet/src/symbol.jl:247](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L247) + +--- + + +#### to_json(self::MXNet.mx.Symbol) +Save Symbol into a JSON string + +*source:* +[MXNet/src/symbol.jl:233](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L233) diff --git a/src/model.jl b/src/model.jl index 6cc7097b28ce..da9f995f3707 100644 --- a/src/model.jl +++ b/src/model.jl @@ -48,9 +48,10 @@ weights. * `self`: the model to be initialized * `initializer`: an `AbstractInitializer` +* `overwrite`: keyword argument, force initialization even when weights already exists * `input_shapes`: the shape of all data and label inputs to this model, given as keyword arguments. """ -function init_model(self :: FeedForward, initializer :: AbstractInitializer; input_shapes...) +function init_model(self :: FeedForward, initializer :: AbstractInitializer; overwrite::Bool=false, input_shapes...) 
# all arg names, including data, label, and parameters arg_names = list_arguments(self.arch) @@ -59,28 +60,37 @@ function init_model(self :: FeedForward, initializer :: AbstractInitializer; inp param_names = setdiff(arg_names, input_names) aux_names = list_auxiliary_states(self.arch) + arg_defined = true + aux_defined = true + arg_shapes, out_shapes, aux_shapes = infer_shape(self.arch; input_shapes...) if !isdefined(self, :arg_params) param_name_shapes = filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) self.arg_params = Dict([name => empty(shape) for (name,shape) in param_name_shapes]) + arg_defined = false end if !isdefined(self, :aux_params) self.aux_params = Dict([name => empty(shape) for (name,shape) in zip(aux_names,aux_shapes)]) + aux_defined = false end # initialize the contents of the parameters - for (k,v) in self.arg_params - initializer(k, v) + if !arg_defined || overwrite + for (k,v) in self.arg_params + initializer(k, v) + end end - for (k,v) in self.aux_params - initializer(k, v) + if !aux_defined || overwrite + for (k,v) in self.aux_params + initializer(k, v) + end end return (arg_names, param_names, aux_names) end -function _init_model(self :: FeedForward, data :: AbstractDataProvider, initializer :: AbstractInitializer) - init_model(self, initializer; [provide_data(data)..., provide_label(data)...]...) +function _init_model(self :: FeedForward, data :: AbstractDataProvider, initializer :: AbstractInitializer, overwrite :: Bool) + init_model(self, initializer; overwrite=overwrite, [provide_data(data)..., provide_label(data)...]...) 
end function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) @@ -113,6 +123,7 @@ end eval_data :: Union{Void, AbstractDataProvider} = nothing, eval_metric :: AbstractEvalMetric = Accuracy(), kvstore :: Union{Base.Symbol, KVStore} = :local, + force_init :: Bool = false, callbacks :: Vector{AbstractCallback} = AbstractCallback[], ) @@ -190,7 +201,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # initialize parameters info("Initializing parameters...") - arg_names, param_names, aux_names = _init_model(self, data, opts.initializer) + arg_names, param_names, aux_names = _init_model(self, data, opts.initializer, opts.force_init) # setup kvstore kvstore = opts.kvstore @@ -388,3 +399,43 @@ function save_checkpoint(sym :: Symbol, arg_params :: Dict{Base.Symbol, NDArray} info("Saved checkpoint to '$save_filename'") end +function load_checkpoint(prefix :: AbstractString, epoch :: Int) + arch = load("$prefix-symbol.json", Symbol) + saved_dict = load(format("{1}-{2:04d}.params", prefix, epoch), NDArray) + arg_params = Dict{Base.Symbol, NDArray}() + aux_params = Dict{Base.Symbol, NDArray}() + for (k,v) in saved_dict + tp, name = split(string(k), ':') + name = symbol(name) + if tp == "arg" + arg_params[name] = v + else + aux_params[name] = v + end + end + + return (arch, arg_params, aux_params) +end + +function load_checkpoint(prefix :: AbstractString, epoch :: Int, ::Type{FeedForward}) + arch, arg_params, aux_params = load_checkpoint(prefix, epoch) + model = FeedForward(arch) + model.arg_params = arg_params + model.aux_params = aux_params + return model +end + +function load_checkpoint(self :: FeedForward, prefix :: AbstractString, epoch :: Int; overwrite :: Bool = true) + if isdefined(self, :arg_params) && isdefined(self, :aux_params) && !overwrite + info("model weights already exists, skip loading... 
(call with overwrite=true if needed)") + return self + end + + arch, arg_params, aux_params = load_checkpoint(prefix, epoch) + # TODO: is there better way to compare two symbols + @assert(to_json(self.arch) == to_json(arch), "Cannot load from a checkpoint with different network architecture") + self.arg_params = arg_params + self.aux_params = aux_params + return self +end + From f8a01bfaaef934be49eca2ed18f13c4bf1df7f2c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Oct 2015 16:44:40 -0400 Subject: [PATCH 128/630] allow callbacks in predict --- examples/mnist/mlp.jl | 3 +-- src/model.jl | 30 ++++++++++++++++++++++++------ 2 files changed, 25 insertions(+), 8 deletions(-) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 0834739467e9..6e40c00b6b15 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -38,8 +38,7 @@ mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) #-------------------------------------------------------------------------------- # Optional, demonstration of the predict API -outputs = mx.predict(model, eval_provider) -probs = outputs[1] +probs = mx.predict(model, eval_provider) # collect all labels from eval data labels = Array[] diff --git a/src/model.jl b/src/model.jl index da9f995f3707..80ee36d10674 100644 --- a/src/model.jl +++ b/src/model.jl @@ -158,7 +158,10 @@ function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_sha end end -function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=false) +function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = false) + predict(self, data; overwrite = overwrite, callback=callback) +end +function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=false, callback::Union{Function,Void}=nothing) data_shapes = provide_data(data) data_names = [x[1] for x in data_shapes] _setup_predictor(self, overwrite; data_shapes...) 
@@ -169,21 +172,36 @@ function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::B for batch in data load_data!(batch, data_arrays) forward(self.pred_exec, is_train=false) - for (o_list, o_nd) in zip(output_list, self.pred_exec.outputs) - push!(o_list, copy(slice(o_nd, 1:batch_size-get_pad(batch)))) + if isa(callback, Void) + # no callback, accumulate the data and return at the end + for (o_list, o_nd) in zip(output_list, self.pred_exec.outputs) + push!(o_list, copy(slice(o_nd, 1:batch_size-get_pad(batch)))) + end + else + callback(self.pred_exec.outputs) end end + if !isa(callback, Void) + # callback exists, do not accumulate data + return nothing + end + if isempty(output_list) # maybe model does not have outputs - return Array{MX_float}[] + return nothing end if isempty(output_list[1]) - # model has outputs, but maybe data provider is empty - return output_list + # maybe no output because data is empty + return length(output_list) == 1 ? output_list[1] : output_list end + # concatenate along mini-batches output_arrays = [cat(ndims(x[1]), x...) 
for x in output_list] + if length(output_arrays) == 1 + # only 1 output, return it directly, instead of a list + output_arrays = output_arrays[1] + end return output_arrays end From 0f632cc2e9aab4428635394832e422ecf5d43a57 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Oct 2015 16:45:54 -0400 Subject: [PATCH 129/630] add pretrained Inception model --- .gitignore | 1 + models/Inception/.gitignore | 2 ++ models/Inception/get.sh | 4 ++++ 3 files changed, 7 insertions(+) create mode 100644 models/Inception/.gitignore create mode 100755 models/Inception/get.sh diff --git a/.gitignore b/.gitignore index 5660a75bb89b..22b57c756f2f 100644 --- a/.gitignore +++ b/.gitignore @@ -1,6 +1,7 @@ *.jl.cov *.jl.*.cov *.jl.mem +*.pyc data deps/src deps/usr diff --git a/models/Inception/.gitignore b/models/Inception/.gitignore new file mode 100644 index 000000000000..3eabb6e80247 --- /dev/null +++ b/models/Inception/.gitignore @@ -0,0 +1,2 @@ +Inception +Inception.zip diff --git a/models/Inception/get.sh b/models/Inception/get.sh new file mode 100755 index 000000000000..392403a82703 --- /dev/null +++ b/models/Inception/get.sh @@ -0,0 +1,4 @@ +#!/bin/bash + +wget -c http://webdocs.cs.ualberta.ca/~bx3/data/Inception.zip +unzip Inception.zip From 5bcd859229fb67eb26a688d54d3742744d2e37c9 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Oct 2015 16:47:16 -0400 Subject: [PATCH 130/630] add example using pre-trained model to do prediction. 
--- .gitignore | 1 + .../Prediction with Pre-trained Model.ipynb | 233 ++++++++++++++++++ .../ijulia-pretrained-predict/cat.png | Bin 0 -> 123126 bytes .../ijulia-pretrained-predict/imagehelper.py | 29 +++ 4 files changed, 263 insertions(+) create mode 100644 examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb create mode 100644 examples/imagenet/ijulia-pretrained-predict/cat.png create mode 100644 examples/imagenet/ijulia-pretrained-predict/imagehelper.py diff --git a/.gitignore b/.gitignore index 22b57c756f2f..503353f37bd0 100644 --- a/.gitignore +++ b/.gitignore @@ -2,6 +2,7 @@ *.jl.*.cov *.jl.mem *.pyc +.ipynb_checkpoints data deps/src deps/usr diff --git a/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb b/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb new file mode 100644 index 000000000000..5359f41b299e --- /dev/null +++ b/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb @@ -0,0 +1,233 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Using Pretrained Inception-BatchNorm Network\n", + "\n", + "In this example we will show how to use a pretrained *Inception-BatchNorm* Network. This network is described in the paper\n", + "\n", + "> Ioffe, Sergey, and Christian Szegedy. \"Batch normalization: Accelerating deep network training by reducing internal covariate shift.\" arXiv preprint arXiv:1502.03167 (2015).\n", + "\n", + "The pre-trained Inception-BatchNorm network is able to be downloaded from [this link](http://webdocs.cs.ualberta.ca/~bx3/data/Inception.zip). Run the script `get.sh` in `models/Inception/` will download and unpack it automatically." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Let us first load and display the demo image (try to use other images you like). You will need to install `Images.jl` and `Colors.jl` to load the image." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "RGB4 Images.Image with:\n", + " data: 256x256 Array{ColorTypes.RGB4{FixedPointNumbers.UfixedBase{UInt8,8}},2}\n", + " properties:\n", + " imagedescription: \n", + " spatialorder: x y\n", + " pixelspacing: 1 1" + ] + }, + "execution_count": 1, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "using Images, Colors\n", + "img = imread(\"cat.png\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now let us do some preprocessing. The most important thing is to resize image to 224x224 that the pre-trained neural network model expect. However, since `Images.jl` does not have a `imresize` function yet, we will call Python to do the preprocessing. The helper function is defined in `imagehelper.py` under the same directory." + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Image resized to (224,224,3)\n", + "('Original Image Shape: ', (256, 256, 3))\n" + ] + } + ], + "source": [ + "img = convert(Array, separate(convert(Image{RGB}, img)))\n", + "using PyCall\n", + "unshift!(PyVector(pyimport(\"sys\")[\"path\"]), \"\")\n", + "@pyimport imagehelper as helper\n", + "\n", + "img = helper.PreprocessImage(img)\n", + "# transform from Python row-major to Julia column-major\n", + "img = permutedims(img, [3,2,1])\n", + "println(\"Image resized to $(size(img))\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The last thing we need to do to prepare the image is to subtract it from the mean. The mean image is computed on the training set, and it comes with the pre-trained model archive." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Image prepared!\n" + ] + } + ], + "source": [ + "using MXNet\n", + "\n", + "model_dir = joinpath(Pkg.dir(\"MXNet\"), \"models/Inception/Inception/\")\n", + "mean_file = joinpath(model_dir, \"mean_224.nd\")\n", + "mean_arr = mx.load(mean_file, mx.NDArray)[:mean_img]\n", + "\n", + "img = img - copy(mean_arr)\n", + "img = reshape(img, 224, 224, 3, 1) # add a mini-batch dim\n", + "println(\"Image prepared!\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now we can load the pre-trained model, via the `load_checkpoint` function." + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Model loaded\n" + ] + } + ], + "source": [ + "model_prefix = joinpath(model_dir, \"Inception_BN\")\n", + "model_epoch = 39\n", + "model = mx.load_checkpoint(model_prefix, model_epoch, mx.FeedForward)\n", + "println(\"Model loaded\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "With the loaded model, we can do prediction by wrapping the image with a `ArrayDataProvider`. The output is a 1000-way vector giving the predicted probability of each class. The class names are read from `synset.txt`, and we show the class name with the maximum probability." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Egyptian cat\n" + ] + } + ], + "source": [ + "pred = mx.predict(model, mx.ArrayDataProvider(img))\n", + "classes = open(joinpath(model_dir, \"synset.txt\")) do s \n", + " map(x -> replace(strip(x), r\"^n[0-9]+ \", \"\"), readlines(s))\n", + "end\n", + "println(classes[indmax(pred)])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can also show easily the top-5 classes and the associated probabilities." + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + " Egyptian cat w.p. 0.415571\n", + " tabby, tabby cat w.p. 0.230575\n", + " lynx, catamount w.p. 0.153771\n", + " tiger cat w.p. 0.129155\n", + " Persian cat w.p. 0.053005\n" + ] + } + ], + "source": [ + "K = 5\n", + "n_best = sortperm(vec(pred), rev=true)[1:K]\n", + "best_probs = pred[n_best]\n", + "best_labels = classes[n_best]\n", + "\n", + "for (l,p) in zip(best_labels, best_probs)\n", + " println(mx.format(\"{1:>18} w.p. 
{2:4f}\", l, p))\n", + "end" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Julia 0.4.0", + "language": "julia", + "name": "julia-0.4" + }, + "language_info": { + "file_extension": ".jl", + "mimetype": "application/julia", + "name": "julia", + "version": "0.4.0" + } + }, + "nbformat": 4, + "nbformat_minor": 0 +} diff --git a/examples/imagenet/ijulia-pretrained-predict/cat.png b/examples/imagenet/ijulia-pretrained-predict/cat.png new file mode 100644 index 0000000000000000000000000000000000000000..5f681ec7e99cfbca148cb89547f53f13e0eeffc8 GIT binary patch literal 123126 zcmWifcRX9)8^=*vv_))MMT|zORlD|z6_k+JqqSNisM@ zO??$b#il5Je&_yi?l^y(*FE?7oX_(<_r#ez*1gHd%Sc5AygOtKk_?D(=S_6=|eQ&LDPn3R`nt_X?Na+=e1RH07AE< zfB9??Y)AxrZrhLF)GXhPSlBBC3#fTq3K?_;_eE9KO7&esQk!uDkbZK^g0 zV1QddD~grN0>Md@4Apz@#d*bQnU-B$(29|B<6>(+9pZ{+MMRZtCPRlSWvApu49nH2 zYk;v16^z;(FRq&o{0MD$uu?c^WbR?G<#WBhKf%wN5SM`!L5asCK!QHg*>@(Qhxh66 z9k;nssIv7qY4C|qiHy)F%?eHPx2uysc@Xe2hV;S|C{YtZ?PpwLnF|&3BP|@oP(8DziA;R^(b~bXKbl$#1lqKkJY;7N~k~9%I)*ocAmxeZyOI*^* z8G^D`aHqF6>ptIevYQBA54X=zsgUw`q-*~rwFV81Pa5qXeu8F$SaXOy`7{?lKr18Q zDTifg9MvrP8V%<}3s|umvm-$44D5P9jjp zK7zE9QNqQHr*|P>^eyGW%5rRDNm&`*{_WtPo)f0wDt$_7ZR9E%`cOy*qD`w`1Eirk z-d!r^F)_)O{nN-W;E0LB#?b0Qu3o3r#y}AHtlEWOX}!0xIoeD#;Zg`m;_avU0b z@|`|OR#z_ps;dDh5HEyW-#+^#RbeR(6ss{Dz~j~3ehpbr6%+=wxYscXQ*+it{w@@Y z#&eilbpx6L1c6b`wb8YN8hS2QsUc|#-JAUie{QcP?TL6(9+NWmhTnaul=lc9jR<`7 zE{RZ%CGIH`?^{l6oP>2uHkG76*JMBTvQPTG>pN&ICVf{oPtSiwo6ks%5|4^bGtCTL z%1>iNX^7sZ;if^jb1<0DMqR;ha8U8ypo*TxiP=oZm0PCKy%Gkj;rcigKH5pkIhz-A zr5E8pW?7`MF4LvaimAJzQfTU0%MbK%*oz5C(qf%xszRjNUYt(|r zovT^zNE>`g)hkM|US=O)rvVOAnWPN!#;LnW?u@d~Q;9GPfXZsPF@XKqg+uNSWd9U) z!8DN=s91qmaRc^QN->@)`sx768E7DdHW7f|RM*zl5If$r<{AK_o_KO0n#eP@L{mCH z(GTG8ami7qkE@fuLBP~FM=&lMH6GDchW5E|!kCJsYW_&*7f+*`k&ydTZvqlII*mcl zg6KTdUDF6-w9e0;Yh`4YfUneMJ$qhk@$e_L#EZY?onAhZ(u3Rkl;Cjbq~_ReBizcP zdGg$xTc=eC>8X9@(k4vw4cyyW-!Mg6f-7-)wz<K{iLepB3a5$9fuJQQh5>a9eG#4)5Bw5e=q^_-BE=y2z73@(c$8^8Nfg&J 
z$RG{%ZPUZub%0hqyZGVZv9kvN(>Q2dYX>_gAnMncm;GE0JDLh?A`*(F(*RbWchkw~ zvr6zf$PKGC4O0vV{(?fvXAXqZB*MpOAjPlrT}4zFP3==fqG^}83Gf>883V<22sqDKu=RBz|lYKh|eC65W6A{ z{|0;Z!9oyMCBRW>o3#Crm*kvfI$>|)e(5a&1znf5x`6ubar z9Bicr5R`fvr#>DO{KQ&Mz{XpQ4y1>GIZ0AyWMoU3$`tEUFFr_f8E5CnC+WHg*$m0{ za)W-oJyJVg59v^?jy;~7G%mH6Vmb>7T;Fq!Un_tWWZ>(@@q^b^^e2iPn#-%rR;=K1 z2kDPHWK3geTFAXJCf&^@Q9s<5Dt2-JOd$HFz0>3a}svL0TA9c{&>I z>MVRzT0Tnq0H{u*2RDyf^Q*xZot%7#$HZ}|xPX|5ChjXlm3G}FQHh3rvZ+^dN zrAd*!D}ALWtFBi5A#FBRxPm^^P1(|9d|K&7i5?(zo66Em)MTo`0wFm76co*m%Xi)? zlX~aIEtG=82o_??8vL%MU@4tP)^n}zeub%i_})fLx4O5<;>05IpCsfci>r{AUIZ*n zElt3yw~rtgDRoy2K8@Ix06FYGAMmCOn8DUGD+*y&OAYFuB$e@V;3`l3`bjw zU@AqeD~GeNnW6H`FvL;6VJaqVBRz z-nxMYr-XK=!^U`V9uklhj=gp&(KJECm$SB-@0CYp#(x(dZp}q{C=v^e(jK;2jDiP` zO|Mv#u@@^lwCb~@7>1}9Sn1L945C2pCG5YXhGFyUT=# zVFZC!sp_bb-hL~ri_vO=URNaU>ikjgKLdkJL5Yd~6$;X_JjZL^X9R)FS!q*wqRaFs zPI$Nu2Q=mhoeABmhaNM%$7$&qG}Z*kflu;%c81@%Sw`L zIWHRMXlGP>q-y2iUV;Yz04%}O2u5tDgZJ!)mkWm_k3OtyfT@Z_)DhZvr!K#d!9C)@ zpRaS7`wduphy{Y+umZtNGoo}0SQkw)eV$;#-NiXzCPRirClQ2r6!>URy}WD@6V3j> z3S(79FJR>fYGrx)Tc5ix{%g6BOWgOp$1$O?YzA_ zQ3bwwFTNK7ey@m0+lK~v7J^TIr2Jy}@=)+Dloj`NTv8vYTKVWD~JvgA?b~r&^Mw0YexTeH-w4tI5D)};>oeHQ-YBmWN z9XPX&I~%5Sw6fESS^@B;w@`%uyGcXQd+CX8j!@GK01P86#(JgLidxS_VZ0v<$#51( zCr_(_YU+#%?OZ5BpHC{IT@Ht2zZnB4-7tG>KeZoVO_7|p=Rf*LH-Fr^W7kMfx| zt`0~Wlaj>CNHS{dhNJQC-h_T=xdCl4Ji1v<hnsVz&cTNnO%m~-06|L*KwKejG-6&4qc96l9V{-W z)#5gD%fu)7NtBisVeYy-k5i8?jQ?rko91rKeW!2pzi0NVGPcg~wJk{-0TE$YFJ5$2 zwFDzwtsyzMCI(bL;0w};nrTKe<-KoD`sTc^O!X zdh)gN_{#5>-UeFt3}yW#>&vkwqzbpU6DtYeO8<`Dke13@O&ggrC%X}1hAg%GF8xg9 z+Bf6Otv90R6RcQ1kGWxgSL=7}a~6ne{faP8sL zXlDAMD5-MVxr4mNv$5Bd>tQouzmNPVYn)%1?3dG0VpwN3>5svE+!t0sMNtQ|R%0l1${v{KrKy-QM+ZGxgrX*p} z?tT=zdeB$BHLpylb+r2hl=&6&f=>M1)e>0oSagp1=Bbi^v=*YA7Yl59^B7CZs98{Q zt=N*4-n>Iy5c+#w!nfJN23mo>Y%*`6z zKTC`B_)u|tI=l*DaZH0}GF}&2)O@Nh`pKsNg=qEuETzW){BS$wNxm}xRX60TwB~7M z<{>gXyl*H7gUdQ}nA~YZ0^V?o6w_svI{%OfOQA~9V$~!mtaU3 zb#o8T2}{^JZYNyvgQi0JQT>&0Ck8#^Bb0uRC~2xF6t`PbB&#Bhw6@-OSMtXI`BLSm zUDKmQ%- 
za7y7nU)##7=C?KUVZ-4J2BT_VW9pnSc%UPuOhfKoVNJJZPD&Orjy`IzNVALwrZ1@R z2N9ST@4m%W94AIo=$AYU@Q7~92r`EjzvV7|W#3T9p=(Z!{9QPlxi(w?6jOQFD&s~l z!W+@ra|7zCDsNzd=fc9Rn@dag_Fe{Iq8sCL?lzm2uJpp}Jb^{Stz{zB;fI=;8R=J_ z+_O6xZ^|(jtZ0|AM6;?_ux7m0iDpHx<|eJPivpdUe~X7pfgm9bKH%i za9mn=ZrCl~d0{P60eWEwNVa!7+z`cRuJQcIDhg7RrsK)OnVP{qZX9u94?!Sk$B)vK|rQS>YUkd;{gGk#4blEkVR?C;TrqW9D*A%O_EgXBvl{X% z=p-}_8klB_GcFZ3Ofabp%^%`l_kgIi_g$QwG3>fqds%kh_FX$ zk(POR-)8m>c7yEX7n(}Hlw~BOS{mHGq4&0Gu0*b}V5A2bs}Qrovp*IzwIXJXaB)r0 zWGGO=f6U`%1F;A->%pr%?E!+V4aeV0raW`YYkF178MPbA(FH~XydL{)!~2|;uVF8=eI7l<=DaCK!NP+R`i_i7dS< z?$k!CE?0XOl_t23s#Z*klQ*P(fV?FmU@W@H4)D zo9ZsJ@QvcDTA!PFJuu0`yL$Ol{q`~4TKS^WkXB2s&B8>2S=XU-X>Oh5t0~&3N2!&AKspYgFV;%8Lu}T4ER(L0-mHx!1z2X1d|Nq?;t7D6CRxnP z%+gMScxg*uu^Ud@ipJez4YP=~0s$T91!@+|)&4hZH`d14)(S+lm_;Low{`ZrDfz228W!38|6PvN0NMab@LCbw18d7J`D^;Z4E0A#CY#2bFq7IjA^2 zS+gS)Y8Xwctv{rv|0>=h0en>X%2wqyk6X%sb)34G>mPTcQz?B5BtE^->+Jh}dLEY0 zIDZ#`K%mv(UuhlX4!qnQ2_t4((o-gMjw~XEX^Ule)jc0;>vR{udxgg1hk0YJ7`bNG zcPXYKgy!zgncbtMu6Cv65cf&*AuwMI^ytp_k3%SO=SXgAqgOw13QNXv?Duj1~Ds zafrj7#x!lfKtBq?0Cr&1WTXS5G)1M^VqQZKl<4o8>ITGAgcX)?@qDK=3Y6&BBwCZE zQ)U8B=uHFCo0sPd6cyW4Sq%eTlpn1g{96=Hw({`OqIVNV7kd)xWWT@lKpoDIHj)=2 zLPB3!hp63tEI(8+m6X~)h`e(3H`4argI`TqbP@u5Iryuo;bQlubM!*qKKm{bs9gN$ z?ZdB59-`r1o8L`Mjfy{17}c|`q>AXlH9vsgo^q!l?1g4wJTV}Lz^_wq2n1?kbMhnO55*NFH7d>5n_teg}F8)OReWP~zX5skU;aq; zZI9@EwwQO`tQHn_u{L8|GOwl_{=<5KAsC-u3%Mibz^cw(#`>~Vj}QJzI5WK*?YB{xac$E zM1ehW9H0`8g-w_r)C(4NZtphC+VByTj?& z?+KnIU;(McT8=d#A>E|b1mv78jVzUw!Hq+^ZG+A z(oD6iSx#JzyP0fp84DO=nu@WqVsa(hGZ$#0%jCA{7Wr&k(O7h2cbMY-hej*HJ$M7o z4HhE35p^j`82^4@jj1L;ZE>5!CA%Jvb!hRr6L2u8Eadl6slsbiXPKV=4i`EKDr$Im zea^ZZ|BdmUfeAssE`K^O0KSQQD*MoKeYtEWae_bc>_f6ca@)c`a@XDmwUh3JQ~8Uz z?vvc4WuLGIq37pZT^A$gOKl7b$2J#34kws}fA25;Tx>5%M1~#h+~v>ZhcY0ibF$0y z*6cl_zm(6ct>~1NKvTsF(R3sE$&0xdc3P9kxJVwQZlAo@?suDmT4Aldw5}^9s82 zo&7>r_{$L4xpu`nUdDZGGfNfaM3~F8h`T|;tYhigGaX@I2zVSp|N1`lyQJ9Vs*PGc z=Ch#Cp93dE;rI4{XxZ8xPj?bS;e5zeeI{*z%eU8UcMY5ulwCycF~Uqa#jH$W3C=Kh 
zeofN6wY10F(_^{5X6Z{*_|`IRtO&+0^N9OX&kbDu7)2P}?^FP_y>X zh{vL0XV3f6aCl!JmF*+8?{+x|Jti5Ibhfs1VR@10#t1tNm~ zSpCatGBRSp`{D*8$Ir(puPt8N4MvciUa`*Rk#=ks3Qo^xJu}(H2N{^A5ozFMYWudXM(zr7E%GB;|-5Vn? zkgOKI2o4Xf4G1^W9&1u4GgX=elM#krFAYHY{6Y1}>(>qQ*7C3)YdR^fEAbG9&x3>e zv|#FM1_3aAZHRVHe*>TQZtc(wQ-Tz0p_zBbfs6e~gFrz(>T#=~TpUFcHSC9|b&(oJ zcDx(8^o1KD5?MnBA$+%(WNh>-ZG(HsdM$-l?x1^9`TZml;eLnA=~%M-T@U=t%}>is zM%UPkknA7)?ulXYX;^WgaAA^DP>{Jx(Q5z)&gpAYFeC$bg+s(h9rY^l`{)BXtPug5 zQUr}dL(i5 z6OMaU&eZuP>NVNZjQapY1r)7Byj z_`Dge_RddL^KL~+&9zXpklbM9F(*nQ=LF0x`nz8to_;NP zZoX&heR5VEaXOK!c2Q$DVl>_Ex6wO15S=ql#6$7P2qEZ`k_S1sEf-3)_`a5T(p5{Wa( z^WsD8((K(TY(;_&m^y;U*A(a<=VSFRx<)C6@7FxI|%t|F(b z@o}L}67<#gdqU+k1C)i?+mB;Uo4r*}PDy6IB3QvqdaOf$B*Pip5id`7GYJNnr_W8{kQ;7n-c#+ zBSkYk-C#)Ax~?t9!2v7y(z-ujEe%MMP;zI5qxG~Aw5cbJd7XgTVP9r`y%FCN*(!@J z`#!m_TNJ>I4?ji_!@5XG1z{VUyl0ahcO z@5ARFWbG}tzqP2WsyuDOb-yq#ClRIiTEs{1KGpigp@}dXAKr!Z#?O{!m(xg^ZG=~^ zXnK$hArS3yqoJ?X^2n*yx}AV^v-*}9htrdh+};;TYJAS%=)*SKHag`;JhqJNE>NR?+mR{3m6(r&raU*%YGh`2M zTyjPyI@PqXx4gUm*QZmtw+R~KUdj_=R9peM+BD40pY)NDy8conrG{ot3PxgGa&zcU zl^f@uTrP%cL)4v2p$6h{GG@N~B!_5LtCo7>(7X^EOHU$GpNqn9bD(@5?${?g)Z2C1 zFwmVk;D_iZ@GHGdN6M&iSKvfWcIp$I=q!5eU#<2MmxFk=`)6jo(%>szhR)xoZm~GI z#?ISCBjeBZd&xFWoCyLLWY;!pnjqs$HAz_Tag4iA4v2uI%zOZ+O1;81h#?%;6^+T( zL^dzxX0@}GQitl&)sZgGeBw(i6qD?q%cTozEILI&Z`d!~Rvp+2==itX96{lav%T23 zI8^)mlyyx(&SZGMWW+4gYC5g~>MCgaE$f9!@-|nCEPh+lwETTU1(7Ls`Cy|Bhtu+w zGbU}ib#^EW$BLv*Y{=FJP&sq`URG7va!1sBN~5x>SaQ93e;~5>oQh2@7T)S%6zkxn)hscK8Ok@a7UADU!sjQ}=q8jnY z;m)i?iYHl+-dGHKI*W7{o9XASs1r5-kzTCDx{?}hGZPya9ZT$R`nYjJ0Zok5oP3Bo zFe*FEw9F1s$EH3!?CJGT3?mM3o3pNWvA1rXKV9^(%sjqiAEismL|3Rje@pc!c(f8b ztvBKQ@87-J!jOjzjorkskJu6|k93z1h}Q(t#>tb1i9ceFJZYJPv}Jjis+lGNRkw0> zX>|~C&Yf@XY~~fx?a0r3wYztGy!OwB&uL~>ccpB*;LEXJO;v}!_tZ*5RYy9|iYe#| z^{akVZKCGpe=^mTcE9rS5p;N(tfmlo+}EdiG2OMdbuqMX+;z6Y99g!v z$vNUqD8H>}6a(V8*Z!x8EKBx)bAJ4w+(zsDObV{A-@HUz8$a7zdvr8VQWZOI9r{@k z?cZtJ>mT~U^z(K9B)ZP*Nj*kt3Fv1~ej$D8==;A#t&tJ{_Q6V{Ii}d|4IIh0y``lk 
z{OshMGEUrFEDOiylAKE|kip?$2P+5is%QHL8}i|6WW87Tzo^pKzN0NQ<;$Yd9(l*1 z05XZMgQnzkFPh}|u2#iFf@_jTvKR5RvcB#@Gmu$&*%l(#wvYN!#s;PN530@3PU&ocPc!W*X+dC`R z%9Q>UFDR8`Bza`DG}hx$Vc5+hus-t9w;|^eHa|Q$8l&9 z;>}ArGXV2pwtc+pV>qO^t& zI1g;2qa0FaR&tZGkO@Dn7ZKA2KPTZfm?9=*6svj6pfzmZORK$lUqqApg7a397Pujv z5sWU^d~CEzZpC8#%c}@tJ*`&tcxbYrG5kZ5C_#TC=jS#TNLTH2c|zTY7)Lfm>MN_F z>H2w%_#Z{FpE-buJW*Kh?E?#c zm!>_`{tft6JwC;gb?fQ2Phgj=`4QjD)jBXA zjpXz!*-!@3%SqSkm`QMrR!0P$x+?Nn=Mhh~H;#|HW%z)*eR&rjmlh9> z&JP1G6;17YBslE>E=2i|{4Ec(lhN}LoCZ#k-q5wUyk5 zE6L_UBHfMZ!}bsvWEo$oAJ6KU+%m3mQ_kUEl$VsXgc2p!KNH#G$grEPVEOvJE2u9}KpSm`?&p3&Y`HrOlE}T37Ey_W@fsY%_ zJL3-r;t9?3rNQ``CHbGrnmA-lO4 zUr`_$DD>Y>w}pJEwox_i)V$DFnePt2>c!tf%I3(w73Pa=hl?K$=NsJ{76hXVBR9u! zUNP*a^*b%cofBwhF@x)dzz<+UF)<#6-tBJU+6Va~18EP!(N(Ps?@l|ihtzn2s3%$U zJ!idD!)CZWG}ij%BLReXNrPv4cH?_ioq_ka4AE1{M@w#5LYd>@(KdKdX+TPBLHxYvgn>P64@Pl93Ta3}u1is|h?!`%Kwj7i*bjwZ& zp?FpfGBc5Sk2myl~#1&~i$KGtwI)T6{NJFP5@7emU%vve3*Cd4 zB?(u2Cj0;UT`{6|{`-9Y1mRzdsca!H zhn%G@F-wdvPxMK2p6sAGD3aixV&akHf?|1A5A&9>2f=)-&)0=IqBN3Qw@=2I=NIPZ znUZ$iWs8mz47KCMpL1y8_WyVgZX)k$h~4@TAW@^Kt%CptM79&~EpL9W`=N(1Kk#C2C}C2bqMC86?Z&NPu&aG(vLU8gt>gB@NfRSIR^PyQNTdXuU> zDB5{^`^5oGkhh%t{x@=#sC5U22zj&pc(Q39VV=w@^u}qt+lW=>c7(dLkr)(TcYO-^&JqvM@<70~LE3NKrU8_|4SAAZ+a29*< zck3Tv;Uw~6BT_QFmFlGn#YY;AivM&F!+w=_)~Pu%R)pn$OXi+mmcA=@Y4VD&DB;ePbMe&Nz@% zz(rkt8T5*bG$zeCD1m@i2CE3EwC_%76^wf3e2bmRDZuFraBom_NYh24cW`C5j*hQH zIpc~XrdQ=g=1y*uBxjD;>Nb=gv>4CGjMRsgfg>FA4N^5LJ^T*IghnyDxT@^dI}K*e z&aK`ybU^ox-j4~jNY&q2S)#wsV-P;%VkQD02T#XUdpi{*$=$nYkS}D z%!ENNL@!o$PQRwmQPCe~vqelIh}tfXPuLSn#mFr{n3Q?mvpsx2;aPp%H?gnP6%zqW zv3ItrMn>wj|N4iAc@HK#bTEt~!;dI)%$vo)3UIucefG~U_+1_dnw6Z(T&>FAoK>!% zlgOOBB{4E$>&hv-H$FEvldNWyw3ocJ6KHmKc!H>=E|uE0BmAq~9=5eO+jK)$b?Box zt#Z(uIiJY)*Y`ZbclpnHvd(0NhV$E?KMPyAUM0Ljz2D_(y9)}`*?f>gHm%+LVUrc{ zDSGbYmQAKytM?tm3sndHyuS9ywU4v6nPfs!g*z-KJk@is=lj)>MHy6;Q)`E=_DST^ zG3z`8?t6$%VlC5%|C`e$q>%J*1`F){N?ZwxLF4?&QkZ4Qk_=zgvhcL_4Sb1pLDrs& zU0zs_?a;(#aOK3yw?ct^oX!XeCp`=Rb9ydwfbKg8%(@p|lN 
z5&yG|v`*;2W`%{|SJ%KbhYL#J`LDjNqvK<(yyVsC*EY+O|4qf;u~u-0dvbqhx;b%E zXy_ie8)TNX_T8n*)pjKY{ng!_B~jB=<2l|Hn(CJOXmcM(A~VMpAC(wo;kwUuTyvB0 zg>O}7F41RvH1;*^7|2=pdQHh0<)M-MHI-o&4D-z0h3e#s&7Y?m%X6_3dAYgs9gz_s zn)R(-OUJuD!6)04dz@;gf25JS$8G#7mC44pnRik+Oz2`{=na%#Po(-S$SG8B6MUGw zavsCo&0oRN43&0+NQjo&G@*N=l5%s%FHOjJp8^m<{izTfQi;Xx&!5hg&f9Esc;vyI zw=mFtGDNYF%cazM&DS<_*(aM*s9U8&Kv+9+WkPM*&g1{aCaJzwKdw>k$8ff6ljPgv z`%N!8yk;hwP?fJ`H;sr5Mu~O-US!`#cd}e^SLXwH-{!Cgg%LJf+H7;1JjPsS);Ih; zvpjmEo{I$v@%`~kW-Tn>{_J02NY203E9>Z_C@rO8WL=U_dovlT4YAH3kL5gPODE%e zS2Y`56o~0YQNTrN%RD&_W0Ashw}Yiej+swkgSqF z$ln=snmM~a_v6u(yfOVybVGS#3)W~lpdik)!01%Q#+!VqY|P#ioK})PUc{^Znae|+ zgLM!M+<$_!qU@iqz|SZuorf)9XV+j`cNUJX(aKyW`{%apmnGn*N_PJ)wn_YFy>K=y z(VpC=7IIPQkTldn^P3j0%wqC~H$aM2Ober;(z~~P9o(S9AwH-vZMzBDdzyAf33%X}|u%}3d2&zV@c(O^iL&0HE&`b^KzFs5&9v2hdq zAh^};q~LAu3u3G`GLGy~RyrXgZZUr`O^#<9n!S4#rs|z7P^I>7fi@NiP=25gF z;1>s+pg9OgI(l!KF!efQ=*522uDDQJI`pn(^&gm`- z=sHJ!rgcg62AGw{ws}MD0cC@8BGqG=6A&i(X8K@-3V-BwW1)%KH|H6`WiWt`#&k36 zpzm@cB5!TgMyq{wF1GD`n4*zAPeyyE>>EgkWP8eVIq5zo0oXLCm)a*Ge=XZ z9HyeCqNc2(mN?`i5e0so*YH7x@@p1Q(Gbwy#!*9GeNzPC+fv1B%>Q7uK6#OHhr7b! 
z^(i}tI!g>U3}6Zo5PFsQYLeBy7I7oFmMtSdSHoR$$Y!abLGy{TNd1>#kRFSKxzO^W zrrk+xyxiy8yX#sF(WgP3p7~AMv*DE%1zJ)SKt{5cap}^|?~UmaF<@gH`V=+Z7xE$* zFZsBdNkt+rY_%OrPB?BaS_} zZ20ySru6y7BQmXtq_!3`#8zS^fbW%Xfrz0dEsJ35H0Pb9?Wdm_3`d#zKUO}wA1vFI zIMaRm7r%BMKUFRKEsoe2wejf5pm%MUqFs#JJM_C)+3f!}$N!Ic zVsMXM;@UlsVY)MeDF=(|*C&;k7G&$jt2$5q=uRg$Z~k?!ebc~0sE~bXRxjEbD){7< z(A!%|)QEb~ORQGTSk%~3@yZ%m7c3=$S@YEJh1<3n{Q#52+3*X=Rv* zQn$ko0Rs=95-FUyv;4p}MxZz4{#d9GcoRKjrgAtlCmEjmee{~;=beAtzKPBJ9oDT8 zJKg+iAsq^HjZI&h?7vg&yE=nUcP9UP)Vq8K}klE0SK)gyjzcXi9a z_ZEK!IvM#OJ3%wxgVl|7%f17@m#90$hWDb-cy=cS{3t*I@;h|>(cFD*`2jb#q24Z) z@U4Z@6A40(?ti?J2dW60dPC3JI}KI$RSbDOxy;EZ&rH&+dv{-8-uy^&WJ~yBZ!U3; zO+>UU_4>fv!-@b!^rpIugY{b7`|=-(nQz>x9Tgi$QPVREsQ!J_)6xF(G&IdeC5-Ib zWI1uPlv}-*QUbP&M)O*Mw0Awy>H`Z!HjSI@J5~3KB8AF^U307nM{X~fmO{tgbh-+b; z5Lbv!Qhx&K3x)smzgvl#>b?Ek^tw#Hp4?0r@AhcEG37R^1mKNxEjcx4KNZ)*Z$hb0 zkXBBNDs;6rbsu%xu_d6L@mor2z zXWYH-^J-^g`RTCNms%n2T{2WTM4a23GQM`p*tpcVE41O*;e3AU;+V?;`jg^!?QmD% z>!Co-+>2Znu#Oqj*P<0r?lczCd9uvw;rYxqFHfj>X{|>5TJb>DJa4UC^AK-x^2CVR z#echDJKX=D6;>sI($N|{mJ`#rhAVHT0_3G6&Yq`49<3-{{G91ppPE;TRR3r@=M1)H z+X&}ef1r6qOmog30Tj*DaK;NEaE~!!U03%p zd~Dn1!y_VMl<%zUEC#9kD`9KGJy033LOc=MSTDY9<8ob}&+B#DwsqaMZ4J-N!97(X zxqFuEve)ZKABeSTz#TpiQFLtX0IK#}7E~1#6sqv01C}g_odQW3h3@X|!*lgfg|Urw zJwL4L;?pm_`fRBfm&-aTQ@X&TDDuURzF3y!XMXOdK0JK+<-4!e@Q9IdHM8UKe%(AX zu1`;yp~BF1eteLUoZ5DN(7GJ$?$f{aYyb4W{3n0%!$19*uYE7wAI=|U$kZm){mJZ+ zGCO5I$=x?1*L4lA?Yic;#_;qMqBsIupO@Ry{bUW?hk?z7$!|E4tu#I83c2vY@)_?1kGH;nlU1eUJ7rim=+$tTodD133wMnN5c! 
z36yRe2&6{@RW1dSvY-@3$x1S*&*!r=Va0CZm^C(E$F`+!8BqbD?$$AT_>zw#HL9Vm zmGDt71r>{cE3m9OD^ThdyQH z;pWZb(}$05C-=NuF&@7^;~W3;fA1f?dwihR<>}nC1w_r~nnOU(@JwMOA}ednvF9A- zJQ-0@Xp>Py;_BRx=@}{=KyGVZu8;Yy&V$C1FQ>zN|LXPq{rzk< zkSoC)T^f{!p}+C!v;Xl&Kfk^o@1HLK1G-EzRHYe`SrFrFizcX&EVwF#RDmYTumOnG z6*%^}wdFY9U1A%)PC}Zj;X$IHR$|PR(!eEn@zt~%_uz!(c4-F{&8b;40TOI`@S<3c zs0>kQyO$VHO+?jdkI^V=O*1oxuaRp!+ms~lZEidwEGCYp80X_>+V=K@W3euv%Fw zNt9DnDn_jClCI@L!F3HbQ==S6n=uv72e~baV5?R}bs>{@1?# z+2>!q8zET9E^l7F2IP8K57Xi4>3vKS10ODrtnvQ+`!}y%1Gzpt&7Xhy5B|Y_@cEzp z+5i6k^`9*F%M$i(dz#cz*hOniP*qrKz&XYktF2?5w9iYoR+VEq@%;S0S*i6t%XoVCYx0-A_RU{@^~ukiK05pJ zyYqu5yB?-4kXBVOythTs6r_XFfXW#fiFipXoZPV1W zHS;PaeLS9h1*hElvt*a6No&*Gg(c`+sK|;T#$@COEpL5XR{*LlV=Yuu+Wo6r5sWc1 z(`c14qJR|HN(6wJsA@)4Ya&v)M#QL$eVdmEL=+J5lYmt~QB}#vjLj1$fkZ`-Y{tlh zW+t<0x6V%@OH@Zzg#ePiWg=;ns0vj@1fZoUFOibP8ik9dL=`nrgFy;{n~O?>=s>FY zR09KG#I|1AEM01>PnYM1OcbNwVk(vHUL~s2n>RO?^ZM}gczb&~Z(}+hPlqFb%jNR= z_07%Qtv%fQ_y>Rb(d#z~T+jaS;d!xXzPr0*@kf7h`|Y3m&ENQ+{HOoo|6#}5KY2JW zH^;6q(xrGi&qeugUb8$QERpoL^8xcrthYD!HU;=W7prR4D9=%0NUX8?x*=I<5v~of zo-?n3LXl+yS$kB(`q*(u$o)t6@BGVo^}qG4U;lgG{FOV_ho{G<>$L|(${JMK9^TgG zF0}o&Qw14_Xvm_F9OFvS*4uLT3XktwL~iT*%cW8jT$X|d(sB>O#9)?|cp54)nJGE; zxI}3On_pSGYqQBr1#HWZ7LYJly8GBNDa9^ouxQ3crI^U^xJd6KybC?9lpD%vcK`_I z^TV~zi_PgU2u)Pv1zwjX?i8U>m_0Re2OxpU)W7-L-#Z-Vd7Ae?rJqDWk|9y}-@RK-e-K#Dj?ZG>o8!AL1@YX+}7>#;ra3FpM3iM{TGi9 z4{zSQZmn0w<$66FXR|)m=fnNo?c0wJfAMc0&QD)ieKZ}qnF4ox{`hpWxu4fKwkgU9 zMda;q`Sj}_uY9tjfAsdo+L)JqxS6iFl#Ip{T8X%?+Xn1nK_A!a_38P+V+f^0toM^0 zwz0*wX;$}=*xr5lgTMcsU-`$s{2On>o}bQZ4x%K{+eA>MC4^?v;Yey^w5CRGW0T5? 
z!96cg_7o^(@M(M0uKoV?KmEb)eAzF@>A1UwQzc3w1B}W*DU|8%Bg$KCs8!OVH@SOz zTJEjQ(k9`g?9@pFs!bx?BUH6pGiamDeL5ZbvfSLvx27Vy$8?0UWM>X#?s}TtOpi=a zqwY(z6r~u+ip&a#NTlyR9ZawoG4xme{&#wB%QDZ?44@DcfTdzDr(gHP)t@LWDk}q7 zsK`p+oeHXICn)SBrv1xUVC^!01$S*TtF%%n251Qjd$QL{^{8S=MzBzxm5EAZRfbHa z%_v1lQMWE4mXtKwgw`7gYge-%ObInXv7jRnl?GJSsFBBrv zlscauBVw5kx6^4oKOVpLbMt!rZ~ow4zPWw#R_tiYo5SmGAMZ{&J+519`PoOG#26pm zeR%u&{_5v9cgK(49?#D|{LZHzy?XU(QfX6c^#sA5X-}oEHLkS>C6Ks|@pQg0%P3V@ z(6`6C^Yb-5-rn8K+vVxUKmP4s{=5I%zxCTUnp>{d%bJ@{(~i2Uh&hC!)*DKz$`pi3 zF|nWwp*%sOhfx^c1I=xx#bwE{@UOFDHSzQGc(m@8c{xiFWC#)tf}c9 zmknV=A|wl58MWurMMZdKX2l-BzWY}&Rcx1k?*RkUJ-IR=Dh1hPkGpbS@;vbm7IHKwx8yZH()-S!)EstHPK0 z_IzGh_3F6jjDl(_YcJXGBAK;C4EQK-DM$-%IZ#)HOEW#p z3mRmuerRG;5mBTe$nCmmand%^4!s}Sw5X~`*J)26ELLW1=`J;Dgb(+vD%bTw2Bjv` zc~a$~CSXSG7QZxQ6U{`vh!8zIa%4pfU+v{&zoe4WtT&A?uu`E4t=cnc0l=tTX6H5N z_2Q*o5Qb#M00he2(sKV_QMq#*sHFx$K?O8~L?axEYO3%^Fday(J=|airouC`O~y&f zpgPoynqn*^TkK)(0wc4ef{l^{BccK-U5b`fE}jBWlV&Ep9b0RZ6sXdI6`+E>FQ>!t zbUI0!lN`ej$D1Nzi)or3KRn#u-@pC%)7%E6zW--`@vFb`OJD!SxBl$U{^ZsDX=-*j z91cgWHJ+c&cOSlgcl*(AeERL*`|7KN%{RwyFQ-OCj_Kj??vqcy`0&o&d~|QiqV4wW za&3=?f!nv=+%!IY_0134kM3@7d?V|zaV&b+E{FGz?|N`B0l$oEWSu4vZI72Ly~=St zUuNT$>y6-l_V4}nZ~W?CpVsRa4<9aLbsu8=8bc@mLIBfwp0_bnc$jYHCHO1*kpY&rGb%O=0MIe7SU#c04V&Za|k>lFf_XF6kqZ!8ZGZE9*gB%ymu zOb*!_5nt;{QC1nyn=06W%Jg!=RZ6qj)TEa{rO|nqoTJ-E=Rg5&YEy_9OF2}>GPe1<5HXUtbgXzS45J3*~uF_0Q zZJy@SVcWLb+uQJZK0iJ^JoIkw-hK7OkAL{-Ctv&IlaK!G_s^H7_0Rs|&%gUKKlkDB z;dof4xow%(r>C3wkfPi3I(_oVN8kA7wjmvK0dD>)^V-E)cVVeN0!ynPuhECrib)SK}3jD>k`{Q zBG> zbUDPb_<^ljQ)q!2wBun`ZLZB^LOpw|>*l>3tg5O|2~brnkh>KlN!9j3n^vvzuHDN8 zkQB|GU5;>%LII^a6Jb~4LKIcV%7hoRQuej48Oy+kRt3dMM3snDWC(=eRU|VKCFH(@ zOwptbDy4@u*;J|r6QHR@X}RtpP(f;y#TJts9Jy`d>{}*o@8;9t*yaAySD*E!QAKIf zvWFlDV-MSaubzoh#{K<$#K@@o`m}Lc>{po%H+Q!`diS_` zeEXZ<`u@{jJYUyu;Wkdw(+__f%QwaQ-RZ{CZ|^>Re0;pD>o>pt(f5D!{`KvvQ@2>R zo73wS_=68Wx@+^-Z*J~Q{)4~s_x|QLe|Eb*uIG1GY|%RZe?LV}S{sp$e!D zs_L9mr%r#~{@r`+)jiFebBw#mhq({=zNEFJHJ|y6ao@k+bxE=5$nGRXq+4xvkcxz< 
zTPg)2Of{jn=^~$ju;yXm4saT01ZAOMRGq^-NmrwlzN|zspl_?Gnz?WbL}pIv&AlxJ zd@wh2!eH(K0YD|O6Eq++#HNNo;MSU3s7RwGfn8aFM}&ccHgiDXjNlELdaYV#P}j+! znl>|=n?8(yAS85uyt#}gTRdBJW$8P)uc%LERJ_u%%Hi|fS#z=aFWC# z^K@Kq%G=MM?uMP7BI;q1N$H$w3RZTgjf@XnZq==ZbVjPJ>8e}}s)ubZMkS?ub@f%(T1v6#;QZ%5AMZXpe*BfI z7yE~Cuki=2UclT=)-JB{qs?~Jt&UAozdjwt({#K#@82EdkAC%+-oJQO>%%zjrv`Nl zA+UO)Wek#7x_+8#@+hmGDwtLgAy`r*0D;V867|KJvd(278h6uKV zQ=jBia$0*mm^5NW6(ULOv(+#{4YmMaP9jDSMw9{>ToEap4K$3b5dn^&;T3Wrnng5G zW-G`Xewx}L!sb@zT8}oiXyG$BcnzIxF=tO20C`GtP%uZrU5D9;AvqXKZH@@%pk$fZ zs31&cCb#>slxC45yGas47D2>tHd_!V5N<@$mMof?`@;4>1WAb$*kfV0@pX)E@lbL#tBqh3gN<#VORuNL`WP! z%E;)1kz3Pn%#^%hoh{rSU0pnT{OIaz+oeIa!(})0OcFDpj;&!yI*mor@i5moS#ttr z#^dog&8O>^rCDrt+tq6I`t|E>wQ9|5p3K|z@n)4*x1W7__x!~l{}X@m2jBV4byqIe z>+k*K2N|E1evR>pn}c+#b-B5@8Nugy+I3~S8W1sX1wk3hY0j5Je{*wVb=q!L$l1(u zH*7A?F7EuQT|R&GOMmEi`h5TJfKX-|!(g1puInH|x{_C$c%zO651>@YkUdJ@wbnpqu%>7h;1NuW z0gFLhUEAW|Lkf4vOsh;bLnsIaY9yneu647k`J@p&$^;e!oFq#UBX>6xb60~Pqi|4e zZs7{%Eabru#&|?XnZd;nCz!HAwP*&ld26jTYq3Z&Y3bKel1Kh#g7he$(N4T4Ncx&ov&D6{z z$imHy5RypBS(r;Meb*I9Z*0VjNU*3gW9iXgMif{AVZ_L|xMy@3vO21Tqb-^@6azs_ zD9K5Tm>oUXfSd@CoX{BoL0r*{2)h8*iRamdoL@YC{Ot14X0={-!>;TuHs?>uS<=jU&|_2TnSKP{3}`Gi)=a#3^@ue{*wpcYoV=-EOyQtxfYh^sB>h zZ0`3DclY<#j4^a&ZZ(%ua)LS~!b1G~`CF^9mgbk6RXd(G>*4L~S&y_`Z_tFv)+^^Se<`$`}rrKI-g+)?gBqV0ZOTk=-RMl;st(oaE z7x`(Hsx9e4uwaz!`n*0}eIH(htAo|asy6_0QvhQEW)LB7)oMgzaKzwv^Q?kVG;kzW zZ*v{1HEm1d4I`GUAhzbgVwapUMpA&)v$mdB5UF1ZV5kY|z=wWVN>ujbF0tgY-T3h};UwGcJ zI3A*TBgQ1l#hG)?9p}Q*rHq;0q#eQmfY^x^zv!}DK#M>oCU7*6MeZ$2?#HOmC^6KjR;t{%k=bPW`*4^3FWj%}+j~;J!{aN4d zy8Q9=XSrlN?Oz}EoAnvMq_sZWJ>;B*VNmsw%F9<@9QKFJcDp@0pXU1dL-Oeq##C`7A`N`EeA_e$5=goTEcSAu*4HM@V zFJ52?tr(3Jy^ggIw${L-?}u@!bJNmwxhq8IbBj7lO1WQ|R#ydFE@1?L05ML}IF70n zm)SF60F^X6e)iVOwSIU1QO@G6HJuPlgb=W{*|ZU|kPw$J2UXAjqlkozhRgPpkU&A- zER~k)H6Rg)@Dd+D4|Q)5vra9V;Ub4N2M336HxEP!N3UeMY>dJi5c1+N0`OeAoV##b z;Qp;OZ8{z&o!WFfP2)Jv#;dn`rVtQ-XkI;Fsm`0JYE!N5hCyzw)>@k|=uIBQ+|Aw~ zJ{XuVi4;kxOUoWRiR6?d2@sp1`@*xwH`*5B@I~If%nKX{Gbdb@Vi*V*0ggrj#KZ+z 
zAcP2W1dtOtL=YIFrvMC8^8jRA$oSSAakXAQdvbn$HuPOrhBc(fJ%YjM)&6XIadv(d zP51kg-!j-Q3?ly!*lXMzGzi zHk*z$HtQY|4SmrzdbQJd0`~FvFjcQjFVA-4Sa0uc9v=2(wUW|XU~Mx}+`PV?jz<7X zr5uk_$wRAE5(mPomoJZ}!{wu^)vD80A8zk1&d)euP9+N+#v^*1?{=%cpC^6&@^;#f z&%gBkZo8iDr+GSgC^U4_I=N)zlr$ho=}MRTf(YzEu~=mcJ(93wY1(QtCW-KI9JQ&r zGA;Q4U;uMWWp(w=TR*_-A00myp{BEf5iZTvKnC@yHoJN=H4O+976N1x00COuZWLk5 zz80KVgop%e$zU(sAG2uciZG)YS+Fk*=ENk73}(S@VG4^c%*TWvM=`_}<^6+e6VPOJr2XlZo-8S>q>YHmopt)*ou$+mOH1xuoL-YlD z511thGc)Cs6X%?|lq3w72=H=RhrlJ=?M~|E0Z4!m?gl^%L0bprJTV|u&4Pkp~mL&@^a?|=XP<;$yKb!>-`lnw{4)8@(3 zXa*sZS)E7FW~L?4>2&<`)6cBw`PHLvS|ZpWuw8F#(%^i3yEo$Xu=3D_g8y*;&<)*N z&tDu5$Nj_p?)Hwt0ig8VJWn?-zqmNNFo>q}@pyXm`u^GTXYalLKBzwIZ#@*8$7v1+ z?mHBk%u*TpJS5)Y=lH6(rJDGpCfqRJmVmUOfBe z;U^!>pJBMF&a;N9syUcOGZ+coqRwrulUai>TK2<>MFuHgG1_^A;*xYG@Wg^Z;2@L{ zG03?fG6Vqh}aPSsVX zahm6uho?Qdq$Es^5MgfSh`!X)YE`ueuyC)fMl7sJ^Z;F4FhIWG?jsg~MG`5cbg4^O zmisU-J}U(C0AMCT!mfjJl$cCQ5#G9dE#L~Bj#r;Sa zh!hU)A#b!3Ow4^p7iYuy`9)cG)Df}x41HaF<>EaN>Q~(xX|+P6bUf|%54XYsDXBv4 zhE#@>GdPT=gRDwz4d&YB5?!`kEX zvvC@0odDwI?!n!Gu-0~VerDhio+Y17lL60arON`rB$LjMuCDfX_q*L$$;0t<`sm{i zApnuqL(j~geEbP`lw1zSkF5MeixawT1xkA`9P4hgeYECJ@A+ReYn2Gpo_h|jzJOA?2-~Pevk5FS8 zr|EPwovTh&XLEO*!km}_(5khn^VoC-R{#sw>Hrv|5UP!k3$eKg3ZW1HA*ILx0i;Vw ziUEX?IRc#^BEUS%F?3O*5*mf^!lhV@Er>`UjN%?oi+yb*^)rPt%@P z&sKG|M3xA^)y+cPbXKsYHqT(b;N;9L0GI4Tn6(A49?Sb5K~2LWrBq7p(jw-d1#*wF z2n!t`!ot*DAwo@^JP2ZO^8rQhl9dw=R#%JaA&3cB83Z*8imI9dxd5nG0rublR-))2pY$D$TkN6gqNuOdni6aja9F=W)D09_mS_sXknPvA?$5{^Ii<@-m*<=H(~GlUBl4RMKYj6)x61kI`oo{}0f7u6X((5hk6*w1cy13} z?sDoH!0|YHv$iEMSeDB?N-+BD(@ib4bZmti91CVsXYEoVLG#6JF4P$Pt&Qk)ZvyJoImw`x5Vxztuqr&HHu5uWBLNh+yxNsjPj_mrMJ`p4h; zXWxJMeFo9V%(S&}u5)eGT6n9=s~8LsQUuS_6t%`|VQ7$%2twS0mY@L!GO?o@E?sa6 zX9gm64*>);1X2ihAVly8GgkvOYmO%5ohzz(xU(>#5fTO=FhIncYB(|BJkM=z;MV3@ zRcjm7XI?)Y%$o(GlPk2QrfSW+VJI$2w)i&}5Xa_0NM`O!7zkns=$ku4q?Egq7e_lU z!luL`LQFuY=4PQwEmFZ0n}%A18!{jw#F7$Xk3fq0rvGlVB-1^tg#dz)HFRqX=!WRH zXw=@QzyzEvF?M7fb4q#GY_{t}t(rKihj-t94_(@+HZ_e%kM++K>sDX077X 
zP!b?X282K}LID;41aJrR5CmdQUFk|Ti>ft3MF@!NTm@m(6(TV*CVBSsy|&)`wO{=k zpWnV*;mV>yr8=9bs#XsT^Z<8g;h zkfR1V1t4Wab2I=z1we9)a3$*t_Dt-KXo{GEfPerCVp=fkD3nu|B!gM28qwydYPA42 zRrfF(dHZ}tNZMLxxQ8}x&BDkXOu^j{B_d31sUwCi$Z2S*0pY%6nt>c3mbEeEk{6Vj zh)9yfAJfzql8LKnb63^5X>$(@Ty%;H8fj5gAsDsh(L&?w%W#NIvrax zZ3Z60&^a}*`Mvi)c>es^=U;rdKU^<^GDduT_j!AD_l=+Zx!?Wq4^bO|-+u8@EiN8E z9}lm)By;o9b!vWhb9;O9D(A$Qw`W_TlvAb@_qPwsStMKNx-WRWkfg@ovlbm# za*l}L0j6MvDdz}}=Exx|>TGU8RB{1|rlVHKf>o=Bl`av9Z~^3g)nB~*&h_E;um0En z+1XMvW3{V1e(nuB8j{?{1Y)Q zVLM!wXb};PVXkUk-DeLCcXKdAhQNPw5p3$=3{L0>fo=ru7yvF|ZdToz>jI8MSrA2t zLco$3Ga^a`PPi&*yIOI{Rmb6YaUtiIyIp3ve|=}_2z0tXJiLBgtLjv>&8jUd%o+>6 zce)P#tt{z{$^ZvV^efrVe&C7WlQ|c1hTkgNTs{IyS;w-Mb`~;osyKqX>pQUL|`25Zm;id&d<*Q=`@`JAtPRFU$httDpJS@nYsnuEMR$EiE%Ar1=rs<$&4T!+ewGj~{$_WZW zDXDM}c|viI0CQ}MKf%2PC?UHoc};Tz!OT&7={}pQK?I>8P!cH1xg3CmQ_3Z$l$gm0 z;7v|v$$dhARjaM>>gg(C=|y>%BY?e$b9w|Kky*IK;+i#EBF~_X5WGOy7X6fi`vQH9 zV4_7>okWP7k;6gF5W$+eMr&#)MDheEl4Yk9Z-najMXr-$>iO{?x^fN}Tw_5JOgS3qF( zX_}`9Ky&~oT{=I%>^lDNqaV4!lgH2Mbg1(*&LbGKXrF%k*YX`JV|NZxKQ0$_i--<@wZn^iu4^qmiX^q>Fz zzq8+;>SXuFhvR9U#;R7Qd79>#h=5UD!QCw&vH&NL`OwDWY(~Ij<|5b+oY+gkB(X@{ z3KwwHm<;qyBr_^TnEP^n#2_Xi;|L%?i^Ud5f=E9#X9R(%G7AwSkqBd8nA?KP@xbMS zRn5$`DzC1Fuw{ya3k`#u7Uy6DMxa@|Q2{tWFgS%RxdQ?VCL%xtfEH%4TsK4{<^1Mx zWDH+2 zi?B$Mge1z$$U%gJ%$cc_u1J>)%){5uzW$}hZ`bRGX_~O3+LRsd?r+tbH>$09)RfXZ zRbfh9*RR%?2|Y6UXPH*1V=<`0*DK_KioVhjNDNpS}e{d2dE3$g$act z;c{$uVqc&t;p_^E;b)B7zct zL81{dw`tbxJjV)f5Mqa6yFMN7Yi(JQvUj;_!)AguJybXIs+-js$T{Z#Xl+*WOt=}+ z-OU$X=eOT}&SI~xUv0PB`EU~HKK}UQciw*cZhKBhxo(K(CAn0(Ka_O%w&q-FNlY%6noG6*I*ILq+6M|0I>OAeW zO=e!0x10W9-rwzOmv_TzSgnR>I_~%T58io~C1VU&(s#c19h+iUuN)e9pAxa7)fq&& zkl$kCNlO2SOUzKjr%oSBlOl!(QH z3<@(ZuQxhPBii)(`udXA#~3lgpy^?1O>0Vtq+4yc*);BPoU0_>Y}Vsc(W@D^aWsm6 z5RN(@zWDsp%SV@Hc7J!f8M^KI{O<1lWyz19zj*n{XJ7vEm*)wbk#cd!(^x6dbZk`9 z{_tAElax~4o~uS!&Uu=~FFv~tjS!t%HLqsgl>#V|)8X)ts3Z1id>D@ph@5lrMoiML z*TE9*+q2Eh_3N?eZZ&K#&PIc#v0iVaU#rG+Jk;idour&g->=UT!tz@ZZxr_$ha`E| 
zUAeWX>HYoD9M3mTQgQ&BX9bX9-Otl;{pi{4-OJzjtzYF1Q-^54IfGd9#()&XG{9n- zPwL15o3sL~s!T-4xFF}rqs`R~58`KA8!`hDAzEuJKnYdm_%m~oTn4O8tEFraU(|{#^Vb)qh3`XSje|a6l}c zIzmK5Hw%9Qt_mQ=ym`ZVuZ2*NVUYTLEiYOSqJgh7Pk zc>3(~&$pYab+B57bQhr|6?r}g?QCu-Wp5A>LlU zYOU=yYcuQm^;Fw>HLQlAY9uV{;cUCv8zmYYNv6& zxw!#__3jMGq51J)e}8u?C0#wfP>c187k}@U|H=R9@BPi~)q0RbnMjPqNf4QkGZHbI zldFcsL_~e+!3mAo*qu&oI@P&NA>crkT~<;IEign9p$8cV#sY+r2ntS;1Q87vEg(fo zxj-fa2x1UIKp`ZD#R_P#U_`=cK{deAO{+ScrfHh%+*;EJ13+To-J?wecr?UdSmcuS zQzVgvEwLX82Lcj8L?jHv3@ATE^iY6D1O_k>qNJ2ckuHhj;&S>aJI*N#BOKgP5=Lt3 z(>$4mRYql30~Y`xmbCanC>)6)0RksRg0z7D6LJC(gcKM=?74%|mDHuwMNSbZ0wX0w zOwpv1RA6`{PuG+IoX8LNdu>L-O?8@^hk}EtCE@e)^IRwusy1gqVG3`p&4iecvv482 zzI(Om*H^pC`BVeq+0$pY*LUaVkAn1cs8^5P$wRumdD)jvge4VK-|o(DZ*IWTH0kBz z^RDaaF#;N3II2jxzuTuSZ`SKo$=2-taO;Zee)!_^k6wQE$!@b*Z??##lstHJhRY{^?eG1qU-{^_*6Z!cg$g>D5D+i@sXzu!V(1`^I&kyC zx#P7PvoU(iCqGTq>J-dijH*&FWuid9Dv1aQAcD*=%p*VvW7#VSL6#&TJ*^R785acr zELs(!FxLnVTRh}Kq_u^*H!!og*_(sOlCfk;NtluQtK?zkhQWv#kpdVYxy6za07L>t zA^@PJ%+3G=h>U>$2IYVZQHdt#Wz6OuoB z@#0kLcs#uS-j^J7J)9G}>V(7zQ#;MWW{_@mn(O*Z>0f{Z#(Za&%QX4Vt~$MH1Jr|oL1kXR5nPNxI7_q)yR z;%vxib@e!1J^I`K=pTIRv)>z5kjaC97dvzkbEAZm0!1+yWpEO8N2i1-Dn?ap)tc9_ zjjCvrMMiW7$drI2&>{$hoR(BHx?4^;1rZThBQp^a6NQJ+q6db>4uAk2 zivkXWP?$+DW#Pn3B2oab&KdzC2>{&|x-B9yGJ9aH&E}?6W68aBKpDA^q>!bWi3k`F zK)6IE0Ew7`c-cKrI3WTMU<%0~$&r+kM`nS*(`jGws&vI6a$X?`a^9V7!+d{VA3u3E)x&r?K+2DHPsTc# zdDT|unL?ew0C$&HB55ASQi^&dfai~%9uBuRcXuh}B;49Gj&*zSNOHNkx%&ZHf3G^%b`+*EZ2SJa znYk(&-oL&--rbMKW2=)kv*w|7uC3OXTL57{47=T0t=6#8_obBWYLiRae&vJf+lPPr zuYUEVy=H1D3jjqp3vgoO00tJoguwxXhTsTbh92asb5&R32#D$$8sfx6u8j#PTjCTB z4uMR>2?;n6vC#5A1|~#zMB)gFU{DK34+ujKX!gb{>=9vvL17Wg;^+;Z0dNs!hc92b zB+SAB%K$zQ!XVo6o`x_4Kwtnw0BvqI2IQQ@1H*wV61Z>}Ee|Jzg9`x?p)d+A;~SI9AxIUj6dJpN)Ql$2|V5yryWBB zIZPV{=8}lHeF^5gG@Pr3VG*j%i3TSy&A z->-J-ew%Xsu&9^$@k3vo%YMnS~ILF#wtd zQXn9asJS(DAPP4lMgT|ma0^E?_1PC?=o=KLnqmZz5MW>|3QZ(ivU-bNh&PW0L<(EB z#|$B67+|rq+lkx_AXo?qAvnl=x#>cLnFs!q)=vSzNpemJ1(A_pF#((T;<-UwK7{5L z2tdmoAfaObEhxAJ&K;D<0m7X9|E~&slb~h*V2{uxuQSh52( 
zLk?GshiUGyzbF?&&aI9fmWi2IaxOV<*K0t_S-QSYDW%ehBoAoSQj%^}5TMqRWMFnc z9ruUQap}89S5J_b2`?@#OWGg2Up#;N-52kFtsho{pv}|na>I#I>TYgtSu(S?@!)l; z?UZuqR@>=VRmZs<-KsU~%hn^^KAaGxFUd`h$4R(5zqnL)un11B4NRLlrUanExLR*c z^Td63etCfiCfE<@>gw|R+4CQN{_=M|``zz;_M_|5eV;iAxG-f-R3gY63_>yiJEjP7 z5^*pnn*|z1fHk+~ z%`glNeA2nq=5HPmkMJ-z4R0P1gcyzySnGu3l88A6B9hA+m|-|_;F7-ph~R~ain!3< z-CZas7H>+$0BVbVZ?Ob;umqAY^YUZvz6^Gj1Vl4)MK3}8<_P2tZW`u{%q*Nk+&#ct zApkW3!O#H!jKKrL5y=B1%n@u3B?CftQdJfV0Lo-F=FtH}SRm9LRRcUJdJ|BubF+gU zR(&_m^E8iV+nuBg5mhHau^P+?xwcUm6ZqKmDZ)z{HW#axFF&uNo^6KJYSp^l%%bTR z_n+*x=R+EvJbv!P#~M0aM+BO$@-X4iB5JhFs`F{m)+BeFQlE=Ehz!i9`@_TWP@g`{ zkFTzN^5G9(zWR8*JG;1i@%YijXgc5TS7qfTROe|vZMSC-b$|P69A^L;wi_V6zrO{W zo6l}YI1K$p1IGLN)DO9o+S)YLq1)`XmoH!4+}$5uJbyY`ef5)j)Ry}p_uc9E5YGF% zqZH`4AVRac!65~de%OorlOO!6Z@v89b-RY1b=F==NUGHhwaxQFuLA@TF;e6J$IKki zTC+-1#w3CQNz`>n&7wuB4G|0h-N`H@Aqg*cN(h2LLICq6OmDuVbRsYWpqXlQ4`q}H zn`{PihT;_AMgZurlnxdekNZ#2XA8#=01*vL+=3Vx1JRLy1kghpgd#G5M+7tlWS2yU zXs)PM-NFfZ*?c?lV&r8(3Uk9C0(Bw^L^7+bTEj5&#qk6Hq25|mw?J4}|G2aekQQ<% z1V94_a`Vn^Le*47-w>Nk5FVlgiaD6n$JMZ@Ee;Q#)zP$JF7WK?;s+mJPtDFR zubMYtn%aa(p1k$`*~O)+_k9^}5B+L=s$-qv{PN=U-RjN0?&fxH^}tZa z`4|yro5w7rn$BZgt+!`q7ZDbiHmfxSU*Ej??A2%6i~g;zy!GJ^e~bZKI!ZE)r+HFZ zbvemqkmJM6Ve+%9N9Pw$S!>_--`n5*;QsTM_TV|T(T|L$HcJq9&=fHX8VDkyM<}AW zx(I;>W6C7aYGk0CgcMv-=$i7}%v^<35=B_6!Av4R!r{@(GAE)G)*#T$RUIOQ!4j9$ zYF2e_5l#Uf=mh9KFA1~=#AOBwVYX0fu{C98Nkq&Z;o#s^ggHV3oJdHJcu`piFxFY) zr>}V7L=Zs6EMy+dH4sx~v4F+d%qb`$mc_7zlLI4J5MdWFwN@8mD02`IsMT7hR@D>$ zmW?kW{4@)P3rIc8wOYgizH&egBKPLtLA02cz+J;Dpw={vW(ZEE1(_f`#IQ9pf^9jw z+&t~OO^=3JP3M#btu0hFG!bZ3Ktu2_ClpS2c6Qn3$=$oFv*TX(57X{!ouoUCr#2o} zXM?&wzI+joKmO#$AAkO%&H3)Fx4%3cj)%KzKt9gnj!^Q>!@7QxFt>KBwSM`%uRVJ5 z*28@NaJosUtXG$P&yOBoFeir?)|;nKUtC>XRPZ7>(Wte8QyKcxJl)=Yk;>}n+h4A# zAAj!bIw_O-O*KfBMf%AB{+v|O>XO?P}NQ694TT@_S;J{^c(;y(s zg$aoy7i=vB6rv=|7@1W$q@YAF8Kj_I96itocy3C<5{MWQ;aHK9kXYC}S6={Y5ui3} zvldpZHbW-_HgJMK3oZ$PYpno)g6QCC0E?Z(7hF}C2ZUsnuH*h95ekrSa$;o`L}W%l zYI<^mjGQ~k9dc4)B%FncDm0x5AW>d~shE+|;<#bq48Q=8k|Zo@;HIV;&7uN8^4gAd 
zJWXw$W~ej38x~44(1sBl7-kv`V?u9On`cmR2G72f`yE0VEy5HG(EyYoQh*^M0%HUk zxHhofm8Lj}cJFl0AMKv>!zxQci&|@#2?A$^zz8?Bxt>%TA?8vz$!fI{&Jp?i(W9;_ z^YOSEhDVPcOTXUj&ez)=kY7B0EO~W(eRKQj^*Gn{Dy!?=?OkX+wmGQFCG{N=rH9+w zW+bc9_cWiz({U`E0pRBL)!F%WDZ*Y|KG|MgvhZrXnUAOY!{;|QH-f8RxVyhSyEwag z^i+*LfBD&Vor$0VBw1;|G|$KJzF+6A- z-?%sMS;%rXIF)DhBxgdkd=n`j3C@n|GfINUK`itQu-GGqYs@YRHZY zPX?Wkh@4B#LGng^h+Q7KM4dO)(H&fAKTg#H5|XeIxdd?n3`j&_3!%-!gE0OLnj{iB zX?4@^xj_&vVMz@40Hl;eSfBQd!vFw)07*naRNNtv5CId3NI2x&6CtWCos$UXfw_}a zKL~|$@jwiG!x$tagBgWV>gL%&EM;QBoH-D}N!U)uYQ|X5ts){rn4xMENp6505!u4x zLvj&{Tq3|~o9gIQ1u(46^Q>;fkP>^CT1BO33MPOF4b?2dB7%X`7|DSef^!MVT$`Js zwh~~>Z07Sca+28zRYTLvRYD+XS@nZIdCZ%)A3Z>{Pyf-#t2`0AIh&d;_V{^Zkd ze*1fr^c!FLKytpB_F0BLq;#n%vG~-gNbb6IfX{R5a(8p{npvJbeNSgZoS!~@W{QlY zuBu8z;klGu>bqkdce~w|yO($O*l(Ucd+X-2%*(JKJ4JqT}(1Fy&mv zu@P4hvzT+2HW%A@I`Oe<^Z4r37tPyzvN}EtLzhbr5MHZ?^tl_yW_Ic}D@adq=cEDv zQ_QVtC_3ZPZS-gmBti?8p#dP0V{Kl0?Jx-jP&h{jD2BI~0bL>9{96MB3BW^ug#fF0 zfCVutIU{-lQx=v45y;vi8n~ky24wSwBn08Ai7BNdoG_dMBaoTg&E5LaA*LyU`_(cP z#T3%Xu<3G6BAJI_VDZ*wh>YlzSs*u^dCG{WQ8`KJAZ2g}a5iri&RD{rg{73h!3|AA zwegi5LUD zHA>0}hb+?ban^bAaMy~eMhtqw8QiMc6jp_XNaU@~2J&RszJK=K&- zwYJ-w3FqnIfEY_-A*EDGX-$PQ1|4tQpV+UDX(w_e|U{>gNl`cmrY z;dDB2iEiivv1ttJRh?$Fah^pISZ%arATY3Ma5)pK*&;nCX8TU&mA$NGk{W< z0MB04Ei;iLI3T)$GhpOgn3sYKE-;`$I15Kl)jP$Q>-}+mI?mM*BmpmmsT70^^Ch*;+{!F=<@?Rr>AqWim}ySM6n-!tcwx~1pYmBCf(JcS;Ll*-VKcKdLD zcm3-A^{c!6%~YEmj_cLx{ONmt>`(tYfB7%|_y6ku?f+ccZ~em0{?e&Q_vrF?yi1d< zIY-2>DFK>@Plsb*oS&Z`4)?-c5?T+dFfSbwr+KoR!Ay|5sUE_bq+zbQeSEdrUYzb< z=OU}k_TlDws`r#-yV`W!a6GhBI;#rcjFAaNlJqN1$u;IW38gwmou}rOSSroy_0?*7 z`TFiPhixt{fQk}aUR*qWa(0?u_3%6l@Ah{OuOA*P11UK(-d3^zJZ;AvS2Vo7I$yp>_Mi01T4sCP1S)}01*Q*K+PdYohb|m?ag>b z5eacIwPQFFr+@%-cPD{}5T;xbV<1771U!r>51oTg=4Q>2B^Tr}<&HSX!)cC55raqr zh%>Ob8$louuy|lts)Q>M)aGFj?CzmV9XUoM;RplN008u^>xrl&S@ju2Y8bJTh1zHg z(Hs&>aSpX+k_a^@gI8O0(%}$h%#0)f6&cG~R_9EmMa1RVwrN0hUXzzR9;dmgPIH#7 zmmble`p~U+W&Pgn?D6iZ%bSzdE~?LsQM!JhlnJSsy?pt3zgiShKom!cH8p$c;A2V#qeUp{_;5C 
z-OXz)Tt~G@wau+HB4B}VB1|X}G`-=L1Y+arwH9{C0N`K&Ktv!xnh1g!DH8$;6A=Wy zk*Z{1L`DUV0ED)r&;T6R%-yRixEF*Zi`)kdV4*Q15Sq5|kj3bN0T3dRCAHRQVU`pj z!Fg5+PE0D_1SO6ZOTTmu}TivaMT06-_qEQn-) zp%y@1%Fy>&0!zth=p^Sg;;!#{$;NfRf4F(Q2dd-Q5kjBcf6YEHzFyV(z;P0NP-hp=mr^A1D{d=O2Ff`rE(zqleMdR<#|+cG8>E z#XxuWpWom8%|G|={@FkNOMmjWzw^Dfzx1`!{s?`3dcM86e_7}D;?W~JHVDH^+32XP zRPWAHKV*ftJij^~_oeGmFe3Jc`_OipDxq{;9yaT0?QnlR9&T?w|NLyXlFW%aBAN`Q zYNhX5vs7{^DL`gBwrMOJu0})%t{REtt+$>|)h9hZe*Er!uj6#sovkT}Dm=Qn$T{uj zahoo8vNFA)oVuXrfo&AefaI6oL&)$iM2$@vXiry=& z2mo3DAR`w8Yi0zoI`8wD4?F6*LJn*(C6+WBB*CDj3CntY-sO@~8Yrot;_=n>jULBG z+s(!4WXB#ao^GTU5)E(1eLanJn%q^}DTd89D`O-oGAaJ?*F8{LvR5-rnu&fBmQa^dEci-m^*PXHTBj zcDk$WRBhJ}W(IB)P^384^{`4Qsaxq*hTsv~-KB;G@N{ac;q2zsXAk@F@#CxA?sBfC zZaH@N~$O)zAidGPi~b7*vEA*ybifI5~qb zB*g}T0f=IX&?1E~nRzfU6+jbR;D3oJF*=%}vJ@m^Vemjlf5YNLSg>h^rV|92p*j*d zp(D9hMTR12q5imgN|}Ho0)R~o09tEJAxk7?M70JYl86~;88b=B!OTF_S*Yj85Jnv8 z?oyluh!bL1SQ7T-yT@hNASZ`rVF8c`Ah?ng$s81meyp{*NoMI%N~IT(R8pT)*XM4A zu~|LY-QBS=A&``fP_@IsN+TXHuL+Uc=tK;_b2CqnyBIdOS~F3Q0)YvK6d_Kao&ZT> zbGhnDj|2k>Q*Ka3z8O~C`TEJDuFr&1gAN0^0km4jd7L96q5=Bpbm+RS`S`HEX4jb{ zQT9+|Ak3SKXV2dH(&f|j-}$@$@RQG9|KUIKZ%d=+tKAmFF#~L^qHtPh-fng+}|D6U3Y%5%Ux%_ zFbU=~tN}@_m#(#ko7;!Oqi0W_zj%S%-#?7&%U$1ZfxFxfr~L!fW9oWnc6hiW0pMtJmYK$9@k%uQvT^z3od=J;Fmk@7WdUAvSLE=-}BhO4B2+U2o1tUb8 z9q-O-)T3ulv61H>*4_q?q)C zV4GoBi}bQ8+$Dr?br02G0H`{8BkCwfYgL=aaqk|}aXOt&jv8Q_v#WQ%_KWAwzVg}a z>DPbvcQ0N%Jv%%5wO{+~k3YZrPyW;Y-Q&j>fA#7=ZO^)PI=C2w+GuQtQ_VyC9s=Ckwdlc$ecwCW8bQs&+HTf_SwpdbI?-~YS+@Ynvu zUQa{ns38P(tFkWrs;t+mZZll=X*jbMV38e_MATu6o zp28$y%EClJfka>`CISLs01-&)VBrviK}^U(Ko|h%Oe9DqLKq+{B_*Qj5rj&idyHt0vVsjl;YU&HKLDDkts`LzKjMb+#_l3c!86~$M z(hMoW+ceiYgLz^au$W?CyS=|-W}+bzSDMrgM(eAKN6+8;eXGYG98|vj?Qgr*Cr_WY z)5G=M=imC)5C6hn`0r}?w|?*2nfS9$zWDUxkN-#i!~gJWKl4XE{Pd&S+lTGt1t%7i zzT|tiHl7G@D58|M+q3n0VD+?K&uuKFq*c$uImoWCFnXo^*S_@S>Gt-!zx#V%eD>kP z;fprc`C%sFZr%6W?t?FVtT-KDpih@b-I2V$-dY zkg#)b=HQ%rUybI%$|maMOql=xS~F+ub4E($;iQ1>5I~qRb#FGf$dVx}+!xX%;+t4M 
zU<4>25=ktjbp~)i2TlkSh{>1e8#GP`NJ6f@SaQLqrman*>xLyN1tXw`VgPumQ=8|L zFsGE6$d{R8w@R%pvQ%aW$>sr6j1Vy(QP*|N0?mblD^CXImN<8Ul!ZhD5RC*7>gjNt zZrA;Kz1oc9zTc)W2@r@z04YP?uTC{vK+X)7CX%HXQl*9OoemFnI*9#B#$73EXbD7jU@t_hMR{WYt^O`T1<0Og3Yj+{8Zn7 z^RT4u)MC9}mpnXw_THnnKIqnu17Lr9^U)`tUtTrysq1`^#_r zzHfYOd-c}59R#5srkt=bosN@h3+5bM+FhRJiE~QG9VS<+Z3GLT)OFpk=6<+P^=X<) z?wdwc%d3>uCHD6*J$&tJUs+#Xe(#Hy$Kx>N%Bt!rybIKTqS*Sr4f!TC|5JE&F zR|v2u77M^H16J^*QKjYzZ_K%i=7HT22?+>%iI6z}5G7uaw_rfZVyFO0ivSpaS|CtJ zLdnJmUSq*G&uvs~?rwo|t0iF&AO=&I&jjerthx}92qA?B5<$+KvbDyH5aC22!YNTn zKv0Q$6hH@HD1}*sIhabO6}TaS5v0hjZ*=mq3iOn#7BOzmUNtOtZ8uNf2kjz*J zd4Rl?q1L@p<_2Npb*l5RU|O%&z;M`)8ck~hfTlCB48xjpdi>~O=q}e6mz(qR(?Q$m zVV=jwZ#}<$b$fSvGu@n{_pp>}(``_q5^-}{gL%3pbY_4xnrzyCiP%Kd5VS3`%) z0p48oIHVNNl|hfkJsKgfC)%7}qP5fM`s`}QtBp3ZN~!N`(%<;yU%k0*AHCGkV*(OB zORMc^e|Y(D+Q{Z2;?v*zvEDt{&&Q*8-ag)sr-!?M=3G+ol(K3&sr7vs601%?aheYZ z-1j{)aZa(sD*+;6wHa!y5HPIz$IsuA-5Jz&7;o~FW$Ppd0nS{ zKb)tOI8o^s0CJ_-Ar=A(w89AqTs7QXl|+P5Py{iO^W>o5O^pZ%2|Pt0vqli6h*-*4 z?uHoR*&RHb1tlS|BO7LMH9#av3p7aBIE)#A9h-vFJU2B!P7vrCtud3c;7_##BU4Z$ z0Wju_oCPsJ*+MeoJOLmYfm6=Xb-5H%n5zOhA$6$)@hmBb(vUkwFqf1GzyNTW6{97n zwtqctw}<U7FkIO%>m>||55jmJtcAW+~aA`tTb`I~>^Klxw$$G`CNKlkYI z)8GE>Z~lQVy<1j;5R+lf9lAY!bipEb_YZxyou`weezV&-VIq-8;+;`$x!LKoF8w#Z z{ms|cryu-y{Qlj8oOh2dAMY+Mbbi=8KZlUp>+#z^`tjGUE_Ulo%W(aSTD;5AA83_9obpvyT@T`vLND;!A2L!;B z8NCIBU}0enoNKLGv4u9IMB*{-+x`7;fYRVM{-_rxN&LJJfM5X2q<2%U(C z8FZ0l%3c-RfV0eJD(U6wwalHG9$j&!LiY6OQ=n8BE_SQSizmPP{g3|4ANv#Uy!-x-KKl6K z{+9S$QXcC#46BcS_?`dh|NMXbrAN>A4>z~Bujc99-R_(h^cmN)-Qx%x+acu)9>@Lu z>hV*-&IyIc5NN$YN@CHk`+D6z`S9~!`K{mk{N%sz=lEY2^I7_ z)g~D_DiCOHSuk?)7Q&e_=AoDM#q|32SAOlk`B&fnoxJH^Ts}TEo*oyIilu%k??^35zWy}LH2bfo2Cz1jsLn0y~!mwc&q))9P<@3#?`{^{!$7!nODxttm z0pUPMog`E6NTo2NW{Jd*SeT;f%#iDZtp<4#L4r4{<3fSb7QW!GKD3+OXDkN+m&?roUDicUfF6I_s0ggJiRbm2W2@YKRA-$EPdvtd33qSJ*|M@@vtuH?N{QWP#|LJERo=)F+ zef!!aN?3r`9fD)BAXsnexW9|3`lD>%a61KmM(6er4Xg|K%?agB=cE7>odbBm^oz(=-LfYCV`4pqDZb zB?}jKSIfD$nujA$&RkL|eV>O5*sNdv_`Bn@e}29_hRgZ3-Oh{W!P4Nc+3VcmP(xFQ 
zU_)$Ka+V}5Q$&}%23Or@9D3gNB7O3d5(*N*rt9VsnEH*$Z2B;r?(X*Ec$nrxn^lMt zi*U}8&?LCzg2JAYLQD)ZQwXIQ2oi@vAR{OPhgZswq-zS`EL}=K9%={zlMp7slyI&y z03w!@62ZVf^T!{H0C8c;0M@G38m+3EMKEz%4gIhYUe3-K+#?|&u2Wx_0X!1qg+@ng zrga>vHf_$wJ-E?!yGwVQloFxO0DF~;o+a)2SU=j#w?ZHf! zWPc_vnKI_3HR+MYHdXYlq&}}w>WBm*gMl!WL69rR6fp~>m26kkv4_sC;oxzaYcq58 zd7jO+UvJi{Gj{}}uIq`V&6S86v=4vuJ#CKt#ayTNA73_&zyB|P`RS93M~^R8{SeV| z7w^6E;unAZXaD%0_+!H9U;p-ZzWF=9`{LP?Kl>;C$m88+x85XTpHJgFb|nv8N#Mu( zTNXLLI>*&I4Xbf~DC-^M4F;BOb$oUAoo{{fzxYSL{-v+}?Bk2__x`~@{=fX+|JGms zTYvrg-~TOB84rj1`|DQQYPZ^4oagdns`cw%|GJ;FgUQ;xx`MXQI-ib=(69Q^cc;^d z1w~|Pqr(K@feZ*NL?|8r5Xe3}c`H5tz)NcPch`s454T@DJnUDi&CqvUpnyw{kzH{H ziN4FF1fvmqqSV|cm>Ip#0%RTfstiojb+qlvs!#n&QpzbODVg(-rKH5U&)Z>F@=B6~ zqiZD0T`oh;t6{V5hxJg_>u$9wEI|p95CHP;gk=M>nb6>}fvoRUK7S6iDL#(H>l_b-0)TR;Bn<{Q7bZS7`0-T&q{f1`A(v+ZvG z`qiKR_y5v=`oI03{crwP|I6=w>-*>H=i94`hnv^0?jN45hTBiRINpEQj$`#P5*L=z z4Qi*>&MtRX(=;89w}4I|K)^|eh!>7`(`NIkD`~TavLWzc7`g_VZrycVbyvyvj%)5_ zkA`t-YIyHn33{M=iY(}i?k)Nbhn#yr>@xuFeXpNFtKLxjVy zI?FjX+qL*2)FDNFo?!*DzpD4B~iFs}T%L9<#%V zB7+yi0G=cbf50<1hYxPhMx6{qT_O12PtNxSk{_DwUb@k}?|I8oykN(o1 zed}`j8{hio-dws)6+ismhto8D{`p-}{Ez|yneObl&kYCfs2rt zCC;s$O36dlDLB|1hq+&EVCcz}2=70A`NL0N{Sm|MUOxOMk@NY_5L0Km5M8o<3Z|)TZ(NdTOVDz&z3Zd#*NuQei^Qjie1mBJJ$ObJ$(=TC%a zp4W{ErIY&YX}$y3)~XcTY_~!LUFu5em>FkX^Rj2LSjZDV-h9`uS7s1P2tUv z2L+LG7FDf!L?RMS9a=L$ zrV^C|l60;uU`~>)y1O89_|n7&L}u{JlBINP%LG$66H)2NV}_->$t1|*G#@nv$el>h zK$sf9@i1ze*Xu1S69=fND+{Xm@o*Bx<5+KgaQymLzOw1FXteqM*M9StA78!u2fy*? zgLnV<_4UKe-Tr=m;*0HSD4SJ(wj0iOt1qti`@^`~tjN<`Pjf{EJnavgp;xV{nmGay zN|~l<=sE+WdB*WDp8V$K_SMbtWQ7RS{OtTm>es-pI!3mZWcSa1^|wC!^b2u#{^GHU zO{ZBb2?gfUd+&WP-`~|^TjBcde$NEketkThj?-t``~BtRxp0S&+N|z}3a75?DM;N? 
zDMMOI0MrnzHa*naFIE@b;Q`9tF1vDsY1X^jIvu@H?pMrd%2q&QCOyl&r_|~(*48mm zNgc`LN|^;Scu*2(I?>$Ct5Q}aNsdTPoJ?d6I?Z9glIkp)0L>%NbR-PsU_ll!pMjMT zn>hnARzmjxcXET)T0nG#02`ondEMs?!KO$LSglp3p4m3rN9kB_{~BzZ>St%$l>i#2 zA}I?ccg3#YHWSR(ceHPfBvNK#M1(?O>WG?TMc8FYIcGIQ^wOarnQLp66HAwJ&XsJn zTfOt%+x;-4A^>2-ES?-YE{x8C$jA#t0uX=zOtn&G^V+N>MqKDHK#Ud)VMdS$fl#_4 zQzLJc1uzVNkux|l6{exf;2z-yYl0DcX0ZL$N zRYkaTX_}@?Xs6@%zx(~Kf8%GLbbU$ulh0m%^26_*ZZDr)Ts_+4cOE?&)~k8OX_}Dy zbi9A{`JSNL6*(TRL&x#ZV3(^xn=21%cfY&2-93M_-kwdss`G3rRo7YS{muQI9p~Dm z^6c`-cfR<^{loQFUOa#Iy=UM1@W=I_eIJjXKKku{{p-K*^FR0ATkrhrAN+dGfDy;T ze7RcpPda>k@%CFE)mV8N|k zbmcmip}U;t7~}MCc$i|3>AV9D(vD?}ZXZobN;LOr+YJ{%2d4?6rJ^VfscWM#Mpp{6 zx=mypIAF(FSg?aMjI9Zr5+HJ+amJVt+#3=ov4T;~nFWX&1H>W(W{SoHl2{YVv3Xb^ zxT^zV%3^+^Sp65%AuNdc?*WL^mciI&wN;$qfe4~y{C&~>>4Mqn@% z;a+If=g659)zoQ@99`1XRccke8V8#BtZmko`>tDU@=&DoLL!`!NYf@Mvt+AUy1ZWZ zhvUO~Gn~eG=(@)jTXIDtZ8%R=5^gTepT6_uZne8VoaWwBJl#Ee_INst zH?MDY+g)Z^4@u`K95>tZ-1X!A%`{D$^|oxw{&4u{2cHF(-R@kY{*!0axP1Eh_07**UjE^q`~ADOFJhWt8aW4-q8d=g zq2Hv!5CIU{<~r3>BxRJGO4=}GPRn8wOX=u*!{=9Rn(8M%oQ@9$GWpzWatI<8;qB(4 z6lMw*tgMdKt$5S-S<}GMSoSBol z2LeVyh;GmjXidxvN?UDpx4C$9@uW|MxglsNy~k(<>WvcS+$lOTq0JE^1A5fC-eGJl zpUlFJhTJ$+j~PHC#FY^kfq@JmT0?D)2n;Ap>W#=V3j+}ZP)`vM+*-?=Gj9mGp7Z%` z=z^qL%hPPNcekeQRPq3TI;pAw&I@tElL^y3ddJ=?Bxk$^Vtr)X7EnQOy(n+T`l z;oVnjxf`U+e+*iN$ z!R4c??b-9!FYmS!{h>efrS-D`x-;Ltp842I_L4az*$oyx9;-+`jk7tNU2ccf761W4 zQdcrlrV6kwnMeW(cx~4=?Qjt8ck7L+(sbM=nfl$)+E`B$)KkKlyr#&jE)U%xk4UhT zl=Eu6-rkkloBg%NjKO`!P<0w>E{zi>b;9hLH1T8xY?M=>-q7dcsV~AvC2`HrrZk5l zI>xPogCE#|$pA+SB4(793s2&?AYsRh$d%>)N7JA6TGM3teb|~JB8R>AnV#vLYOZ2+ zvzs%!n-nQg9MqH{0lu*X+Y$^Lf*||K-@^BTFAN*7KZ0SvfFMD(A&ZbK%95HQd#vuR zs&{_IGwi)HGa}aDi(NdQ;GC10F|74pzaJ1bg6!5?e?257dWl3ttd@dY60=M80*SJW zLvbOu_0+67w7|BtH4kS*uGMJm$<@rv6x~!& z1d_0Y(*;q7k%$n~tO6JWfjA)wab^;k3R!3#01teZ^Uhbz$uOX`1%w!Q$b)BBbf6?c zNs6i5e>hpK7tFFF^Y3;pN?n&r-5K`oo{mhxNCA z@`IZnmfiQh;{g499yr#zEl-a_rZn9>t!Hc)#J%e2{z-;$-d!<`rc1ZZ9g}cL1dN`C zln=44X?-x%Xb627wX)<2<&n?5#Zpa#B#F9B*sWkG`>9NlIpai>#spJ70Oj}ZJ_i7# 
zUP{(&+gbn{Ot$OVBYIHg%| z3=q_wdDu^Nl-6k%p-_NdX^3^5buhz*f<^KLAZCCNyXxOEPU zX4}KlJGE^;KO-7AaZbs-sy|sY0PoG*Bj+(C0`!1NBo-GPc?Lj$3$+26SVSBl5vSo- z88-nQ%2b9cqM-;S;U4w8yj$D*s;Aahi_O=*E@y&h>xSq#<(x|%269U*9{TY3Xa>_T zC&G1E9v@EUK)~gT0^!ClS@7}!q@cx_k@7})t_N(*5H_Pb*LTEEV`Q@Qr$75y-5#Ia?Q&XsJr0aN{LV+; zeKn-6Z{M8nPY?V3L6DYnYftg@S6|L%zx~6{e)G3}@`K;{b?kco=Fk0`&zJjm52uHE zIzd8_AtIZ51PaSI4rZ-eQ>~JLK^(vXO8Atg{PLqX9PHhdEA9MTBmzKj!31rtFu zh;Re9&EjnK1n%LeUEPp?RKZ;XnraV#h|MoH_i&7h4KfpEk4C9-+DMdzkOIlvLbZ46 z$EV}g9$3_TQ9B9^xn#P;CsFt>|En(%eHdnD+1gUlZX9oVe*(r`xz42w)6ATE^hiGE zeaasZmz;$;M_{)Hi{&DEM092*hKMdyN-n9i%;Gk+zM7v;r}MHNNpPADk}?6aP*Byr zxG9jDQg{-PVa$#d006pKySOU>i3pfDr$or^4$z3P(7?i+K!lkyK?w&Z16K9(X?y?J z-fnhm8=59WERqu=fY#N{>(aG)w_bbI*0vf7B;u&5D>!!R7x!B(IhQ;Q5x`I+#R&+9DA^SOJyH0Gv}~Msz`>G&v>hCqRCF`~93tkO`N0982Dhd2(&FF78Iu zG1Od3!C~H0*{2}`IDsRo0f5z5&HAyett+Xv=#gm1JP4Dc*0#7Ehe4TpM4-=zATlx* zByeaEfeaoh(h-v@*~M}iYypUzWMDxAASyX?5<*k}6l4g5?&n0=ygi-2WEh5gt5zd$ z8V5?0@-?P@T!CoEL;(rFb54M^tjZXfvEky*5Js#lid2C|;$mR6f7n`O#;WVq)|9V^ z&pGAV++7kMQo8Sc?}oWBQs>mnfr2k??6s?^vjE+R6F>`}M2ItG#< z3HgDcSagq0ghIrSOP+G%S{tx0&5}je1sszMw)NJldJtpnOYc@qh5Ty1y1se&9G@K@ zj`t6zlveBOt7jj7@x>RX)9Is+KKc6Vug5uk{K+fR_Hh5M*YkcJPLHSXZClsyc|Ywk z?@OMu>}A|{AnzMvm<2GS+S`X?UCv>^1E-?XJh!&pQtYqB^?ZNz@yFl)t-tlfzxeOl z>u>)0U;RW|;=FeX%IW5Ie|>%JLdW-?zx(``Pp`j-^Md9h7&Fo?C8i47S%?ecsh^zj zhUX`gx99e>KEAmA7?mYC7iJ%C=9lyL_aC0#eew10oz9Pmcqm=%zPAtN&+9t64N$Ur zCkVjo0=A7^&q+{tY}DNlA{D+)oKwuF<+b)FmOx6x3_%W_hcJVk4P{7byj88|nhvS; zN<@U+pdukgsA|c%LsP4!8AS+zg!pg#!%qVhsWUPFYd?p_ZhB@Kl5;6ctVjmr5Dsv$ zL^BZtcH-9T(QE?>(`s>175%DgS#lOi;f{o@ZCm?*)FFbI=6Rpl9Xo2<$QkV>k^?(VFZMw z@Q?`2^zP+L$^zQ*i|04r{SlZs=myr?+q>Jt_4RDNY|H(ZfBq-$KL4}FH(%<9w-8-N zsTXgS+UazE(uE1jz=BD&19}+>VHSv#3y2PRIPCB8i;vpf3r9{*N2*7!t!_26Vgv+5 zSbz^H3jhQPt3xdKTR4}qzG+hD6jRLybhA81Qlz|C_m~gl-dCWb6 z5hWZVAY2h7!pt}3l+(zRn3;d)?|*^-j1k^)66VzU1{g!SCSr3BR3bO6O*ez4>VOC- zx}6jji}MAnPLRSPzyQSq5nE2#F0*R+T37&;DFsA8&1o3Q9wQ?JG7tw~n4bayF$qsh zMXd$72llSodP>B?Ib~)-L_!u4H!%;Ql~S-|00T6l5-#Bg&{b=62TQwreN$dd>6XHT 
zQ=-g()_d2@+8W-Lx*ngFR_g`jTV(8A*JWKE-`CU9wryR{k53P$r}O)F_f3C}A>eFtQ(y+gJetq|8rulGv$Rz`2N@E_2vw0GZ zsM`}lO2ZuiY^Qf61G4UhX}I1$y?@Wk^7!VL6ZNY!XF~LPS{^>U`?fxQ`1%(=-_B1= zu-hH-{w>IUxcEt0mX)78C_c+j^>}1wDiB+=;jm*`>F`fbK28yDDDL&z_hj zW(rUYBS>Kdk<`35C(20%rc6N0$;^o&=yVZ{A&lXP|Hj{cfq+C|aPp{#6ye)eB^73{ z=q!*qT3^?`g!Qf$O8e%~)D{EFX>vnA6D|l$keLb407-Z%NwVxj#$lLK8r7S|k;F@y zm=h5rI}-s!x0Q$j0-cG-$PI!JLYu(PvwzSsPW!cu&T00$A4{m11^9f7N!fS0$r*kmpaa^me zOUvVMxPEnW`&=80yJ_4_8q$np+~;w>RMYSe$FpfV%=6o~U%&q9^ZVDoKx^Zea~Y%z zBn+G|?>6(THo-n+39xm20D%4BCUKhf*L-(Nd5ZhT*MIiMA3l7$AEmF`)8mIs)ayn_ zcQ<#0aXLP{e*5+P;|C_1<}2ak?y5$pX_#BZoOyQ`0wsy$1PN0bX*cYyUwo3EKL-d{ zpWyt6eM2+rPKa(>-6~*E#Kqh^Vgf>U{EolaeihyelAC6|i|x2;EaC1iC6^a#O7 zh$M-#Fp+4DuFb;!B@F%2*2zplm=Tc}keYclH-aGu`L}=f6-lSm0Nf)0E!@Mn^*$s) zai9*?x~q34;PmXe=@$EC~xkL7JvDTGuKmOLUPzmQj`1OQP-*0>OMLnAnBw2K@Z zy=%ATu9#pqmm4hETeIFNLf54&8yI-&+u8yFfl8TDnSt?e*w5F8rK<_&`M_laWX=V1 z$}${o?>_qU;~)OyCx(n^B$+m9UM!_(=DU%dU|i$4c_e@GVn?YnQk ze)rYa$9G>nz5nvz?Q82DOuJ>kToR25hk>ZbG~VPw#G90>a=3A_LH*&~`?L4f^|-9N z`H*B(hd??VpMLpgf3$7KtKIe8_4PR43FmPff-a^|gYY5=qjg;wu#_aijD-^&4%g$& zEneN3dRmU&&frV|+qSt^1UCzF3)5Vrpb)_79l=XrAOfKP49(a$3>%)B->Wq#Gs+0= zW>MSOEIcam`C>2k@D`VqZj4CS6q|;6nAgiBvoG4$tu9ShX2b{}U|GYD+I!nTA)K~Q zBus#D2^frJ4kuGpgVt4KU>cdzILu6iAQK6oU*awv-Q59!(D`@%@k^2>$s!120Mf1% zJat76ErpT5O{>+eHNv{}ZX0m(XyF|79zDDgCL$pb3;`#;2$3KmlVAu%N|~v2>j(gm5CWqUnt_FfhXN$< zAw0Ra-kO@KZWLuqFPUVBVayXXM|I&82^&V(+CjLIH~TKk*V?@sSe zkFS?`nx-)y@83PWecjIQb9MwfJ$(J{!#6w}4u^w;0>a^X_w4SLhcu<+WW#)w4tI+~ zM&W>EU8mjMt507c1h_vueu!xEJnhCi;Y&_FHC=06kTa)@fUUJ^wTB_3VHgp}ni0b7 z)%EUh7}GtHK29f+}DU|u4w+N{nv@PAVkyE!owR7o=;EO7VxIFHGSIj5wQa; z2rHnvH?z>L<|hVPIdQ#}oyc+LZLI8&8Chu?NtE>6&{BZkX zoNv-N&)0X?H!lNHYt5{wo;lIYbTj6`t%C^gfZJ-P*RA#F6~l*IBHVRL$POfwXej$K zsP(Gn0mC&A#4`oKifhO4P^ZV%nwxK1Z(Uo{ZCh(q?LDGvZy3Zu+RQOCj^SN#3w2k} zsJ&V}E!I|mCMm+L`6)n?gfJnZqcH;X7GVJ30Yo_>rIZ6Lz?esX3zC;p%0n55(Om;n zWQYLwMywtN5KNPx1d|{u0u!5RKoEc;W|E~gBoYV#>_h=Th90i2JtVv5aKXeG=Sjj%c(A+tn;i=^hwt%o@? 
zGYkJp2h+`-x|%5|KM-XX00ls7tpl1!iXe>$=ZMe_j;qLrr3=HY_ie^0C)U=Nx|e%Pt)$* z&%TgSa?U^c(NFicx6>7W#`!P*wZHoLbZ33J9^u{Nc{jkbt1FV5|LQ;gy~x8~__g2o z;g5ea?dh)QN1wgOBcC32r|l$;!|ki|>0d-1wPsh$n8)WoEMLB@$D=mZ!1wR_ybrs& z3-_#RJ#UZq$1Lf^%Y%$N1B7ryDfX`q-R;MSJbrYoH5gO3=|lLYu}4Q4?njDWgWL7|o(~TbVOUg~;NQ)rx@T764#d z&VXcKE0C9gvE_))*_^vIFf(KfXb|EMiJ|1&D{bw>fAe>5h+UWwDT2&EwYwvcFf*e4 zYWzwepu0i0AaV~A&H&OHU=T5yf*T`2&N&=CI$*Dxs`l=++v>OgYD&X?{B+E>=6zcq z&3jzrt^sC^*%1MQFQ6|70stf@g2cc~hz8grK-E2>wRSPw2RMZHz6MZuK^VfwYzdF% zM~4lefiXH05R(uN`|F$C)&A<{<8gjI?{~X-ob$f6ZT0ix)9Lu|;dpv~+ScA$_okqy z<@n7vU%mPATTr{&Pr0OVn39yP0m#pvy_A%{^Mmi-zIyrexPDldwOV2PwZHh&+WVjW z!N0g2XdbWX+SOx!_u?mi`S1Sr-}$$1p1&Ms8TRngpMEx7U*mjzT06F-+py`|27PwKlW|WaP{h~o*q6tJw3Md1 z0hwCJ5(sJ>QM-9J>{%swLS`jm@0xW zGXyd#b5b|J-dea5;;E3Rs)xFRN53G)YOUcH1#!cgg=PR+*7wp6!bA5pbb)Tf zW649wJHf+{p^sQsU+WeeA}*K^M~KD=!aV{36$w1LSGb||Y-Jd3 zKYo65d*_`VA0PdAd^$cX=WRY*0m~rs&CON7)1s&EfBb6OHi|UOhtIzEeG0m|dr@}7 z_4Nz*5&!8gepc7>ZhzH!{|mqV7vKDAfB*OY$^RoQxu2HI!}-*{_u2EZ8z0Yq&V_#P z(We=Rr)#{uz1rUth2^v%4G0inTm}GH@1N?!o8{r{pML!n^dr{$_n*JXoTtOJlp$f1 zt7liYxw)z~Lf=orX*oxadJd&HOfx8K>zdPW*zGyVe%kM@CdI;$t!=%Yz%0y18QXGN zx7EEv7zZ(Biw1!KpuJsKJ>UTl%{!YOSEdC~8z2Be9Cwt5wv9T{}kAUT@x$ zKOpDi=G^-o&+~a~rM%FoqfKr)>fiYL2bfi`iKp*v+S%dpA!v=cuh+APjwSC`QL=AP zjNiIH8;gADmL%gPnv~6-9Iei)c6+)gB>~+91VejP%(B zSzS1nB%*pu|M;< zJ}r77XKOxZ%eF`R+uK#PZ=$(&$i#8!xs<504I=;L1>f0TNuBIoOIdKqQ-T(ba|@ZIFei$68sLW1obI+?K)(GL3y10`)(N= zCB7IeJ1`QdJZsPG+x!AX+wXQysp9;Crm~NCxLsMfeEhwn>okb)AXZIuZ}G3wOtw^s z+cykHg8I+;Dc-wgK?TJvsO1}Br^~oW;J-k55!(AMt_E_GGIN1w+ zpJXV%F7y0(V2~{h6wwn+Be8JLz-#WM{}LQ)e3bo)UkvB}zEyfj)~oBu^<(I2U!gOuErQ9$ zf~2T_6~GC^(zvPbbgWeTJ=l*+(W$1Rw+R;G4@Gopbf)Qsfr-N=Q?&>3Q*Y0yZvEE46DoSUzEcvV=;Sob{Rl@@SydL)=Qm%7TF^=lzm zkq`p?E6b}IHkd$bt;D)`aWLvz&xiu`>Ti>S74wGPUHxP(tDVuel;6ty=`N{$39gD# zDC$rZjCNYCsA~mo05t$CrAG9EzEv|Gq*fpt>}n4OE>}5zj_g0G8z9>F|oCM@oTSkv{-&svikCu?mkW*6~4f zXm9r)=z(v)bZ?vdcnu;A{HhCSrplbjwH%)T7w#m-NcHpf^Upa28nV0>&EiK3sOq(1 
z5)$w47jIFJunc(#N#C&&4`r0|XI9{|=c`rWe|HbtrrH;YfD0-PtT6ePwS#iz9{#lE1&**HG5PZwZAwN8LC)Ua6Z3%9(D2Ra%$+}A8YgJ zhyTCI7gG%xr}0%$2VZ6{w=dWD`cK>czi-G>NZGTBbHfFOKq$g_$22x7pV{W)op~BI z3H_3IIlh_ZkW8a850BdqPG($JDi~Q2;u)IJC3|d@&I_b>Rs;8Y)pCma3S?4*K82Ft zG$|t@La4p1djli#EQ|71*2)E}b&K8<*yHP(4Q`UVwO)c74}IJm28a+rWM!>{9G)Fh zdhq`YB&mLlChG^j<%6QZI5?~g1mzNR0! zN0AVI7CQT)d_EypaJhMSc^u`hSa3NudmeTs`AZnuZL*lNl zN{##W##0WhcX82eOF!^l&_{nI2Z+A5V_(z&h>ruOe$5X|DylspOm|+&E*c2>-OL7C z%NcA;HH->i1}IR9eKA%u7mP_N@~XQGrIxTWIdrtvudvqW7I>nzK4(LL=G3y9>NiCX zQ$@GSieUu*XgTRht5shISrdwC@H3OeO%2!i!AWC`_CNz5$INS7c6(#lXE)%0H&WiH zA0pcG+X7ZiY>?CFRiJ6O+X|wG_NHp9{sXjE3wB5C)+y6n>!2hiAd%=%(nD}~E7Pi( z{Erz&l}+3qvq#2cqJPpPrm|QEYh@+ls!E=X~c& z+vgjXk{{3HF83+!J=GhN5`rw9<5{Ste7k7GYF7u({VB}|A=w?OAF`;`YIRj~QWoS9C6st>B z@1_patY=nMw`(o3$OLN`13r~;>cIzT-@WH_;qpY)n+1OSZqY zKh;2xhk2L=kUBo|u*r*1L26V1$pblVq&z`r?N|hhg#1DTjctJ%#dOHRtuMb*M`Hz7 z%@(}P%&4{J*}f%r7-`tQFG2|~xyn(>^Yim6o6CiAxhNDY!Q~&nFoT?C5XZvj9g+UA z>z%dut7^d2Mg6V*&6TK&mF<=Yd7jERMNqQx(V9=>zr5|Ui|zA7t#^-F~#w8qI{u$nRhwCclo1$=&&7OnYp)1fm9fg#Z=px@IkYUHtQ!RxjxM& ze^&IjXPYh#tW^cmW~?h_Ni%P7R8M#qIC4sMPqwm+vpXY}KL`0VRraZJ=|CeqShR&? 
zJ_cO__Rz6W#(rC{xu$%U5c(0s3?GZ}O~|iLZgTAbHy!niio>(24oB|%VO$m^3-___ zAfB9um+7zU2ixeg(!Rk=3=_ENL+fgvD5(WMrt{q&MMNjO5|Itik(Dgk$}?a~7AZ1S zT#t7No&4nUEfplK!;+e=IiKXzD^O(C|D=6SozxMEC=c_JfpZ|0K~J7K2L1U}B=dZ%HJC>39*|-98D`4?$s~;eb|o zZ2h*c&L-~|>Qc}jp z&Gr<<`b7Os*88e1CZaCGD7w6nipq%c$@O_j<K6qk*~MFC-P zXYOUv#d>Ive1;oOajEX}FxMM;z_IUZjbp2p9?iE?YI!WZZiWZ%u7#iHogUhbcOCL= z*%m;z0?g3@({)|~KG{3IK@=Fm`7+s6`9-b=C?P(m?|i6_aPstCK6Hq+D^Ss0nc;UW z5B|=3lo+O4OpQWh8)|FAu?Ya^Ew%$JKY8)AqPKWOTff0>{xhw^^JN}9v(dkTl&x6- zcs>Hl7qJa)1(z0mq7;^N=IFrLIV1a*u=n*iOa+G3v0?I|*<5Kr%FfI$*;+a{+eqpN zRFVqqfy{ayP|kV%eS%=Y< z2K)lG{2w)TVnFHaeL%o-H1sz}23};smXM>FRdz6jm%)HuN!o;RB0b+OTk2`a$Aa0A zw06KWVvd~V!_3bN2wLiAfPXqgUF{TfWpI*^W_P(+0cc;2?;?9IeJ(8ErT6t3SBD@o z&w*PpiL6gbmz;9{Ydq~?jfzkxh}=z7R{eW^F)={ii?2%=Hw!Wgs-xW6`)k2Daeg@^ ziv1}iUWCwt!;Af>(>}`U-g04k@!@i`<+A1MZ~1uC8AB9hjdJO0uD8`Jwn8KlC7O@k zj~(n#tZ$b)tPjasC(FlQi06$u>C1j%A*e-4fuCL2PrI_XySw{MDU~|yKkU!nIc0%d z(r6tA4xaew(Ccy82mMmU3F+DA7y#C^fdNk-$;B(iSUN7 zMy4V^6EerxW|)4Bef;l6igO}uD@L&#Hla5*KkSABHgFX>ipv+ndnu%@#t#q zbFOEFFpfgtlO#GR#v$`7#yMST;;(iPS@@~iye3P;UpoXL{J*m084$i};{6LrW6=;! zPPo*#mHb;c9Y4GD<)HErRWyKb44-(6Mln7lNyWk0kzP$9sp?ms(yGD_4JrWB#B5V6 z8U=3EZS$P$A5aAgF;iv5K6P;MF0+0K5xbj+0I|h^s03lv2o{*H4>AWMQRlAl>^Tx0 zjRk;A%X0|rT~!bKk`51*`Qm?gjpNOQS$&NP2R1zspv{Nhi^U@EDg6gkK0W$E*;m^} z?I%u^w@03c@id>DY!Ih1;eU^ZEAf}PPa24yJ)-n<2j{t$N6P0dm${c? 
z$|m^P)9s7ns>{hL7pLmB9~@I6nOe@Y@6=WVmhZ_@CI`$U^`(R514f0FuiU7;uQ>I~=uJpY1$5jw z&2)?pr&9=T;zeT4l*0`GmC;avxSY-=YQmfJ3KJSg84DT}uP z3}@A-dyyHrXtam~Ib_iDVoipPCi{EW#Q?3cSA?CYIe-rKE;m%)v+12pUGA{MmuOYu z90ZdyOT$nuJtT__kBx5nO%}ZvI7t2%5=027AQW;(q+cPa8`)7;Tqdn!* z59!~j%$Jsz1FdiRANQn0p8tDxCULnIwL2BHQD@V1vZ;I-b!n!2&ZMkRPgxJHlp0ag7rjOe$C4BWPZbd0rnQ5!t&{JGQ-u8VxyY#c=4P&9LsN;6(KYuJ zpxWTbW8@Q*b55Mwq=JF?_pjN9$G!$1_J~zn)HI)BKMYa3uvBk z#oM>cT9bkc{ltcBnj49ceqpB$p}SgyllpS%+jniVl%1LE;B z>(1q4zO=epMm_KZAmtf zv&ilT`%8C{h{D8*fca&pL2!n9m*m;=NPxWiq5I>sq}EqX8d4?XU+zBiy^LA>u*a}Q z16|c@zok@UL-)JFehdT+>R*CdTUM;!z-Cj*)J1vJat9hxQ2|cIxEMa=dP=`FASY81 zDLn#US6LQIO-L2JycrquA9cajsjx(IX2{tASz2szu3nB~0 zE|-QP4;KC;+FtI@9t}|-MC1CAe?QEe?(ffM7F?c9d?5x{>z7c5a3vX3Pb`O~j%D>n zBwv#5v9leGdao2a=XAQMnlcYLHZ>5(>hwoMY93JBu|>qmE9_O=|8 z0ACI8S3e6VM9U;7s1(+IdnCssq~QY6(-o}Ogft3-xbQ%{#1xn)2?8K08M(SK51+RW zMd&+K1a(x4Gtz#SZVY;0dl%G<7e8_V%cxBVSrc&W}b6iKV?I+PPs9s za<(ZVqMl0z9HU;}I{0mr5VrRb1$_$?E#aRI`tv=d`SRN3QsSkzg0gO-+Er`4+V#HN z?U?r5|6kTeA8^vCDA6{fx|7Z0zOiwy4a(T1<;Wvy(e{ir>hYD$!#ZevWeOk;l9Hmo zC;K^-c<9|1TIdUx+s0Q|O!ch{ssDT$j;mS@k-NtK#VhI#{XfwXKd8@EWl6~7_OctU z%Wsk#C|YFoLQ)-|ks&LjRjH%e7c{Hh*~O~da^LDT>2@_M59l`NAf9+$&(NBiOZ4qu z46i@^IIZ~MJYWtdR4V86Y2(pyc5!)Mgk=6j^GHU*82}RuG^W+Ty&->|F#N5aCDebdo&J|aQCSL=aAWtBo2q*U>M|&$141cc944pyq(HwWZ5ASj-RRS9>y(*yPl`O1HdDi?d(ds`_M>gq~ z_3;&e=+yQe$EjL6Q4~Slf4f0G4QwNM5p74M*Ma3hSZ89JaYJ*tud?%D1gAJ(LASB7 zN0tHP|3LoDNmt>2=|Lc7DU5<&R)Z)ZWJB{JZ}wadW35VsKhV)kN*nDl3H!PQ#%d`h z0`+_{Y5Ct?|9S;1o#96zdq~=BvuZs>%k05~02X`T zY`a&2=v018#23ONAs!&(1X$YcO~*!Pe%JZ_)9?KCFn(cxB+Rd$JSw4l{_oZ4DQkRtWgVfikKm2WoaEH7!?06PnB1a%pX+hqdXRD)Zt%^%S|vcDY@pQ))!AB%wBruse@feC_?2x8Nwejoj06yl`Hp ztmzQ=c&laq_uz`=ssiig@&LinS5Gh@mHo1;|LME6Amcks$i&qErfq(N*t_sg8w}QY zbOtcA4%O2n0Mx4gq->I4R5vE^{i$c!bvVWc&0+`Fx~c>N@PO=Tb=}=h38SB`?D3#@m zTXB;IUc2+T7zr?(w(C}C6a4S}RYPWjCSpTthkW*Zlv-W-a!An8!oEcGQFR!bMPa?`r1@k>)F{v2~nDFR(Z9yb|y6> zD8f$5gXF!nHPdnlOP^`FJm^xs*rh~i<{EKzeI6rBk!PF2d}cri*r$VKp;SU3KRpGl 
zuLNf2Pfep1tfy*OK2y@$EA|l6`{-PJNPeduGTkko)yyoQye(aDC4&m~M@oqQZgoG7 z`t{HJ5X{2BtqsZ_SQ_^)h3yzy^LuTC14C(t62o?UNJ@Be`f$kA_q%BZMCL? z+Cu)^79e==V+Q|P7t1WL{09N&k?BdJsh^ES9KcdJHSc+JRy!CxeG3d`cA36kAHP3L zZy_;1$7vI9-`&rGUhVhxp0uATBhb@Q%M|VCBDLgOr_rLhkM_Pd23D|89Pq5oA3&B> zP5Xp9rmw|xfhzMLfOW1q0{}4Sj52~~B(ZI6Sm>|#cXVz>FaO{PMbo9{lm=osE^c}D zrE0c;pLg1eE0)@hfkElMcYGB7h(!Y+pKR_t!ixE+$@42n!xlzIw=U)*$hTJ%3`G@- zGvuiZuk_>ds3Q917=5x_;GBc1@z*4jLoeqo+w5>Jek6C%gx}lklJIUhB}=rB_c8NS z22Y`#YwhRls2IB@ia(`=0=_|fk?E>^v9?pp}iNrsCL{_eir~rRLbrq7d-Wk*`MH4o$qj8 zEJ*+M=ii1}wDHdY`^^f4=L5nj3V@uu!ulaE(ybVmZ#`&i8xhTKep&cK)Z~>o`7C2u z^c_yQaomP<0yC$*O|fGRnoGl^8JVax>QAdQ^puJ+1cmJ3g-lCOHy&**1^(y{5RHE& zga@OJa%$RFYDd{`bk{iYg!*{xIp1NR8K2}#0d^r$B#~DngBZFezcE|C5{-+Fw_Qeu zd0=&M3Ev!vRtHu(N{fV8TiIY)FiYkR)KHp6Zsa%2WRyh1byRmT@5<>7tsJg>Wa*sj z2CWe+?BtoW&ZYK+NZI$Qy^pq{{;jwk7_*9`|2@i`3Ra`Vd%N(eK-g(v-Ll*4DQpQ7 z{(53I9s#UZ)mA63JG}ighjV`VY@g+>(*xi&RpV{q`PYf(YdIm;w6SUNG2g!3&{7<3 z2Z`+dcdXc}xZIOtJv8*0H9}#KMi|F1nX*>v)v)B`6?S=&tNV^0Bbz+3`!%WkYr+3d z?+=+o85u~viI0!Bhfo07$KlN|3-KN=01~4UFY<>2T;z0vpOZ6?$st`Z^IjZKOB-or z>8!;qmF%w_Ys9r|j{M~%LL)V9Vcb*9uL`B&Sr*5U?g3PdnG4}>%Z2Y|(JvE7YUoX$ zo<~krdcw&NZ(C&H@8k@Gw{qO+_{qUTgZNsC@1mjcT;1dRV6>c;yxZ=<$xjQo5@S*$ z*g)%&U_his4yt3$Z7*Ok?s76Oj{d7-i@rMg1D+mgwgF29(R%#*qLffQEb_GvM~mV2 z!soqt6~_7%e=`-x1g;&k+$h`Xod0^8MH0;p^Mxn+x`O$&Mbn4`O9bXi;JW3^*lHe? 
z^m~9jn-x9tKpT1CJqr1}L5ltIK>6g`_em!EttOAYq9nDR1nhsJZQp*8&}p%34q%)% zrOyB zW!!;atP~biC`ni1QcoY~vQ$4DFD<3=tT4lgR*;%rf?5E>>>TyG$*F&}S&3H@N~PBP-4C0d}cmQTvSsIwW`?d=^@EGs5J85j7Nn_90VTj z=lR+Qkc!oTiZLfJvX>|(DS%Q_g|4dIbguSAbW_Y^%}MurVvS~MZz{Yt`g#j~Fr$Qv z{Z?_9A75CpQ40>-Mu|R`gTYm=bjc#BN?TntX*+7hOZ*ji>q@?_H%wd82q-ouE(IR4 zE4N5&w;YJ+snI-cIsS68V>-k424B%7>>_K&DgC8l3Seb}oYy9K6F{Ui$@njU zn=hvykA~Ixy8g|Ok~Fyk0KD7b5bw{{nikbHVN{gDDtMblOSVntr2>C5xADTUY#5|f zr7Xps!FN8~>Tap@>qjao>uIN0$7bf6=1-ddG7lNqeWo2BGGpML7W)%t1 zKKL9J96c)d?CcA`l_GLht7-w)i0r6weM!DsO_BeL3(Dq)cj+Bht!%~>A<@#q1 zFlU`z4koTYgDngtZ)Gz2B*{Q}ThXDVMa!*4%=L>uBFnzcSh*$kw)aX()z7}u!$X#) zs$AobG4}z+gMXeqSTRB~t}V1I;Sy2WS`;yogpQpk4P2_v`4(v29)hG*(B`6fo6)a} z3x;&QOLF8YOcD#pIZQ7(_Py;)jRYs438U%$R^m2*fT_o5ApSa)l#vo&4_rP(gDUn4 z^2vZgyu#YCE@YoH)jeJ+_|EIzW(wa-_p)>IewW1Vx!RIQyx-~0OE2L}>b*Vk8O6sD zrHd+vSUFu;d_|D9ANMXp%MbYXIBGK{jE#ACP<5yGO4bzG;{=@r18G%dy~<2)Lw@() z*B~DZ9FxqtB(^gd1aH9L%T}!@%OE=AvL^2UL&qSF8}DgbK@QyWp3BRet)lEkG?KKw z6va<5@{MkTSK3IjfSZ2`8n9sxCh>@Su-4rFNL3Gb8zvB^$n4Tmw)A)VZ0k@_JQo`# zBH(zG1uPVMc+hKDI{ z7Z|X$t$d^|tCz9&*1f3?i$Jfg=>X~Eq1#tnf#Spwx`#176EL6 z=M1zPaG&Drk6wRgpJ;7UT=|hlctrJUlE24-#zaMK_-fW^4O?%h)w!F$&&J8c$!JOK zBc=Q*YN)-|s8*efqMTbM!WfC(}7NZ@3r}k&#Ne zB7O_FFDQ*d{?{1{$R`zs_1*)&u;xZoNOgHU`TQg}P-ZS;f-WV(%akbv@;v0~c(K=n zo@rfm-$!jhy)EDQ1=>4_&}dPHw=x0*0c0BgJi_pkaj?y`J2V=}l1aY!ox-iHCoFR+ zx@fAm=ww7c%W6N)h<+8zbV-gnQ)AWyvaL>vR!jEB#_3|`wy;0t)=jD3<9l&GDS15_ z$-aXAJ6QU9bp$Q^v+9NgSb7n_&mjU(@2t#qYE+mu{E9G{m3)?Jjnoo-x!7UwxYvZD zmQVf5|D%5NwBo_X+DWsUnoC}koO?(&I4LWZiH#~-eGd?$@;5nHS30&~&As{Hky>5h zU6J@iuGxX0;+L^pg=(0fjrpyIL`?|#I-)hQ&T*b{tx^<4@5fGde3hA>6WPJ&QG&Fw zwgNnmczkg|1$ZSWGer)>_Tyr^5&>7U6&QuxOfv)0#4x`m1HVCvGsOF%1}8TEE+-sb z75Za8xtwU+Wavu!zWt0Yc<$f4iV-~$POrhqywk5BY>zd%0*1rbqlwjMO`q~w z4M2w^GkeMhrg3~(wx6e^mz8!l`1to=%9JrVLcu3Nqhp$Eb=uQt>IKTLd6T3{vmmr; zihbcIwAR7#qzx07z_j@1Wv`P1VIxoA=>~UnB`0`ZGzN}(38d8mC|&HKlckk z?)ICi<=Jt&w(;04Ez!fSbkAso3Dr01IW9y~hiz24b_jWHRG3RXW;W@R_4e5C9@Wjo 
z?>FM<0ANOJ>hEE&8*U|Ndv+zG)9-9&UQL?~+*i}TXQl1^u*B`gdmJ4=ujJ41o*Cs3 zsw80kuBTS_#n2i8DnkyBe;77;qN+?8on^`Uoh)*%4y` zuQ_;kJ*UPEX7|K{5GWX+qDtp$rjaUpAMp7P?nQ=_ri=gRR{04{x{3k$_2shiQJN|{ zKP@RV=mpT3l{M&2wd5E4feWQUPnr`FcB1mezQ8V5tld<&x(G<663E0kzlFuf?(*m{ zXRv2dYHAnuVql@5OP<4Tay~g|{PftHdqu?s!vj<>L{>&@?7j`Ok@KI{b_s;}YQ;K~ zT>rNmFd~^U!voNoR;yrI5&Yo(-Nf+g6x%S#t(EuVb9Nnja3k}<>U#_8J7}Z)(2>dY z)OZScH29vj_STF=U&Ai~_(x=mrXZLfE_0vffMQ9@Dn4Fc=LTqtVkMblvEq+dgYt?= zf2x03T(U9c0z;)DUn39zbY+=%tXu+)y8L`H-@e()*qXC>i# z*+Df=U9;#x#c6Tk{DM6&@B3AQpOSB~6|xc@^FF$P$^a_t<$tzA$=1C2syedey*z2@ zL83|c^LP6V5~m=eGH4zw;*4N+0I;NtKHLAOf?qS5>TNkED)&+YZc7p@H+cU;l*Y&0 zr*})ig+`&1kQ_+7qvYAH=H z+MCcqAd!8pTqXM5l!iPZciBTQfu?nneCz|>M%J;P5bG=y`0T3nMsY>XVa0~In!-ST zsdro_YO7xU>rCFa!1TD^9x0+%$K$VA#tVvJi^s}q17lkKCe>22zhsn?Dw&UW*R+u7 z*fKWo7ue6p7J>IzdFYUtSv)Z6aEl~d5PmQDmAj5sRtTiG=>8l3<_vJyw#$uzh z>};%{7JOlA)o*@%MX)&1Ji$NP2-;Me?gn8fZ*oej2~(V5)g3DzV{hfJ=PacJP7wFalr zGHt(y68~DNhOf6}ig>~o)vP>;yqZeRH>B0Ze`B8x%Rb+uW0FY>v>qRAvZz|M5p-r5 zSy$TrOR@?S^WRPbwtm>BAATG>*Q8F3wue52hMK`_>vD{9ic1e8&0B(qdB8*OvNuMP zfIJOO(Wyux_s}GCT<&oC|tBgg&IW-kJs%vyhrQ z1Zdv|Lqmg&V6tsQ$Uey|bUGgj?JT8edk1!R!Bp#G2}axYWBnJ-IlKsb)ka(9i})}f zdR=(77P=-Qp%bj2BA(^{Z_LtbG98u1C7&lSI0{`q;J5|)k0<*#M?bfQ;CrJZBLm)e zIF=fV6)W9OrfzM$rk@H|F?6P7gxxVMFRPsFf1R35^O;En-jg6M{;D;VHVK8m-Y5h# z1^Eo*l;#QuUYK2cJAB0v>;0ob#mw$~E4meEv|)W86aBdqq@^X`$au}E3*ZAWu@nQb zU^^J6`7t|a6sflCPAe5y3pD(Rq5R#=e+X^!dOOnOmt6fm$p$)U_Pw?6dlIZdpAqhT z#kEFutfovd2!!$Da^ix~X^nTJpFh?gj)5iZ_+Gt|AD`AL`ee>8m5Uf{EI;lwT01() z(dOmPl$4admnzs-Tp`EX#mn?^F^jG4(SYJgxWB(+u}h@FdHH&+SG#0}kx}o6>>KHS zm0-ONB5BLW9}+hot_c1ipFH9XjpJVlpRkl?Ok_4^)9Dp0q6H9-VPdN0uk;X4_*e!ux8sZT8~t@LT!X-RNo)0FM^b^(s+gH`>M<1mS#sur)R z7PjQBQ@PmV57+pVA1LCIHC5p^;lDyDkGef)Pz%r0v_Km=W+X|PT?epaWRU(mJ15X< zrKrHH4RM1F+FPBw+_cFs$$rDqt2_>DO$DpzPhf{Q4JxodmE@-bU>K-X0UrYrUx%<` z418NWKd%26urwQGK|}2`6-3{Or~^Ro)Nie59#J;d1TN}UDV}?eM=d;_Balli`zet) z$`&kME`ZdgBAfHvEqFU{&1sayMRrNbP_#xT14JO+A#+&c^$67sGj z-St<8gOjSaKvY>c9Cey;M~d9B6Ot5yYUo`CUz{ 
zO)MwWtG7SXRFu(4k3%a4l=?wX+fhs4n&Gm>*yvqtS!vo>Ej?g#B{T_>0aQm%JTJD- zVKr;}X< zljkuSEXwGUV}~w3(r%dCrU>u-dqjm??6L0(VNc0(N`Truc5}K;fP0^4w6xu`uzOKc zZ-Q1z>d+&y91Cq6JT4;-ZKtvF9?uC7;Fy{4#&pSiFB`W1o%N&aJJ~hNuq-MpQ2GmCGW9> zk<=hHu6Sg+B$}}Aa=i_b{ESOWc-mcERt|-wo%=y$I0^$kCodpW{iSa>bOMCq6tS9Q zLKgMgE20iq5I@+e*uRx`_{z~QZiS^cm32TEbp}GyRoeJ>+dP) z5*A+MdafT+90h>qRN(y2?ZeZV z)3s;Zac=oRbrct&>>HzLHB+6Q5m_w7r|UnsRos-=EopVnvE3jJ=bygh0wol<-Vkg{ z?~_jgJPuWZJw$g*FXotIamwf7-@z8QFTNy< zYhtpq>pS+ZN%h2eeAk8<12TF}v}bW`AUNPl0m~RCfSU4^yp6SSBI!o703$Z8F3}>- znXoC{>u|#TxCCFoQ@!@cF6a8x{LKCEpMOegO9=acl{VM!>(n4v-*y|xyTa#j%QzSQ z$~{eUd)nTz3h}K5?@tdV#&OZE-8 z{9%#hL&UWVUbg?ZG4xk$a>te{?%>BZH^G?-asdv>y0Pps4i2vAp$Tj(YVxJGJtByn zwztXqBPU~SQ|s}!IUQge^Na}bR7QF+H>Yf%AH*4=p~|q0#K9PUwu;hx5r7CeJ@ZE! z27bsGtECK2_m07zbb5`X-|3FL<_0)&X?We+X2EjUqlRqHN8nraF6;{itrxR*?K1Gmc#aJ#A)#5@+kSRc)mEKA@pKhvUO}MmvnJK zCVqdj5fXa3e@$C)>6`Z5a($l`s3hNPln4!cV&s%{L2>KG60H80?1z1CXr@+~Z#}Yk zydpN}9Y~ZaQP=Wq%d@kwqv}Fg#jshGe z4*uZ40$`vRMU^}gPK7^n4+2>_fcRxdY;02y#tmmHO{Tpk z+=}};^3;Y(LZAnwf|uw>$~qbQr0F$PTZw&L2zCb8`w3Eca;ob6G33 zj*~CW7bPqeZ|~zLC;aYg_QPeJvdwW5pjT?IH$|D~1k>!b;mJU(cw7uJiQ?7>N2QO- z4u7_+;_mDV(W22OX79;o#AIY0f6b#3EwR?7sDb?IlqEKf!|8Y2a(sMz4&&Xd<-Tx! 
zbGiF)&pRlqM2QWyAg@;zshD5vc8{m>X>*5AaLa6g-b!Ue-7M>(@0wj=w|5m0m?|ynX{X zOHgWQq7e9L-jM8nj}qLr=L74Tz=M=#2s?bbs1(E8@N8qiO5~-&N(X7vNKQp2$jr=M z`YFTpJ;{EvHnntGoQQBSvsjrsUg~jups78DYf&J)7hFc39vi7u`bz%VY0~)?i#OOxiVB^<%K6!iMCr+3IN)2?`}j}b^8ZXYoLEUY8<{6C*{XN zLnBEPp^>!kL0#=eixXD#0GyC~Qle_~9y`lhkNrzx5s+c(% z!;An^jG1uuI9gNIO`C#siMoU6Y?^!TX$}OAoSSY5K#UsX~(SeqiainTm8N z3S$5mIE+_fi?--$O^*}ZHi8;M59Na5%UzQ(lpz6N&pzl*hF{LI8;|nzY(ZuKB+e~o z<(RTCe&ei=r?-{w-#{et#@V+hXDIR%=)v7`mVqy@e%#*P-k{H8IsVWtu#|}@^68+$ zip~o?3jRgaDNQz6jZIw5UK<-6ZlTvjxhSX*LtXKYZZ&w7u#VLpukRdf-TGy0#e-~Z9WaKQm$qz_v~u5*A(ap#ML1V z=#bMn-^T9RmeD~Q9bg#4$8YJ?dqs^EB>Eh9fxp};GGQ*( zQw<)@{ct)1qwKDE_nYyg;DDgu+5#KsGSQ5(1dKdtOlNgW`Tc8oHCf9=2ST5UOHe!;-vzkvmJrnZ;Ok2yAibLelaQd`*v@e>3agy z1a}75Gn+cE5sT1@tF;c}p~Tvat%vVkxxz)lyzqQ1B_Y9~@=D724-}Oz+$p`A+8iiG zrRp5cgGpC22-x9-pa6`ZEILxOId<4Wa~#EAC||^H_~0RH+LzQ+s+(o@X3vtDzi|g^ z!sY;HEfhWZtJI3;m@o)F=9=%!fp<0Cpup8=k!sp!)r3lq&u>P42dE(vR75ls5EAaZ z!`NK&ks0?Y#EvbaC^lankp%q%%%>9B)um+-LVosM&iX5&%fjjOK$p*AqwlZFOd2CU zfgO-#;h_}A0sng8{hKmXM0mO9K>%Ozk6uqFrE#fdNTHx2H?XJf5oX)KN}l?R8uCWtIfC;izW*X zJk2kiYMVpO?3W5lo=y)RUI!7XJ^K#Gas}?Q6r6sD;)6AtF+#pxN_#4COR76lqTmY< ze80XNZlt?*9_n3`a}Pak)Q`h%85{Z{5NRm3Ih#~J@+9D1Om0JfI>MN4yz(`Tsf-$v zTBY}PUEk@`X7YHGkIU^pbDez_M!kH{mj5TRtnJS4?zZp6$G7|4%B;vgBs?SDB~52I za&qZjwGxekiP|Fo?+h&GDg3%w&rARS4bVcWn5+(~rTS&X_{G3*Mvxljx5K}#cI15% zJwm_XRdmhoioUFix^xYw!h7-l`oZg7mj+gIQ6%sL8e~gQ}j*>z*HDV=*m4YwO~Ya+#sq{YwS$C?U5mLXHkSwUVA)|nBr79M4JSjtFIs#vrrK|R#W zpULpCMp}|yktsPZ!LgqQ<7Ag&xsmJW*Wea1>odM_LLlR(fo|P0=&e7}#eTi|j**Ia zohkYyE60Ai4M&lr8Hvm~@6o1b9zZm5avBGJyOU?7qJrZQf<4_Rey+>qx~+SKW_f9% zan{q#pd-$X#sSf&d<6Qi*K&GzIXz9Zsq9maQ1@Z6#Iv|FhhU9?a4PD+RZFk1FU=Xv zwRck%WqGj{7p7$6I%u(oD&? 
zkYE;`cpe(z`0A|BDA05HX`5{dg`y0k`0bihw+*w6nmF2`P$Tly){?Vw{ z6!PO?de+;_x`N2!nXlKr5Xi3lCr9M}QFQL{O#OcxpZmyVF4fYoxs*k*DA!zEcf4jkNvg3&K~DH_Brp*=XH5T zQHrI7IhPvm_*lN8qLPK+iSQB!lF^B~=~d`wp)F<1`qkZwVl!a|K?2^g-JwC7nsWFH z0;&UGQ>xi&|I6wMDRB#UNmG-!g*nevq^N|qwX=OU^w;Z&fiaLwvNWZ-A~K|I4qdSy z5qDTmZlez_&hL)|SGQa=*B7*dqnQU~RqEY7!1G;*R11?0&(F)-F|@(sos3WidQnCa zC*dJ4kAzk#+iCOpvFQyaSABHLHKgs2hj4R;kjyA2^y^=jhFOXOZ|WXK9j@*&RJfbA zDQy?yv}o7#QuS>da(H}jc0a~;D(RFFG`>i|W&h6}tl~8O>}N#fkJj(au$;FD*aJH# zugSWTqhs^S-MGngiStd3l8usQOgQbnyCR)|3E&C?sWxy(U2C3Mv z$9zn>C_*n}vadLj>A_W_@b35M-Aft;;cd6hRpf<2QtwT%v1t*`!OXw4^Qa6 z2RM^@;@LFS(#lQ+V0b?TOLKZ{PNvt^8GSa!N5K*jqFYvI`qwNJd0iOp9hgF~1wTKx z6-@}+x2i*#OZj&N^dCsTgf}Ii_~*0X$3K@MGGTPFX$beX{VXFzULX!Cq0|L6F^0a! znG37G7G0x6pir((qjZ0TyMChm9o_et@vgxIg-Vs>8#3ZD!g(%Br2Q~*Jozr#=tAPF zPEftA_pw!zb7XAIU_b7ZU1E&K@Vg4|b%GY)ld9Loc%bUEnYq+>DA>d*Q*_Vfuu6=4 zmVCTxfe}QrbWV$nEi|0lP?h2V`b7L;M$!r3`s$E~yD~|lJ$KMK_Jdxww3^6N>mP+U z<>vpK!-H_bi3`)+m1#y@U>z>?7hxe`wn3MtK=yf~0SC(Z(22GisEedPA#Ehdcc3D&1xL+s@i{=-CR@8bY;`18{bx(S30BJw13-8x^d8NA%WkfL!24gf6r4EzF`6izgi z2l2iDDOW(hbv(T9^&-^%OJB3%Hk)DHtnbtVfVO!Ta!Ya}PD%c6tv9&5)MJUdh!_tgG zfr$P+wSyI&=G9F~L{vI)y->~|ZtqF@HqT>q!Nw*weJhY$R87+ScB$$5PO$^9^ZU_9 zK`Tcz0M|#Q)g^LEqS5{Ljk@%}t^xp409wXq6m%2P3X^}qAvJM#eYmOpTJlP3zVCQc zRIdYrM059mM|{%$`2~McxiG*d33m>d3t(caZM9cb2&BkEsMYA}<%LI(Z(j(GRN(kGh0=9SSkj9}Ap#7<~j8=PYbg<)GJ^P)RQy z(4tZ2T$lB9O0Cnm0{dg>t>_iB)>OG(^Q431Pt`9&1?$ashvecB z3r{FnFJLD3Lz%mMD}=iRp`~K!RXLx3p9m60jV#~Ptda@ppr(;gMt@~MmqpO=nL9sV6%*Xrq<)f$qM z%d#O6Vxtq980UOjB2dS8opDcjA0@wTBGMhX0)kZh`B3~qwLfu{^kyDUD<4bXyY~*S zjRfsXK7nLjNS41%;*qa^O^Fnbj@ctdiNN?RsPis6XK*PTvVCPM{o;qqFXbOBk6ka< zxe8U3w^)*zhnt-r!Qbs4ISCmtZMZ9w-4kFws;OV4FY&3ql)Y(&1in}8qt+Q}tgWw; zbVOX~`M%NEgu^Wwi?j4Zg87ll6AT8!1URZm|6o*+SGuk#v#QgSH?q6C9mR3_r;FLl zYBwjhP$zIY72jh}1PKkvjNUfZY+(>86Pz)?atrj;R34+hV}ni5N55kUrBAqmsVDi1 z>?tm4q^S3iv4y5(RHlwPv|}bj!otlJr#}a)Xk2lHe-?lK+<-tKVYt#?njvq0vxISJ zj8cN=r1{C^L31S78zhK>!d`0*uKSpCS>)zk293W{qh57&`VpmCGIsyhnDNpI1!$GYIe;xUGgxv9C}tB`IfNDd$kF$cb;SG<<6i%wV? 
zL~znIhL>VB7NUDQ_4N%d#a#up&bn_scaJ~v?c3**Z;Og0v$K9N5}T7H=c~!gG=9SG z%t2n6BkEJ*N7JKa!_AC8@J_2jxl+YhC}-FwoHCLTaN(6$6*~E~`z4{MP3B7A0z?Lu zHRG&}@?D{X=YdmXT=Y&7!E&i(Vfu3cqB=D(n}mGnvzJA`!R;R45Tc16xwhsbTUvEC zwj=Jv?@=bb=WL!EeAeFE7#*sstE(JDa0a?w9m(95r}ZtamYquxzsYKS@)AB)>-tko zq1DyZ1${adA-c~3_v5I;^z_oAKQUwpPs=6QeG5*k`}wDm*bfSR-D)08gUI8)d!l$W=Dfb zD1kqs`{&#gJ`vHFDXxxN1(+qbB%}Mh87aVNiXQmToN)K~c;fGOAqDC%C*gk=UT)g()v zvAA)!q*mhejCg~#Jx+(=gT2np<8@ubfqSt(bg&0fl_x*zxmkRE@!z$eA2FA|&+ph1 zDoP9C|8mk5uDVc{+q#WDiDz8JY|Q4A6@`CwzzHhXKha99tR46$7*n&`mX8V|++8H8 z;aQzt@dtla!Z>~4&ntO2fQ9YFArFJ>QGKiAKY#vhaC~|lc|T>~`S!v1T4wP`B98N1 zJrZ4Ns^4z;Hhosqx${9!@0eq^GY?Lx9Y&P!zw*eF*c^@^LM z3X1o{R-6SqRguE=4g8Lfbx4Tq|3&R%>dWa^U&a*oP`=KD+$9i3KH8Nmz1*M`Wdl=q%%iSk6!yznC=rGfP2%>*44%QdzAXQ#q?(h|99&V$r zqoD?4F2jkbX@vuvf+D9A*j~{TdPtBS&#RYkd54wi1qqX=3#`GEq!J?ef~hiQ@o+og za4~(22KA|FaTZIWhxYfd>(F)7KBv7HJr=1>#~zql=mX7A&P~^})_JWj|AXk(OHV9b zf!%*~k-Az*5lp?+FPM{z?Bah1N6KGJ3?2ka&N+wWb>;a0YZn&Q|M)j+2Lxf?dI**V zK!FQ)zalQbd`X7cK1eToj?bbJ1!}x!z z5wZ6Y+8tG@I$t^6tmUjy1)ANXoeJTFm7|?Y<;1e}X;CUOwWy9tYd*($o@*~S^ag{z zDI%T_sb()S%Tmc@_lp5Qxq;b;V%mJ{i5|qf=Q6v0rT$hL1n+q4mkTjY5DC9Jex@;S zs$Vk&_*E6rZSgEWF1)5zN!@G)#S$BmvoLZ)@CrRv1X;qzt_PiknfG&~lWPKk1)FJr zs@Z^2GgJ5cfw4Mf4B2g9Wl$UT0y08A39ipf_mLLM5;nqFn8-JY)r-^d*ZpP4HOFfB zMJout&ZOF_YC*1gcR`PnDsTuSw}cSSDH9`@w`iWv9DBW>4sCd~3wBB9!?8Yut}$e! 
zuxGQ`WL#t*;~{0FuA)uvo)C^w+C?}1NS7-0IrI70$|VVyPNTeX3=04BW$j+wAvHm} zdsZ`(?nw_`-lfrO3YY`>WU?C&|Gj{@Q}pnBi|Jba;tU2g0jMpPZ-6~ zr)v?`pLj+?d*yseshA-5b#-UHQ;nusWBOgtQi7I$@n3b(E6YDE)6;vriiz`;)^djN zt))XOv*0shZMc)N=)p6nB2o+1#{7Tn^n)_^EzN%pt%rj(M}^IGNS1g@^*10 zn@tLkUM*_EVt@2scLkO|jnR76Bn`8@ZPLI9RKdyiipvcDMwQ z+K=e^ojKt`yIOOp%Gld}wAAPEw~zGFG1iLv1;Aub-~z38c8xxeb`}LL%ze#)tS|H7fhL zhkL^A&L%U=?W(iu*~a_#yg?tq^5u=^?XQbf9(|S)ZWT>_Hs$V7Is)R{rtc>;HsWj~ zMD{oTZpP6N(pNO<97|qd&JLVu*O{ukvBdymVr7ZwC0ioe(RUL zUnZZBs(i7KA}U%PoOS<{GW{;=;n=ZIew)Cj-0$B5y4aykYZ6nj@wz)BU`i(D2iB&?)IVe)&x{btPRq(bkn&cjn`EId29 z^xA$sepWjj)K{N}p%F#IfyV5!Jt2jQC=W_pE|k6CB7NtJLO6i?kDpnW;0b_ygcd6J z!Rm_%m!;~!+td8t^rWbGG}YHNzy8b9WJN30j-Oq(f4fHE9fyH#dPxX}W=62#vxJAD z>l-P(gec_17N30M^6p>CZZQust25&E>-ys#x+es$o5PD8Smeq?JK>Th&=qSg@wdl6 zPl#k37H|XvC8RgYoI1a=wbe2~Av~L^Yj2@Y@$J`ZbQYV(iSG1gIP8>OHFx=2;?G1+ zsJkh2;h3_(3{2kt!b4;A?sFzTx{Uj6d&MVPf&_v*J>3XfC8jHFXChf{ZyVxA_ItCrj_H2XsLQIR*)v~r!e7bL7d*i_<7Uu_vBpvL{AIUA{M7OpW?D_zzQ;CjMj}Q1U^!<~lDkIn*(5wsb$U~i0jHtI-&>IAa$OHHwZP=@(K~as=PA@B#Jq2Up{NL?Ya_~^FgGFJ0> zHa^7}FRLl_znS>EkL*N8CmZOs=&E!bF&?|U)#C|30FAhyj8;QaY53nOvpv~vySuwB zB~>|DRj(q|*Rg$To12&^YEMtP-sF0G#_ff}9gg`JC0Pl&?Tm(>GP#vs!yCD2PjU}} z@@wK-D5Cu?*zsUwB9QVF%(}#NgT&x8F^NTMMqMb#nbnlIufQt{vb**qWmok;=DV*Nsp1@=)nkaj0t+TR>*z8vawV-^*1Ax8nQ$iJ7rEr^ z1+JXHNHYB#Rco$H0na25>kH_XoN=D@%t&4WgJ(o>XPxtZX?AVwDWp+FO36qz4e=R< zyH|(7Co%}@hC9^ffFBJ{!pCCT+R&H)yh~NDmvrS~I=U>o{a|5qe<(5!hqztU5y>e>DfXki75#9mKTKov$V)r3x)IE+}8jmDF!~n6cg8=H*o4 z2{5j(Wb>F$L_;8{vij+FH?JT<{un7TD9+J`hmb|qO!uaId6uXlC-te~E(-0^QY_Mm zFg^twoy{@1NxV9KJm{>YiSUGO>YugQ^x4@ed)my5o%a4hI_JL_yEFzIrdMs78#CJ4 zfD!P z@9S<Wp+R`?b-TQLU-u z-IW+UNOoUa9{x4>xvbon<5+j7bkAD~nSJo*k8Kbt?zmw8?^Sl;9Tv)sN|~T1025)H zGTppDw~r!LJ+KDGIW*emL3;XZAM@erk%qH^1co>dRHXA}Aj&a4AO|dLHGrGd9+Vds zkD+5ffL?D7xb!FwWyN=3K_<>yY7o;|fiC zU{>3O+FVdM_EAPU4gN^d>|+OryHSCY&Xws%%)PFc4lw5&^q;}uq%w3Tnras@m(T-o zwtnJo21xNoig>R4nfAwhn;-^b=o3T~#RWy+)bSe$8(WTJ>ktTm@3k_w6lE89UaT;e ztADvuD}ym;va6Qr7?w@xfA%s3WGc*XsS&#SdZ1eC;8g;H$G4IzPyB63EfY`q85r2| 
z{_vw#!p_Xh4e}AzN2+#aNw)#qkIHepM?4AXQ?>hK zpLKW1u2=n#25LPX`(LF$T!=5r=ikO&#_}B9*jc&FBiM}=H5DIKCkG}bMjrk(|_bb-AFQ1bgOh?y#46ShsdDsGUREMbp3H9u>DuBvff zdws;18>|VJ%iO$@FP63yKKp;mNK^*E_(CNVYnj2!rxRv)qqD-6t7NU;r}%XiK?3K; zk3N;J0(C2RHLs|AfTStF^f3G@Lio=4zxG=)nvVtW|tpWC$9Wo$Xm%w86cv zCDjfLq?<;5K+)3>byO}Z!5sRe;e=5m6*RF$Y!T=Ua++=q+cz8k;|#X1Xu>( z)U#f-v@{W)*`C0V>8*js1anKLHy70eZU0-~;Jao3iM-06@T_Ru26oB0(1^8<7X}nR`-21uOa4=`$gXZtYtx1-{G*wMA0x{=Iw4*GT)3 zG5TD8oAH4nT(sPKdcwoAxr%Z_xdIU9TQ)BaRxPI6m_Cq~l?*}w|NfcT)q#ko zaK*S5<=PSB@Xbxm1hVrLiEg7bBM7(fY%f>J-<%#PNK(Js@V4Ax2|6f>SN`-V)BDw* z8+3@|-{k1CM>5W@)8_HtQFOJdyKw&7S3VDv=WxMJ56aKsu9ZXvHP;+9;d=u#gJi8c zSe|~5=$VbZ=PBFXmN4Fj>2=Nta^Uv8?Wq;?$v6l1OsQE?5Qqt>J&U4ct(xYHf;oi= zh#n9@&lT*$Abp@X?Y1q|6DnLzra{Ebcin@`;fuU4Ry`~Gb}Md0LYwL5tY*aiFA2sT zMzzI8Z`0%s!dWygjw)1&TS}kW`$LbK@<3Ay*d&j`nL2tdZ^`m(rzy+jYnj8sR7;#C zsmy`5gMrN)?zdEtK#mbe*sTlZ%A}z2T6jic=};YM{i@n-XXrWF#1{EGidN8hPr4iO zvVnqSC7zOpEB*WxdFANV?&IyO+^ZS0CBgVw&h26UgYy5_7wrv=7Us zG_cD|fyTmdb+q+PA5YGialbgwjvLk#C6J?C2~swD+|j!r%8L{B3gNx|Ge^8ArN4nB z3OIH?lz+W1p1ws6$~8iq!oXc=JA^0JOX`1MHa%Y2ycxk0vE?sTr=NN2$HvAVd}g;7 zSM`A8d$dJOt(U^0RcIF%1p8fv-6LqV1Hr0TRLe3WMoZvRVtn0~llBjjwATv7l7aO} zdZsyf|DGR+O>u=j@DbMdkd_kcG{JBF!r^Rl!9nD9z&KisW!Tz!Fkk7>fqikTtH{=* z;M?$cZd6d$8~nMxc*C|Nyr-Y8JaT46dw&LG2rA;0o=fIIZF*Z$j`m)6yT8b#?41K! 
zPfRJ)<`chuDp1ImRLhx(&tJQ*lMYIQL3|1YeL}ccv@jKVq=zL+RiAf|TjDQehY=hd z^PA3_X8(@G=Xe#b!)eMFNYKt&7i-@xY2U6noLW+kTVIp36AC?0OIUmE4VEh_JN%12 zSZ3{$4UMPk)ap#Xrl*g_7AEY_Sy?@jPbMwa@GA?lrs@t+;GW@0M=btA_X|Rco`i^3 zVlZc>r{ya_L`P{fYQgh_LhkQ;o#2UPPT+dt`|@z%u1YPb28H&{QmiJ z8$O7PU!?u@ty#>%&RKI02-y|!m-Xn(113muDl#|$)^{w=gd0I;K9+Zud{=cwJHaP^ z;2m35aihC{mI~tK)-~_Y+=_+(ZkF(zj`ChpE{}0=SgE87-(zE5-cbB3J z?^d{-BN1+K^ugIMdZm8c&YyvVgNNndgRGqqQ1B$m6nrU>fjez zE}TU>u=ZE|<^m^R=xU?_d-kf+ge6e)#X{gsT5aG$?M-RS6~H@H37^C%>@&Bqf9?AP zQykr>z`?#oqUc0thp~Kw^!lHWdl4uSDqtYU*VM~MLxDd-|1~(Jp9}Dcx4bdmrCC1o z27PM;(2km!bWZnO|?XV zmaueggrwbT&9eKYVftCo()L2&z#3O)?56UkE`-1_do|^W@{Hv?8;B3P+r*f=`Yh?1 zqsSS_N3&~n2McQMQ|@JDZ3Cf@@R3>)b7hy6u)W<^;AOQwqi$7Y&&IfM%J&aW6E^xb zBlXMdg$Pa#&$^okr{rfNCP`;`znT(jDKS=)?_kX}foiYgoIN_muog*V62sM8!uKb1 zPU014k~tlJdT5NCKVbrlnh<)@sNiJ|f9h0ATG!8prT993TZ_;|F(+JAFppr3ohY{f zaivBf@r*ysC|nMw`NUU+iE_g-5u*5`T?TWevVL9|jxu57r5JWQ!tAzZV!!;hyQJwG zh7@~%_}QwQ6d$dza!of^a)Isw{}{Vrw(`%FjYgW#9tqKz?(Qn*L4zlkTQK&q*?bx z!{DCS;V!G}dHdn&=#&?v#GMQ32?@8%a45DJoekC9^1}v@ecnEW!hrJgumJ}NW5+jR z;^W5V0D6oA58B!~L%b!@$m7OZRNd4db2Pi}A7rfqxUA#I+?QH1+vMyt>iJa6vkQsdJ&ec_4Uti81< zt}3~NooD9%HkL-)(7qnxOCj2y3jw7!J48CtXA-R^T3RYWE=;>FNAdm5%_>G8iY(j- zvOh=W$~hss05e}E7X|`zbBa1O`>o2y{DRquGV(>^MEtcrud<-C_@$YUhTz3@S0Kda zRz6<_g$%I~LsT-V36In6R`wBz?&nyGE|$U;L9{+R-W9Efc%4_OI-irq)1&B>7OJ_@ zc*FdJn83PdV&0v*@gD8cIzmu|n;!WX)_h#MdvG0XMF`>}UELYR{Cw0~USUC9*oQ`m zn@Yw3F{70O(c$hoX8;?NR08qgN4{vW+^}O&zKU187RamE3qNgxg4q0lRMZrm7YfSZ z(cxBjrLoRBoWeRn=MoOkhXsKnM)gx?Yvn{(Gwx9_=htDQ-$Vxl$b}#pfJ4m{gcxqd1iOGOYg?S+%ydgMTGc2lGp79G%e1xqz`3 zqRl<6&cV~@%Vu?L%+E9D!w%-v5}d!bsrKdY%je`Ec>$!j(<$K2XLG#2@YlTt;Z1Kr ztGn?nx56GXbbShKdQePr1TSl%GT>B-eN+f;hFyP5D^o|_WCdR%F0TQLW>);hlv%I7 zq1#KRbk2u0DWFS=Q&Ku~PHAYY2%Speyh-z*_2>FlVvZn6FlU)EX7pxCv&8VsA4r-w zGAH*t`NsV$=jpXqgb)F(q7#=Dqpq_QANvWlQRA2m^2$A~cowbN+Jt*BIHz6{ z?>bJ+%-38`@OTq?f2?J1pWj-0CU1~dFFDl{uV)id&7n#jG_&i~8Ui=#FK9;OE7;1m(f5Vq`Xj;}a*dT-)=B>`LGEfT>(Qqe8_{C{LdF 
zEx?x-ku)FS1(C#bc%}OJN=0XNRo^KBmqpM+XU7kI?u0j+wT({)Tx5DoEvrh;i%Um5 zNi)8D|76q^YYF9zk)1ZK4a)BJ%Gt2Jg%XxGcxaJbP#|X*yBAp|JH;3(plxa!a%!3R zFI6su+}l|}AG)}Cc(jXlhUm&LrlxFq1dNvPH8=Rf-lN=3z*B!#2I#Bub}ackhvfmfF>))8 zM!d8Lt0=$l5OI@5YnBH*j^MjI9&}@Ubj{N-=qIIh zLCrcf`DuNmfPyV~Y|HP(#1EBC_eob);Hkv_YQ`vlyAbZz z=m9`N;`c3bfiO>;c)ttYjfQDiOITME>)9T6yg!G3=D|n+{78q0#K=Bb!sS>%AT1o) zp~MXy1>UeL;qthbpK_9Ufz?iS16)b3RJ5VZ>K0aCxNyM!fsSVR>-nH#zNOYPC%WTQ(QF%Hj}(c0q-`KS4G=c%x3_{ug4rtc?;dQf-9NuBST!N%w{)E!(sH93IF0+p`Ihsk_q=>!G;Czzp)-#u{}rR(fi8t1 zy&2rfD5<+(`z%%5n}*uWShuZ(y%ocp*}YzfOC6mf5#H&z`rySX;lGf!GBv`{m&Y1~ zY(c`Res1_TPRQp!OO>ziT9@C{VBzqAN>a*RqnD}>i|`(w$Dufl&6aP^1aZdP=Z!8@ zo6~>L-&35nC=o0|bQMBQdya8ZJcHNxfiR-0%b2_I>a-aAQeimNwmBGe18~I7zCZeQ z)Jy*F{TE3CU+Bg)few{v0OgU--Nx>!9!w?2uXh zeI@2nfql!e=C##>gDrculA!!J@f?+A|Mg;41|Xk#R5)x92(`n>Ai^ZB@bHM5Lj-%N zCxcS40upD=MEYG)gYYQvMyWi~PVc!QAA`k4d(=|fw0^;4BB+5kp2jt`C8}L$1$%&8 zhr^f9fD!^Bk3qCWx7Nnc-ru#o_=b<_`WD+x4}3hUt?w#eVrswe;FfD$MQ|V>#T$wP zEdPK-0FS;ta>C&uvX+Bzrcnq#^kX^bhxBn&c4@(8+*{T)wv$JygY|4Zo)$wV)l-k? zHvWed^Mam&wxi>?5PY0E_rBVP<9^kmia?jE7ovJ~9{I?cPD_P%l%^+jfMNh)Bx{+% z-u~|ypqmZYpys;;ZLB2I9Q8RbT(nB{4>+7p-H{iG>*-vFCmi9Y-?}7)A8^XO^+KV+ zSVFn5C?=?_rpDFLzxTg!cLJ|YljZG?)zcil!DS10RjfHPEPj8_7tDcfKQz>q<>=&7 zc5|~;HUXB=g(Tm%1UVZU_*}M}!QN_=VfE7J`Y1{#h{ub#ubg10j?6FZ(T6}&`mI5~M-l!#ZVvhc30 zXgc}dqtPENT%Lpf5h5==N0U-<992@=s;@b5R=Xeh8bg{WSjRM-V-nA7Oh`{2ff%Wl zazNAiT~dFIUuttlt+;L9(>&%{#~^{Sw1q>+p&FnqnDm{;aLx!<#qML)qX}coc$Ba? 
z`3IB2(28^2tN8a46*PY3PHE`vmTs{?+JV;a>rn)^oiOBYUY6ykC?e18EFakWU1&qWH0i6{6pC5O&^7 z{(<&ubxNC~t5J1;aA=NtVUvsLuMU5ASEaPl+nN=6PX%u_u<#yFbrpc1REGthsE9_i z^6^v^zRMKzqi?xhb+%DS%Yi=3#cKv=iLF^K!6kRLe^+(EO>EmYyKf-fA#njs~~86IiSpA%6)M=$Kjq~ zJ9JH7&XLrMTcEP*ew|G-F5F_*@rRVkaeN}=9NQ1N*GyHM`V6kkHmiz>iP3jZ^suif z)<$kE)q$+cQiobXElJ6;l{VLZ-Tbfm27`o((lYwaAflA+d-dzwj)-+VhpG#g4y;L( zHT}^y*tI$lE2p^atKIB?elR#+@1!YSY8v}%fI2_YTrP=74Y_TwC8}u7+l}Px)H723lwQ9p+-f!kL}-4l z9fm))&Bp<{hJ_2c|M^>2v{&EnO$0gIGY>${@dwvt);JTIRK%$P)4%-jn~PkSwa*XgQ5jjoxNj6S7E5fsk&1B(wiyyL zf6t!(@l~tHCrGjAo z9lPF9^y*|}&}x~_py>iM>i$(rg>;;bLj4IlQR`=lFM)FzpXOLvYRB7O{rt-BR<0GM z(l^p^(kOuNpBjy}$d;2i6Mpw770;;M4@1?}ExPM;U&)=T{`JNdz4=L*TlGFWV94z) z0J^Y{Nw*}$;Ym(4I>!Vwc&MVy$y#QwkG&9>(H0H2F0%I)w+K!`2CnWV#~ejv&hx;g{<#@mf{oI4yVsULDr14emU7H4$`}Uy}n(= z{M)R?87;n%P&U!=+LvT((v`Pkbh32}WDQqou4qi@9iG8{d3!=|fl6~_X^e`oV)qZM zF`6?~-z;GE6+F*Q|L-ZvjUk$@{Fp?z%PgR^A-)jLMLC{>lAn8sjs6ZMn$+IxYjQSV^K0lw4I?!(iwa$F^-3pwf&KF3goI@+bBx|E{KP za+HpCy*d`SvG6c9Zg+bV4Gu9Epx(TAxHtQEhlml;xg@ri;|==M`*xGFt#lOO%Ej?{ z`-ywK?f{u{zcNP6zr+{%FuieEww6lBj*F>(LI*jgQSpZnJF8ytrPdBv_cOZ!Cx@ko z_Jey>hofrgGj___&Bb*Pujrx$}w;*bj zh`jlc;zu4^4H`S@Vwy>7{!QcN^)a~CIa*c4lC^n$zHIV6QOW#NHkFAd%4#=8aYKa@ zPZ?{-NydFeP(}t>9_;;o2=F~oq|_j8=U{C+S-N?9KFpvjjT7^Y-{0O}U!3B+;n%(T zlUHc8-I}d@Q(P`53`^f#iL^W0vmMgZs@8WQ^`8FgA;UvnCxCuM)AxaQlIqe$Dmf2< z91e$s5z_v`KXU71^TI;K?l`v~JS+t@rI<3ibUiR`dk2F`B;0(c#gOdwsUPwd!w>GK1?Gz~SfG zlTd%=Nf<8kSK_C0MbSt~HL3;ANqMS~>Pqql%k|1gC!0CIh5-76O`RGw49=gv)CreS zI4=l8Xg9bNzr6~z?lsA@(oWHT9e_*MdtG4U%EF>$f}$K(hDV{JYGpQuzi1u@$=OqT zGg>xN38mSiP>IBw&)5{|NG)?EESi?jq3E^mU_?W~CxBxz2z66j=I>p`)>s4I4JNq) zk`|#UBM6)%sEF&O*$3jE;(Wk#aAugU`ZYqpy0oIs6P<<$N(BtypiH1paF=W)DiM!z zZLqGH#YPv8^rz46!LF_nsPPp)WXhvyE=&04qbqJt!S>@1oKXXlx69 zr4-AFi+_muc#6Dr;Gh&Zd0X~=#XZ~0{O`yOLOrwau25HY$5Lkx+FRPgV+xCgXIIUx zb@qs{SZWEI)I$sGzpWbyrHip~`(e@h#p(A-tH3|5E7^mZ%ZBh{ov}bwYTpI3=$QB) zBpS8O<393+O{hPC-^{^B5N7Fl>LYV=?_LZP`4gJb|89bf(jd8L0en(uD}j|sJkV}^ zSsO8<*d|6WH7X^((8g|r$XZ>+S>0Xs1C83cco0{%Io&X3N>ik;@#EZAZis@5#NQC` 
z`2z%b*sGLM2P>WmZGO|2_r4VxO@cFdhH>CVr`z@d@|s8?i(z4eW#;1{QeSp~+6}7c z{hXeSzS%#ZOxxt-*k~;IX^`WU*Jzs|;J0@*HFis6`O4n#xg7b+TSlB)9IwODCN>SuW{kh2z%*{C7b2u@&5$AK~xr+ zU4Q4K2ml0VIhYhg>%;%fZ~3B00lM9w6FOfzC#LduicN80!jB96rES*tZciR{S;t3@ z`q5m1nN6F|I9^|smWxw;7&6LpN&QmN5uPgb((d%CP6y$JS`X5`72wymn%@uQ^YaP= za9#lUAm!M?b(rTbde-{J%$g~4YjZyQ!P?r!zd!#%v<=?uh#Bt9yHgCepCm{vaHysS zpa!|_Os@1&ES_>kJfHlI7Dn<@UyCGLn--@1D``LITOk@4#Hwous9^)*oWDw#7FGsK zUG$5=CNL?NKN0c9jf77rxc7B8%>Gcqfc+miH8jd81V>CsWdLNsiOt;nnFwE$vZuz= z^H;xGRaORes>ko|Y(|nnM|ujoXNkW_1!@(y=rFNP^(@$Y&Z`f$nGUkaNWo7gh!5qk z2y=xYIoOapx$eeaetFIcz-VTTu~n{gX_rL8VhkXo>QPXwww3ED@q6k+(f%dJRy?Mr zYH8Mw8wf^R#sy&-@4X5BM@3DIU`OnIz8huMu0AUAftVC3*dX}4^3w$JC3~`^b+EojJ}c;ljvQ$!u&2Zc z{)GF6^ubcVFD-CRI}?3rKg2UIg5R6T;X?AJLb;OHqGfMJx{Z;8qSU*Q2CpMPUzqXn z?R#AkqO)4OFta-!?Sq5kzKYq^>v4rhFN8{uxiIg1&rc$E)VsUIJrI+y&z!TaCR5tp zl@tk9MVH!ihT~6uJI0G`S|YC2cm!QOf^X_F5a|RhYR*9gK1uE8{fggt_>0&&b*_NM zi3z8R$rYxYu$Mht;Lu;4cauH#-MkK#m^NZn>1c!4^?Bw{qEQyFEdfP~)O%j#6`>yW zfsx<0JKK4^FEaj;#=80(!?NEVyZiU=hvcEzNs&o%LH$Yz%mu$p`5Na|*U7PAzX=3> zAM>_`i}pgiBVM|&HzTj!e{K-_b@n=;DLU(f;L&&N7@I$&iTwGCHV$eiH%g={4*H^Q zcVxhrJ_#68=j31w^}Cm#2oaqsSXC!-t*i9iImKkLE1r2!z*j1seH8zScZf$k(dniz zxoC`5P$x3o8P)zcOO17BI<)TOkFyqlO){%)v4Bmx-?bVyrS+lhH_OqL>F(;~l<)TT zM2^Bq&axhU@h8UwrC4YFi(|lt+1ScSn5D0NlfJtf={iWI?X*z;-tZV~-`@G#GQZz? 
zcDMQcZYSuuUyK3o!Rf=<(*h=WwJ%;!=w45iUp&p^J6&(y@#*6ioP~B!Qic0bddv-4 zrYew6qGIHk(j17BjDQ$IWGhFPh!ZGsHD;zWPYfYy{=ORx+cP(Q<;Q|`%p~m85nT8BYJrbI4G0^C`f|a-) z6x~5s$BIPTouFQgZmB(P%BTK`F%eHAVaP86s0;4TELrq{C3cZ)IUwx93y*$~DSUXZaq zuLdK;>np`iWG{tGU%5EB%b4-D1>5tym2q>FXE*W?1qFw>$k@yFA!6!}mZA&GI9la# z#e_=<&VBhI$D}!7nc=)3^4VQ#?Toe!#uc0^2pGg9sQ3isuty9ovYf4VT`1MRFf)cvWMT zvE4a7hGYO#02 z*;G}B2=hqObZgk9?x}WZo`u``p?2hVV38E53=BCmMd3WM+L8P#_1$&?4>Xi3eBYDY;Wxbo~{o?{DGYO z1+o!C5r^ZoePp}i{c)gKaY5pe+7P}L0Qfu^TwJ}$`V5Z$)uaGB%UIX=rN(3B!++f% z?sox#due+$mn)#~jQXsAvl4&v->kOc9oPLaR(<5P%k}9Dpa;TCZvwoai^1)|u_AX) z5=7KMl9s?(Cfc>?k3lur$gkJConwerc3r$dfh7=?Y~|$ z{%l-w|83zz1;@+k1>+~p)hh2zTh)NIGn6^9u>nm4z0{CeUHFn6&c=j3IoQ+i9QO|4 zR%(176a*>qRkrm!Bxer^Y#+^x%y@B2o~LB({;Hh1ZIF=`BbM&)hB`Ff5+WUO<{M*D zJ|hDw!xXcFp%H|`8~(w=2JRFXp!d4x$i9;5b4Gx{?GJ5y`>+{}%~mp;l?^-Ec;bGz zHQ!eozMHW0+nT;b|C}4P4LrJnLUUc0xYj zMn=Wia*j@3?FO@pyA*@#V?pZL3S9`l5fI0)*`NYnapsc>heS8cdXJoPC!mRQN$6Yd z`UOEI&Qh)@i7@h~@6=Ql1KD&j9piZzU^R$p zBoZTl;=NjdzLnx@9tZHRR_!^dsI%8wCGOOVn}10WxVIn|d!-ndB?1*6Fy;4+P4srz ztifRompD8wtu*G6EPtRxIY#%6;a^7~=F{1T%><8ImCv%$)U4zw_wPoJx6)yuzDi23 zI%1-p)Jiw364x3k6)s&Y7FaQvd>80RDGv63$M$%leJ$bWTc)i)7(PF6`Mm zP^ZSkc%JxN6k*IXAKC-%r`3D3E2VrE6GZoN^H%n12I?vJmbNDTrz^;03f|7x7AZ}V zCAMCo=UrG5^ML70Xxl^^e21vwRjOkeR$EShNjQbea-bZ-+M8u1FYQE4fNARO(_ zQm3tJN1!iOzfBF|S8>_YdU=?*><)rA7-E*vsSRxxGzIxxgT%x2zOY$LHmW`OcsZ(Z zyyjgz*Vx5-vBX&m6ma-LnfU@RNNkmk>b0xUAXa7x2j;nm-DeTHAek64)8E%NjbI5N zy1v-s$=e|xwVl>%Me3s;vBH_+p-%Q{u(2)^I4phwZMk$_RXwuOpPb)bW<%R6!^yA5 z^Nx)|N@DIoEsNVfnA4nZ0u;jq!-?Wumz05--Ggn5z1hu?w1;yg^5$oA3t#RoAe9Yt z+M6c_J?&~1J;Geiz3YJ_fV(vl;8%Py*ihT&KnkDYroL|-iB#~VZmo*@mYI9ATS_w_ zqI_(A$a1%Tsd;G?5fqY615lKl(lUNQ zgH@9xe(Gzx+R(sk%+LR&lzI#f^zWhNE!9aAsGI+8b;Edi!11z$Pr-?uqf8+qzmTjO z)Lj=FC;g=rF0S)&98rjPK&};?==Shwnsz7TVc(md{dctL!VmvI<9FJQUbxs?OS4yr zAkm7B_bfOeztBL;{&?r$b=?YZKTF)dV^Hysx6X4lq;YC05cPE6$Hd!tKg1lYv4J-~o}|MF zDX}0hZUyak38soAbq-@6MLc`{{4MMuDQVtgL=WPuKady<8sAq%sf;rryC#e|W~ z8I_}m6XA#*s)`@2g-&f*@;_W7uL~O*sg>^HYN&`5B8p>XYJ>y+@grjzM_Ol2gZzej 
z)1u$?oj~YAFVTR&tWHQ8eJ%Aru==Gub$Ru4w;URBnK)G8{l_9DJ<$dL#k%yDVjCs- zC9LN%w))|L?2ZBK>Ps#zQ|rP#wxoGrSyggj=ZZ}U%AU#7UJg{JsS8-J;`#Y8iS1%% zneX`A9S81h&1+Lv&RjO(fR&BorN_s|U(NUv3Tf0PtRA+2$>|z*FZ_ph;?T&B!;hhg z9f#zKksZH0L*MYhBayg8halzTY2bez3CfAtu}0p+TA@jKtUe9rmb4%~;2uQMvzy@r zBDyaC`Hxi1Pnu%x$hqqBcM0wTWih)3(i-VLU5hxhbH|p+UjG)@1Bs+42E=*{RM17b zCl4yW-k!(q=y5YjDR!2RHC_A8@H36^6Fv_yMCVip=$Ya{@rc3~rY=LlFsQ+-y+sq6 zk1us3s33t(-w!3&)MTF%;b7C6Lb#pm=9-{DHVh8_~GxK5h z2-Q03ibZ(vRjm;E!J2ji&FExb(5|dqeD^ znw{a-TTL|E9SSC&lWE=%#(OynK}$ABPnX*QvG2V!MV%g%Dh+bAX2d$Jueo#}T&YCd z^vOm(9l`Vlm$F1Oncf3)Fg_@4cvrdYr#|-!qy4>j{V>l7#M!XhG;ZpV-G{OY0F+*b z0hIA8n1^Pl1{_;t|J;IkcS68^qM96CD1(s^L&a@`VI>XqgPI5 zah=XcpB$;2?5Sj#=0@|gEw~WnL6@9TxQi!rz!G;pe;ivADNl37R;|i8e5ye;lB{vW zEQ_>z>49qh4i5sUwr)$%Z zWb$e#<+eRs>@qW>%v{QMrZ?MT2(6E9G#7ERx{2>|fkE_g#CGN((9^ukM5szDfCe ztNtTUPnIvVoa`@Ket0x_a^!h>bhIa=@DVA`!mw)ol~FL=V*=-FS-TMRU)tZ|CV{oq z$Hc7gD%;^6Zv-Pq^bFi@3CmHomck~P=!PV%l092m3WnU}dN#Z;;F=C|hC2D1E7Hb$v@ zYg+mO^~{swo837Y`Y!f04B&0h-~Uonqoo!G)yp!b4(qYP%Hg^S_k~hx_Vxm_-hqFQ zZNaiVwh?&>GR(zd(F9QAuBrPVGi!J-J>-57XA}tM&nJ>H>*_IejtGo^K?xbAx{M$W z)!zmW+Rt{nhSgEee0lYzghjuN(tjzSY-;$0-);2ac2BBZO<(qWA9YvHj%?tm8d+Rc zJHgLAR%yL%i*J(F1LT1IWO=hUgpYUiA`iofXla*wh@7gQLhrka`@5q%UC&u}VMnd| znlmk4jIG&lGUiD9N=s)+k^<2z@Wd~?*pDl#XYAc@PqHla`VD0h@myUJEQJTo_eRF2 zox`VaRT^as90clu{fF-c*5gEro2>uUWNabrx{sFDxb3Y#>8)*_I<+!MN_q%Rm%C&T!moIG*=&=1qbEMDNj3EM0J(M>nPfb2>~}!w?+^Q9!4eu8IzgjQB98m)Ru2bz zXAzn8GA8S5s&F0y0+YbQ>qe3wN6QK@jdBU&nI%Oj>n{3`eQSwxR5*U%k9|@z`ra#c5Zx@9Z2&VuQyn{XOM%$v4^_Jj>rpZCx zo&B8@NKS5UdMrO{D}NU0E4IyrW3(l-GeIY%4*xR?kIVAf?{;ndWcFw5JgiuczOy;Y zv+KA2QYHK(&=apB+|zrFibi@O+W^=K+M-#8Ai*5ohj6B8|GK=5@)xR4`5&)LnCoHnc}Q|w}>Rtm%CS)PCS7W zz4_rm2;HwS+?#Uo3Z;10gR7Lr6@~G%&_yE2DDtoxsKH78s*5=6F2_G?whgn3ujvy` zoq<2OQVQPJCBp1}P_f?>KDOKTtp-$8x?4}?ar8TcN9;S~@EIUw&}?K}VZ1lMtWx0P zTeY|?E!?^q6r!RMcJ|i?%E=LZJ>qDerqLOIO}Qtj7ewFM zs+c~`o)w&KIrNt_-wnv&1H{E{;K!zk9f*Q0M3kJ!Vnz~EMaGDjud(ZghUQR<@s0iG zDFJ_A+)@v{paC0$o#;Qx;Rl;T(u<1!COjkdH-)nTns=Qk9uu_~4VjAw_0|d%}GFv 
zyG@7V$+~`2Sgp%s$RC`I-1h0_>A_24bs4oDyJ8Lo8Q-&@MlLa!d)B%+Q<0gjJ4$?ib~v3*$#N zz4HJD?MO}!*+=a!M6}6pTVzX9A|=e`c4R??nPHD?DR%l~XC&g=lM@8DKs@Mr5g+Is zI~U)ON~sr+ffLU$*?apMjY-*-e^YI#nd1~)QfB&yM5di?}I}+fz(~U^; zLU)UF%jTV}1HlkZ93q;3TOp{Q764nBK&io#NYvfXf@kM}mirrRNQK5Nax+DfgCFxz zf6ZQBFo!Xe90-s>{b&~Co}%y;n_45I1iD{8y)=?m7rPwPDQgOr&>XZ{$W73=WHjr? zP3I6qRZ%k9yr%2Sz}JO-UzE^~yskm=_%tQ%VtU%c7qMT#7lE&_;|Wb@UXh;id_ZfG z3AvU8?{D8!-d$Ja{qO!4!`O7~SOvb%_F9@RR$>hZF$#6L8BI8gocG3}1?oA8zBeD! zeochiE%D4Lm>J#?=T6oTFsBYo+8{CvkgO+`r*zL0lTR*G6i%W@Qo=TB$+)DWJNs?cRrr1Ig$*Mzk4;4G!6je2x!zaUU7@k#)T zeXRh46=IiKMbotz(jJG%Kjap9oy^w%y1%Zf2de3ZtRYhATMHg=pkMf{nj9LGkyevU z#bFbIUpP#T|1EZjmq-uFdHr$Rn&&9Q3Rod&OjpI2a(E+jlOxyWVq?7v%9F%;(hT|5 z7e~x~m=!KqV6Gb~oH-e!{GnV`SyrPA?%9Fb>=?shtub(b-W+bv0)3YOdkN&KGg?|>AdPW3^YCTUGN8db- zryCmjqiR3d22@fxmqDDyffu}ZTQ82N&O+IvA0e4h ziD|w9bG5Zaw6J?`3&lIZddFPKn@wqrb=d}mHj{5csw zmWbzr&A3I3#}~L_N0EH+y!Y1ET{xK&dZpmkWxN6fCU9jLXwR@l3aA)04J_kRdJ;%4 zGnvX2cr+5REC0RVY8UC&*Q7LIR9c$%NaN&H*wBd5$EMCSQ+=92s<{5shL}|afwM3@ z!2nNpRt;HZGzPkdfZoeh6yO#6I(!mMty;HpgTRbF5sBZL3-En?^F4iAl|P=FEpT>a z-euS1hHC}BS?cWXOrCoYf7$ez8Yjrl;W!W_%06*s&X6)$ zz2~#(ZtsGP)%1=BU17*k=#;qAjp&5V%ChNjw5GPCR5nOPpAonO7GW=l`d)k~NdG-b z3V9(_Cq5@dWDZKFY*J{`$Me7p*Y0Q!-*UW1cPMxraz;PU0j9P-abOz{lVyd@MGgu% zf?hf1RA_KiXghINJA58C8aWJ1Re|tM&$pJXU^D0Ue8|}d1K+%Y$6*g);$nLsM-GSn z>+*kUG{2PglG4{NXlsL|p`EJ*dK#Y`c2s)`&GajJOlAC`o*UZw1cRMGx%RIVM zA(inui+XKMaXDHVPYp%_yYb)xp1GOLe6kM#i(hX(T-#pE-kyJ*5E>c;0KN(q+?4W4 zV0fJHVhl%>yY5F|xOYZ$l%y#>?_eX(-rEtWKN00*&*{<`EdWm2tIu^ut>UC2AEPLG z6xz9;G=Dw^?Wo(?MZcxu!P?c9(Su7<*j-)GU|3_$-Pso=QT5@Y9cNUm5t%G7Zr)u$S8UL5p&BN z<1e!inYd7C1BWH0J=po7<*@EO=hQEo-FM~lABzq8@5OJIZOD1ZW z>&IV@?-atvvh&QShV`ikn)J!R^fwGmndPH1f#QKUaM0&2BOM>YBzLW>g?Gdc={X?HpWXrgF3UR8 zuBJTB1_rG7ku;E~i2jK0U{Co4Xzgx&+(qv>=v0#;8zhL&|IBMGMun#=q-$WN5)qL^gzLvw45nNz7JC7qN>4oPR3hm6 ztA~NW2gipeD;fZg>3Iun$7En?qY5p>R^1Sb6=!g$}7muU=UaOIdew9xSO|$&PH=?ljZ6{BgD=9A-yQ_s_)Q<@O3>dEHnh<{^)MaW}m`~rR0s_h!DO589} zelpih^GmB1`kJWlldxKU=fvdF;p)%1xpH!rj@566lg>VzQ|;GRo_v;QfXx@txRiLM 
z$E{dUg46q{jscN2n6C3wNN8ck0a*Tor_b&@T4l0FS@A~?8)K;GbARnZBldw!Okc~% zn%&8+-SNWm@iLXXS|6(5Y4@Yv>(iAR>}|HOzi)ljkq-NlZ9}<&oc0eB}GIZE!0;jS{V5Sod$fG8kv`oqEEkaR~zPq1-}%POd1s{c!clC6j3 zS6X|&cqba!-`c-NEEFpI0^rgvbLzQdO=9G?Ns6MdPwzjpH;ejEn*+KUNc?ZAt$5n5i@~?>ljT%_5At#{{FM#7BjA`1cQvmHh+h+D ze-P{PLxERBghOUvb`%6miq%4wkRh~}-uptfgC_woiwq-C2Os9!-JUy?FB3e&52a5x zX?7=erz58o2MJ!EUfKj8_sA*AO|`0CR@u7ueP41$581ykj_ZN`e#H~>Wimg8o&C;d zmtt&Y^SDQ{hN_yZcuKJ9Bh9CxffVGei6q2B?ws!q1#B-a#{}7#-hn=*5rwEo$muB!czNNj@HJf??;>-Z9q&P|0p|jneZeBG{2Sh z#Mhr=Rk0f%0+#8g9YxAv`y;qog9gDB);D_R_jt4C>zA5hUbCpAEt$QVGml&O`2FU^bE?VNsLh+vByqXphsE)Ut)(un0D*3kCQcMEks!%A) zwazb9wI!F|V|bp6JagoeQh2c&|0tcL+AAu>{IzmV&?hBI62@IaB)c#ea56e_0}!7A z4UW``#qD6^xDR5Gqd&tGVsMWES2OM}_eF`f#=czgRgDFTKp_Djb_b=Rp-47E$?^gp zPYQRAWVg0dqQ}Bv^ZMbSRN`o*?d_Kew*l;6c9HcTVZ)00Y>PmesO|)A_sE$engM8% zq<>q(OY&i`v$DGu{KqppiT#+5@Yjm&Ziy2FW_zfEV5x+IBL@Ut3TaP%-A1?@H>DKx z;%t@JBh5Xq1niQNu|0!d@2q5nu$}Tzh4AT`MfhaHlRYw-96W+{TkHb@sJ5%HhI|XvtDGX5;x}yYrucfs8*q?5 zP-<1y2@()ujmdShyAqIU|ehg-KxzP{06zy5N*i5Px7`tMuE{_6G!{Aq!ZVMRqBE~x7AVzB6UP806C z3`=O=voKd;044GP2KzWxz*OW~${(wck$T!#RjRuE+>Lan?kfnd?lrb%n!xYe)@lJZ zIp9Z1KgRL{7UM}lKKp`3Iz0*iJBDBgE10*wleNfx_Ui%TO=#8q5Cy*AgRa17S|#4+ zEr5wAp#iPHdysN(vb>1n1%@Reo)og4=<1?bTGFAV`@EdH-ygeRwK8ayMo(0R@OXjo>d)(AL&EJ%-v|zGNT{;PCvax{u-gHv1{=26>?Lht03dbs*Ss zb%T>W$cC!6WhI-Fr#!lvGRuEEA?im)3y`;5w0^6Nm&@;>+)5@64vQcguY-P9>r|oU zw4*0@f}ng+PJ$50FH@&|Kyqh)`BW|4`7h8}-hsX1>(HK{23zfIh0OTc%^&#?+7!8& z>+@-Dz21pL4~FvJG4Ui3&U<4nNF<}ZaM7>UyWUSizXc~qx}mdcBUX-)oF%E(Qe``L z20DOR1YM8*J%B_qc-ir5m-On3o~K@9;2l zcKJAVOad02r?bK;(#Sst%{%CIGH;jt`!H!#DZS|Uucr|m=_a3-LU=1#Etq(Kn&$N4 z5{U(Yo0uqF+UC|s66w6WprG%!QFQ^Q%%{JZ8m&DKo3kfKgVxWvCGUL1i;F@7Q1USg zpBQS$Y*J(k75whV$fl)uZ^UM8j|b1&VMotyZiQ5MnS|s#qnfSl^vTh3&;MWap47u; zBQp-Bm7f~bq+4Fee~M-9h;c`~(U#W`{jSsX_D^z>x3&%<>8W@p!)w=Mc-i;Ff;Pp- zyyz(KqHL!hxEt~?^3!uFbyucXAxh)SFMirQZb`^EO6jq=7B8e{bJOccIW<)a{JkRM z4!4H(YoEYjTUx_yXE)5PiC0e&FAj5F{Dje9QnfS-eE7H5NwAw#=jIt_4Zk(Oeectx zadDdMFhk@YOG!*t4a|uTNd)N0S}$@Vo8Yl3m`~95(74 
z1?jR6T&}@B8}`>__3f^jkv(}c8QMMo3&CcQ4>0Rmju#w^acb&9do`%#=*TD#*Uk+? z+kxSy$%U`|MK1QL*)^YJN9;?V&djdc)f7>i!oo0(wpDWHQ=(!ej}|Vp94~CbS#?C@ zY-$eA*b_Q#w(5*Aq*;NOMFUpLNhmA;I?-=yqIIJKDFu@T1Lh_2>pvxiK)TDjJySx;0;E4n6P* zzSj~ON`GnBlA2`-(e1zytjoX^v$D8+OO9c&g-c$aZQRv`IH4&8Z4AlUg5O@I%kh6g ztaEqXQgma3vKQ;xPK4C-)j_6B@+4bS?uVTyhBq}wdi_xD4E#^%fio9>^C~g_3shmj zNr*4S+f&}*OV^|XG`-hUeiieFMx|p(x|$APzKUSpr zb>24M5gycje-Qo|JlniJPR(5Jd>-j+wKid@IY~PXAi!k;SBO>a9Is79WzI{Jue#hF zAiagc9{94{`TNzw;9wl=WcX0?h1>5RE zgae2B_I5g6(x^jwlf@kxr|oBXiK%bJdDGt$-{cpD0p`6%5!GP>9qIVZ(hgRv+tcbb_C7pZM* z@?-RRlRP`?$M{!oMPCK0i$7CIc2NCCTn!_Sk3SeZ9lk%r9?D^<&Q~KeJxX#%xmWipJdI4DpwRp z9$~%onfO`lQow7Noou?>p)s+VuB1V>gV}H%9UQk zN<>58owB^!oA9A^*pT;+nu#CRKou=TPHcsZrGaHp(I5pWX+Q~3dC z9=)@wTvEJkX-s7xpbVq=IPF7>sDc)Y1;^XRxy8uqS*;nyvF&Nys+=}YG!kcE!aXxk z`x0~W$#)>QKrycQ7AB)~K%6BoRlpRoNDm??lc>T-nI zSzgC!f(0;;%!}BjC`pTkIPLOIOts5I??n?6P0>6njq9x2hB&D{a^HB6Ut;hxzKU5| zf+xvG&y7J!@HRi+==ZRB=n{onBD&shmb$t-Kkth|`k^6jjJZe$Y@dXTG=SgHkQ|>+ z;LH+JGIPz-33rb~nAKLnwp9AWAn~m4gGc;UBmr3#&f{m1h@5Qt#&F1k1n?G_jJ(yw zkPFaHq}$1^dQ zNXAi|O02m=?|e@DQr}STx(?Fd`2OnqsJ@f_e^TDu(AcTVv9P9WQ|lDT!l~5Y>HM3I z#AQ_1d0hp}ASrMjw}P}dZAV?qbS@oMWGzh$j9*gYznCb(We>G))t)_4Iqf;!PvEly z!aGtL4h`=-Flb=SwK*dpYH*0QQ3>0xqv&SEOjR>YyYR$#Yq~tVgQtiu(j3k^{SXjW!#aL3g!nXcXXxOIU7P`2>(E33up9fTzv% zcp?0*70h)G9uxTE-gfr<(6AnFg5ab#`*kgTg?E>EGc11NLYQX_EBDWa$h>k}dfXu! 
zw_&jMS(DWR)8Zb%SW#eD#`2m-3Ol?c89#Bf3J7Cvm3$I-%%mr0;=RVZX)3O-O?p=< zSjR8stFHfZTXmiZAf_YYdg%AwnM5c4cEM*^lzo@4(s$3TGs3B{>{bG*;xEoD2<*U49sG(``S&;Xs zIaB?!@-#kE1Dks@Z#iE{%+NRKGju{w4x-y3*-@=f7p|y|fE8`j9xO))GqpVoUnz#NoD%wJmlN zHcD|?%OtXPB=qmn zz^F+O*g>B+*5KplxJuYjk8~~DNxt35!s?y_@hu8T+@qF#J6&^7x+ZhA)dz`33Gc(6 zS&T7PjH3x_YeL;tNtP}gJFZN`=UOOj$|LQD59VH8@}0N;dz#Alkyd^s?=_RgmE4$} zmEouuzLB(2z-rQMnqMNpuvDDoNv@PKi8U5DU9c-9DlmnhR+9BA6^A-xI-`oF1Fa`Wi=0w*!TsH)?`u6L&T4ck)t8Qo))XY@ooA` zTv=cfwDx`~?UJ6vf!h+iTc zfT<5SDGLezXik9AIBSCoJ@LqO3*A=&1AaE=MeoF+?UFbcY;A2rP-|02??4tabZSoz zn1SzM(Ai|Q# zY}J)^QvkHSHa0HqVs4tIfSx#iKKnceh{AO5_1@{a$`R%CfEE#WGrRZOo{yDh?IJ#5 zb5p+MNcq9#p5R-D731R;Zv6?6(ke^*6{s#~G;3B$3?qs*6 zfLrqEU+sVK#UmNrf`vs!iK0qHLWY%iY&F@sX8iN=4Rws$B9%%%*ll{UNZ;St`L8!& znGXDIi#_yU@;~~){Pv>owC$IIvKoSUYjnd}&6kPEN>@&YqT;l>-$?b?%XtE4-B})u zl=Eu2ayOu)KVh)uX9qQul^_u^+q9NY8o&q~IJNq_TwxTUG_CB;L-qGE6?MpSS%?C7 zv0v`i5Tc=4d>r35sjqYRFV9P0uBf zf6*>oWS(iVHNN}-N%aObC?>WDqIcDc#d(K> zgBz|H?+K{ucW8?+_;Lw2Cbqv;U*&PX>YA!+)dMIphR>d7!kYFX?%5Bg#6LQbzlq3)795G`@T(6>K)Gq> zKIENiAnlR!>*5{MlZj;in|M89C~4l5?s<~Wo)X;;*HZPBn1wD~b;;x7Blam7z)R8C z3H-$E#acZqcJ~Aq-t@#a!5cC{&&TSHs{}@V)X*uy!aOO_jWV^p_B^w+5j9 zicbHHw;WhbN6@ktx3{)-hXzO%oCP)_#n-;;*O?&wr!lp}p0u-kl7`|ekrRH?C`y#v z(?MS)HV#3y3VtbpNI%DRK{MWu*&f(|Sq_H9zVX(rlVh_N4&)0Ph0L{ww;tp!GM8}m z$r=vv4W$QJ)k@vh1&;uAHv#tC3VLXxc9w??O8&FIO_FOb=VX@ia;3(gCXnHI$biD` zO@T@>+FdIL3@Vh^T*g9jT+~QSDv1K;uW`$l950L$)mVP! 
z#(_Wu>8<*vg}e^~$*90q@EdC+{<3wBuuwFJWp9?#X=@@KtfT6AI-92B$f@AQ+F4rVXo5WJY9#L?QS%?TY%p{SY*B&2UaB+7xw8O|mw z*q5S#A3R-Y$&F7`I3pwKKPMyu5!P6)Rk+Wh++dyKJ>6H|?6&P;i$mMs!m6kZZx%hL zPetRFy$|-rRgU&%Hr^7d$-CRx)BeN-*|*bs(sut=f4MiNxFO=+2d(J(+X?n=Mb4zp z$AS)AE`Bay2^P$wks$VICTXpKGQ#cfuHfm3zP<|CSL+e`1BX2wN*kd;1wHHeHH-5` z{_^VvYksT$ z)@lNtu~P;@2ZOE7%af_`stqJ-09P2Y-p|5dbF(R5LC;=OzGy3hIfPuDxlPWt&h`e6 z`@dc6a1g@zN0BN-&LntrM@4r|-QwVroVuXMY!95K*|^&t=frA2n=FGUqfQ{kB( zT1l{(95^rfR&1Q>$-(mK^l?SRDNXpK4~?YaoNo4XY)}Ypg|drJIqYnK8iQYWu+5Kn z-d?}!Zh6tnmp*f$WcnESavqA9)b#y z%g!xL?=MG}s8Jh84Q~0Ze|LQb%tFIYu8nN0(SbU}X2`vW5c*~xRfX4z&uOi-&wrc} zubHrv0N1~BJ^{Z##VM%vrgm&d-T4=Q4YAMjD`8C@pqQAYATf&r2 z8*u@>d~S#WK$LtN zT;g#U;^sfn%nufMH4;0=o0rg5$&{j zE7ba2k=J}lj)l2rJ0p|-ak!<4hX*5-3+;ft1wB9^JD?dLrUjSMhJv+k3qX3vP2b)Q z)h(IOElYSIkqRru+1r484jlj}X-^CToy4Z+b{UxZR={mv0 zGDhtqtGp0K$+hlm?DsqN_5IUoKvD=CA~Px{vnq2zmrl04nu!7?x2S;RP%Rj;7`sn7 zEXHrK$>};i>{rtvpGOE(B_zS)vrVV+VzNLWHzLMfD~3=Z|z*UYEMR zlH?oVHf*q~lV_2&naq#mWcHcRJ7>X)XbHgp2Wg^H{9;(N7$$ zza`K!1-zH<{A1>4)fpHC5#2$B!a^_}Jo4Bo;evBNv$cqQb~=RN=AsGm!M4SW%IQAg z^r&arX3#F$(>szjGK*kUe{gfEoqBM9Bd!v?&)*nyg_~%nv(ym))IA)k3pF+T*YC_% z>EEC0EeLs-ey5c`{mJ8u$pcb#zV!=9@$R)Tog`-MmBH6qydtr%S2?lq2$t_IUX{B( z$nnQ3t{YV#(M}!s!}RlYcXy0Kt_K8MzZU52Bil?-*8CQ?&zoj~&3$nG%y!BHVsJ+X zyi2>~bavXe6VbcdBulC7tD30Ed$N$Y>z%iuRxR;&(%o+3jyRonQ}~4)^yqFg=5*&i zV{>(%&;3m2s$rCwF2wbB<6w`%hDpC+OkgJ-`DXuf!9oN*^>lCgbR^<*b(s*j&Nrge zX+Jx&y#ER>o%396ok6y<1UM3u{x56vCwqH)+qWuzmkN?G5q~Y1s!`kZ zgX;frxBK2z8WT}r1)m>sp*w7-&wrW74AGTj@bYBK4-9PSdtfftRpLGXFXZjfSG;;X zwvTSA>yR>7L$s5wb-539`zSb~&AuupAYkHV@Qyzn7fxtq3{utY03q)AwU<_|6n3{! 
zYVm!xS%UF!-kKNO*QzB<41Tyg0MZ;=slckY<=E~dVTi0!_G#YfQqsAXK*#4G00TVa zDH&qvF5WY<9iat$CdTwgMb`OFCo=dONo%Q^RNJ^Tm*yMLuHiW+?E zOU}-;JlFk$lPS>tY%r)dGf=Z&qIb(P~(JKJu%qko5id@Z6t zeBz<$^x&CZ+k=}LTo-B03Hu(rkq74DO_^zq(qsAY{pUFje_>4$8S7s9$L?C-Y;#SG zMi|-Kl2>|r`#Znh!hnJg5B_nq(08RFE87)CfHdh{p40E_syXk(>!MsSAKu85_24fs zZZ1updUe>lyYB|Doj%Gfx5xd#-P`og?B-mnbsH={BY$HFA&`>03CvKAJEF{gQpfRt z`y+IF?f%3_v+V?~7%v!0IcSCfY-5f({Ewew)nD?|M=J*cR@nR_PCNL*iE1C(a2A`Lv_@KAphZ3HEK-Y zZ(8^Af24*_LuOn@exZPlSRyJa&i7JJaG{ToBGgsd|6#G@e1~jBhNdHjNKb|j>=|Wc zcPpfsc&jfrt~{7mME#AwO)WW-bQ|(#E?7fKat1R`Lax?)S7;R^^7H-V>xMmLHFgo9 z{!hR+pyw%PTa@}{r_L!oEuE^hca)uUPyJcMtJEA3PNU%07oK6sdU?i4`po|wcEoJ` zr=2VK|Vl$Fi!{Zip>{rC3Dx{RUhf$%>Jk>^pd-Kkb*{ z;Xi1Esk&mj-8xl4+H?0*Go0?%NOK?ZJE2T%lVtu#i$L{WD73Jefn!Af64>2D+cGzSn17OEN&p2GY zy+X>9c~pS7=)WPF7WVfzkq=*th-M zDU6GrCT={}ueB5f@Ybcn5A!2th9hVdDkp1vr*1ZQu!byK_N@R>fQals>iV*dN3|s~ zBXdSzQTAi+@cGT5lp#;#wH20IV)L+0!ZOrw+($&*tDC@NRLJtdWAh;%aFk zi<8!YYlg2QQyxBdfBSd{Njbz;tJ;#vD_Op->V1@Z6?0P(;VsZo#CA0Us>JP9xJa6) z*uL%nN=GC|Z3LVMJc#|=Sx!0^bx}}vRJASLxtKF}Vn;numC{;N*i7F#kbL)0eHEWv z(QE_NcLJi8nlb5-YiP0(pK>y|>(Rx#QUe))VpF3`ZVqmwacS&_tih1c`Xc?2UJLQ9 z9#&$~`kvkNBe_Ize*3MOxnlc?K3ik*ZSiebc}Bq#mZV}@d1WAR1d&o1LZGbu{V=CRp`vYtZQcYo-ZL3Z%ld1$AFzU)DR$MM4lCgnx-QvF~|2jzZLQQhhc$Pdp3;Q zC4Kcv_H!UhEQ(R)k-R2L_g@#Bcm`B`Me3?iPYYlLIBYrYi#YeGXkihL$E!3?LBzEf zpV%RTqp7mMZAa=%0_p{X!JlUzpbePqf)?$tt?ODy`mzrXzl z?{m)1<@I_#pAT7mAVs{O#kGO5s<#uTKRPctu)lIpzS~q;_J*ZJ4uMhq;?HS@p620# zA;hz6hiNnkz1x>BOAmMhInVsomtUL{>|Dyaba-^{P<0$=fH4u()5DhobRK5m#k`E= z>@raG$vP+_3t&3=Tsx*7BIk~j7#GGU;ZB-C| z%b6R?q>?^21vK)^CEm1~rZ)vRW2X%AhohY%?ppUo=}8O#-+wnKX#fVGhPR?dqQA7R z#2?rWMY2V2HrBJcPTCMKjB)0v>K06^Qv)6zGbSL=7Jjztkqr*N+KcZ785sYLxuAPu zVsCL;eR1b_jHH@EFt5H|P2o^0jUB)7t)|~!Q~m64r&)OOK=i>;np;=G!5m{f#9^+q zYae9HI;w z_V)nN%53Kw&33l7#R9bYkkt#!oh#?;o>5{GFb$Ody4EwN|NDeHd1)CHwHG+o(B<0Y z{^wV3)q(G&Fi?C+hnJ3Jy7i}vH72af2Xr8=uIxd8$9bwQNS&M*t z$z#Am19m3Y_yxbtGWn6!exlDCbg6nOYL9TxBv7|Nk^xAZz1YzLNxYba+>p)x*y8`f z7+hv&cd8p0(GZcAfxE1@Q8?q~Lr1jBd#@96f`vimw90d45hP 
zt)2UiBTEg&;coHyMD4(bH^D{mTSuLPTYt8BnfOwpmlSCO21{_&qoZNcBiQINoDKL3 zXA@vfA(zkfWG@n#iTJjarhGE-zoIg!S|O^D&i7mOBQW&st8D?!)8X@bPJ2#_jz&hu z+_A*$FO)h#wPtq$iaJP$be@Y9&SAA{hS{xCRGD4Hox12v7w5};#7g{YKuVX{i3Bfq z4yoXv4qqq@YRz9xlR$ohr<`?K>iR8=eI8CE{0wYq)4|%8-b;ULSUD5 z-_CwHl>=>W{mgOyNoM4HysG`0#&dhF&z@KDy3 zeKGK7ZiIFYvf#(g`h_MHYsI8Nwl~p|o_FPP{%jvzBs3>CAzy_C+$^Fsm0;uJ`O++X zCK`>WWGbnl&dQATz|J=RAE=t>vclfhO=V@}dJAI|kVba=kw&C&PPA6(Du>EXR##)} z=B&#sg}A%BYd@4ah~&;t26=L-4=ex9Nvsz{RSAZFCAdMtd;B%=$3{Qw`MkNfMH8tgvO`&Nv_rdL7`)$^^LClaK5MK+9TJ+ zH{S7nf_)x2_Fz)aRjDofoT4Lns>4Y13x(E^CoVwJF#NGWz7SMe9mG-sF!TByC$)$q zX!q`}w>}{{%J@ug_aK0?6_bIY>%Hl15}{WNVedX*;8HPBI@FL3lDC-P{U@h{CMd^< z#P)6M3+%FVW<|xTr;QgJuDuKo3Rm;ti-sTwOFsbuV1Qc&1cBMCzEhmn6jWWP%KX0l zscS#Jq_T6z)kzsSTT3c28R`mjMyUnM^vq#D(^vj}XH4gZlu$!Pw0Gw6z1uT-H~H8= z*Ec}{>`!9x<0A+afkMO0L*GvqI`HsN5{uGhDT9}Hdpn0qz7RvxlG8BN@2>5*Q(T@o zsUl|lJNMg80LL{M;~)gY;`!B~qn%mSc5u|Mxv}v5@3lZ!(NP7loZVXLHL0OkYp9KX z9!KoO&#ypb&y$QH9SlCSb_D6!edz%eX<0@b^AP)w{UQIKm(!$9yPvO5oQ?T7F)Ol- z#HsWNF(F?AbwR<|u={3D5Z6`tR<$foIxCQZScL;mFMM$E5`A=xZQy4{ehuPwi6>z{ zq@W4!uvJg?o4s?MQ8|kuP@)?i_r4COey*8{7Hc`CDeUnCJTcxjJ!T~{=K<9Q6mW|*xmRZKVz1%7t#44P911T16J+t z63bOY%uwW~U!`T+VH+&Bowa|DpC|3HF={AxSQo>UydQazk)ODJCufEI2%(e2_};{_ z^=QArf`y}<$Ion^K55UV7+d+1Cvg>5KCYZ_@32`b;fPu8s(-H~YODhHvCT!dG4@qf ze)hoT+zI}{SA_NTgN0V*pJu$a#+goSqP(B(qd(ClPDQwU%0{pabC+8|1U<90Gbc+j zMNFZ=X#cCTV&$Hma!H;9Vl)r8(D@L{5R4)~8f611h6d6s4L@-pDsKfVTCC=%taJx{ z(PfGkLVT#kLa;$@w8Wo?xXJpy5q%ZHw{Nt9FtOzU{(oSDr9W1>uVWz|vw`lejKI=a zXGR0qz|t6O*{zUFB8NL;R%ap@t9*OfDy9g*U=9_5?}1Eplb)_N==b%VD>4_w2kh;f zLyX{U)GPETpYVrD$P*-T%|$D7+-y}bb{Z3_Wnq@t?b?Q5%9aX@N-u3Y^8~**^_t8 zQXaPgc~GsOL_BY=fjmXnPFhM$8f_eT+iXM#qqAJ%+%VkqB~a6@bj{J&0vYLUN%%f@ zK16dBgqsC&-!ZLF_Qmn1Rg~!fEM-1FCwB8N{>C{w<38?A5e@ylMxK!C5(Su+u6Dci z&I_hb$UmRWDuycw4pzPT+*v!2wh+~R?@w>qTj>)C2Y>k~td8CLU8&iYF+u$Gs&pRa z>9t3^N~@>Qul?A*NvT@qxRL|z=hR2A33;L;D+bcmt$4czW2_xV1IH0Q<1e1a0vdDii(HkM9BJ z@on{Gc|))J7LoGrv@(&##$W@Vw@-m{+Ne$UqiAdZa3w7ACm~m2UnjgsulGmpNXW8x 
zmzD~I@gP1rU8$pJNDZMzn0jM?a;Z4{-0-@m&jqp&7O{ei=5s3 zm`s4Y!9Gwu{Iz}b>%|eju@F+|GUD1dnZMgnQTK}YZ5IOoseI#--{0_aGGFGz0XBPW zM{GLknwcS2VJNJVJP1?Mde|p-({zSjmt>ke`m2CSsWQ+u z_V%}tAFL}>Jtkuqw!Xo0N&1(U1+rB63d4XG(XYN70t_c#$Y6?DVz^7nEsh@)Hy~wU zN418?{IeUOO*om@*_t+K&Q2sz)$^KmFq7(aXA0Zw_nb&Ht!0mr_E#M{amN9pb)QG7 z*31@etYw9E|Cn%{SauID$_Ui>62fS z=x=84!oJ_pk-EM}y*&A%Y z*dymtJ#;KD17~EPjL!%x7nj{#O|~c3U%*mmnesfXo6J(VM5e#A@nXgWSJ1Mi)qwm#y`FBr6TiMqVM*eW7{3ZLJ~v4%Tzj6sUna z4KMZD@-#hPlQ$Y^uBQcNq2P(Mz#9Cs85)+89HI}+mWq=5Z;>=>o{RsS>c#ieIsCFO z8y^=Q3N4BqXdvoj+utjgj#%TtF(NOrn zZ0!48o&H|+Os~O;&Ygg>mGIDl%i-r%_$t05-Wx>`K{QHoilt$bQR2Yl-dnAsgZ=H< z-tT@A{9#4cWN_J-bnR-W_Jhb5E%`SS&VzRbXFfG9c z9Tm>g_4TRUC_G-?JD=5Maeq`CcPkOGYRO()5J?bKIsf!OSAV24 zKJ=gKBviKFC!Rtwo)x&_H*$w(uCr6O+oP;7xsa`!zW?{04%aG8=jn1mTlkAv3{Uk( zv6HnBikb&xD^PlqTdL^^uVdxeWE9pf;9}an;7k}-qA_U0;CAr8O}2Ucg#BNW*25h% z`yX>+7ImGvDnN~CQhnAaTFn;gAchF+kN*o;PLIy9!sGMd3Ps^+kwG;u@Q5>MgkYTb zI)J_s>Nq_$vcWmgJK6g;N_6$Rgq(oQtq@NOBWwUHHM(pwjVZymQj+EYTP;7i;_Vpt zB438>zDbqy+p~;ZDNX@_!c3&swI8`5VoYYQ=DcJAYkeUtNTLj2U2wUpe_Rc8whcn+ zu_Z=xgjzo5bVB09XKe?yKo zy6GpdJ*lltL$0_IOt1|4YFh8s`uc^lA{hO*U9bAq2E6DD`@QT$qaT4}TC{#+SKZ9v zdllwvwqMX?iA9gy+DK?-t|`O4BPWvi6T+UFnfUc99wK4fv$OuUc3jfdB58SYAZwaA z993Xlds)q4dPje(93yHg$Iev)jo$(Iy^|q&QpfDVS%utCyo?!%+}X(j8bw-E*rxJs zYrw|bZ0Oj)QclVn*RgOqIWlrw`xvp)#%p!$|9`AAo;?2Nb3jqfd-QVQpi$yAn{dfusXJ>gK=cy17 zc|G`kfU~Qc8&cPQRVYg>${eU=L{{Vo^NQ;wB zgd=6%4O~7`783~>;oqd3p1Shu1enMP5rKk069TFG-_zdyY54x#hJLiWqV_~&5ZEFq z`;Re0+8hQJD5{x7FN~@6l7KX;TU%jX(Jc9$jrmb;HU^-@8~lG=AFiR~VUh>==M%<9 zNPCzet;}yP&oh8L`e_Cb=S_$z7m0W~{1x0$#289Cbzm7FI=pCeO+*aBwr=g#T8j%`6Wyyr+Y zulfGJxI{m@Lc#25Di{*z{%vEL{tz0L2}93bxCY{i4BNv5(}&{3r7{w2Z`e&yh~X}? zF6{lV|5V2Oo$Fo(L>CS8R;>*{Oq;9Mm_(EdUa^|g;u~0c*Rta? 
z%i4*F(<*BnJ*6Whm}4eSo+}5|ek>!Fo_(*R=gsIe$sf2He(ehi%CE6A=8DWw$r_-q z`>axKWL%@E_I(&>T~|GU;zMg9eAaj;v}N**2jIldhqzu%egFUWc&QSI$t zAPwr^qf_kOMj_%3-F_~;Q-68s(Ipp}_pGpoMl)ka%W%IITCvp;AjK^m+8)E+NNdW*#?mFY$Eh7qWC8F9OVS>syAK0&{HOn5=glKGN^&n6;x_4BcgQV2MkemGdH$E9{e(kG$AeCsn4P`yJ<&&F zrwDpJ&vt#p$WJ!uF3pHkeTmgwX6J z6bE?cgXpaSfCvbd!i$tx>%DmM)<^Xdb7WfAHp%Z)rOZ3-B72p$ZRP%?NVfOmidIu` z^AuCix4c6SB`L<%=F4{r-gVE? zybb#jBiyV>{^VAKFUaqdiW5@ygd@2@B$1=2Q%8tT-AWB+HThcO-}VaAHIP0NHumpt z(9vpfP}lcSTDX8e`Hz@i5!I;yxtxvtP|~BtM}AK4xMGQ1^Mle)aa><#wGzd0xCt>8|VE6CG+LH$K}aq|M^pTzUM_y6v!T6}Y>SRHPlGBR?QRs+t@Jc#?s*9N)cQ>wqcIb#|P$+xWC*Te)m` zOSjetQkL^f&6bifWjeEJy1yHwp7!Tn%-v0%sW)w=)h(T20s_tD!|$t{$VNBLq{991 z+(jCJv`U;1rh^V^cDQmwGvu%^Iw;SU{cI#)!`8TQ9O)$#dd&{<6T;}&oqNz-5rXs5 zQE7&dhIfvnPy4pDZiw&Bu^MYgYFfGHqRzQE3(E+HUJ&pj&0a{^Tiu_te<3c;YQ1nQ zKn|U_dRq_!NrF8|(tWl&rwiSldDCEa?FKXgzUPXS&h{wrpN$RJu!1iUsU=vK;vITN zqDL+-p?VJd)X%Ro-PlgHdF0)-$Xj5}j~+#`P1E)kjuz|vN-xSKGY29!=ko3M0t`tD zs4b!HXVdYU`_i5_wn?jcw90f{05qJF+t~~Axs07H5ShJxQ8ILs(w@Nl({)Mz!@`pj zcMfws*~@I`oAC#6jA3Pd>j^QDR4oxsW6;@wOgMzgpf>XD{?wi%Eq{3EJ_H0$S5Zq8 zPqncNiv8SrMs0lHat)l#sUe?1x3`}HFc=S#oL;O_ev&P$5$U)9`rI5~^Pr2Lj?fX0 z0jziI+m8y@S*wj{y@tjyK!;!<_!}kR@F1Kn9QhcAW3Ozhsn(G4CkGBUlI}2pPz{-d zKpt~4nP%xd9|h|d&bL+qLfGPH%MU99~8i=QpAteVjPnhj($&6_VWw^V8;^6ao@QV}?~+1|3afCnddR9jjnx2>KO zIa&VVxwmpP5tEI?Wg9(THIN^Zf=Qi(n;Hu;=frp`XkCxVZBk~&-v$lM2ET|u-~+Zx zt!l9izl{VJrwW9L8e;?ZsZ;P*L0Z!nolnGDbY&bKq+QjUy^1V<;g;{sTHSJ<2x!PZ zroBs>Y4x;XY6Vt-DNF!htB>Lu`D)ebypX-GscMw*my$rEX`9i zIo?FpmKJi_jCQ-QIbo;cl&hclkysrhF*8E|I%5ucNec9`M9D^e0mQd^y6`+m2aU4J zGU|NmLOOM;NB)Tg2(^ZL4z!~<(%|1R4eWFitK3)3WR?mTtb8epZrDQGd&b_}#mEUl(H}6ig`LE4-vvQ(iE{{HS73>uNJm^5U z;n0l$^X<9Wi&XFVLbUt$bosFha@^WOt?T&k`HKTWvd=iOPac(YokSQ&{_f)$M!Yw8FU=Y|eDD&QQfmY;!#ZmElx&BvwiImkp29|NNoU)cGV2a$6?2CkbT!F;URq+uk=xvr7ijqZbw& zo)q1(y>ngoT(iQu+Lo*F&B(u>(c6 zRj5u3=Kh<%H>eH}Lw5y{J(Nr;|ES{`=C5ss)AymCj$VckTMKA>W|N}?*V>_0CW>l_ zM1XM<+SBBKJ4GvHI($Z#cuQV2)uSO-Cr6kBRIB~K^1~0NEFo#G300nj-*X7Gyh%A6 
zgi=cF0U24M5_43OP!E`5$<|1oM*9_>o@Jl{VNg(#C5}TSSE7N6$KW}T0r1~=LT;s9 zvuIX)T40G3NR~FkxtHeBir`lV|E}eceuj^>p7i=pkSJy z1sjOwRB*56H>be~eL>un>gOV>AqAF}@_j<23sCUpk`~__3wAiFR4Wuqs)h>L8V65n zBAsy8c%w=P&8tVNt!)t!mx_-zw-7wP-4FW)miEvSIWVgyOfnS!hZ=&~ii%~LK&du|e29|H^ zn0lL7JWz9;_9ob1=@zelueeBY;bru*)^y%tasw-Bo0a?s#1$<_Wyj3PSCp3MsH|n020T6(N_B1WJyr) z8VS9qTRy&|g|XOr3*`D8E*b<0OV+HYdh?=hiGFeQps|}JYRL~Qe+xa* zm~j+_KO35=pYtSO*dYszjDyxB(6u3AE=>npx@UMM1!|R%aVC)%N_|k-Vy}Haxa2@c zJY53n@c7K8oCSvc*UL+S1u#SCR~+0}1-x0Zgpsq93%J=r)7re5{!)A`@aI8Y5X+;C z3;Ph&xIR;{SyHIk@J4aD9;2`Z=hWo|r_@RE6ebmAqB*p_>T2? z=FLckqMF9_sgAkX+C_E+K6vdlG`6^Quj5h}K_K}pYhd1AcYbc3XH3A;>=_tthD;`o zh;5tUETJ5bswW3b0b>jE?62yhF=d3Z?JvjH)C%(fX(-luROM~~JiA+qmw;M;6ZwW}zn zw_Q$f_hvby%>PFhqG@wt`qgvhYq zfO&6AMa*=?rWXYByI)fb{pPL_TECfMl#T#{LF^!}ztPL-IiaS=s|e90NF~S^f-vhd z8H5?ZB8=83Ze8auj)TyHW(24gk5sVIwR8fCsWlpN>$-e@UZfDZV69y;hVbg^-ye&D zHSn;)TvrdP~9-%(MJtG66>$xIL&~-g3tDZdC9U%QGV0(QDHz$S{s@0 zlhx=Na8u6?EoILMRWVNTeYVby&He&PO!wq~T)eObd+Hu)=SICnDlMIUw6*ly_vDbp zC=<+mlVpGMrM30==!A4K?CD%5Z0RRCoUf`SaSzykII5p3UO_hBUp(zq;`@~BnElfO zw#(}6DL==kmv07AQ=l!huK2Cr-~UAEZ5Tls!pU_s2=Jyy+&xYw zesDmXory~RdT*0etzbKrCxA!E5oK_ey|)KMyh@&H(tdn}TP9#OUVFQ!WlH0+!`g%U z@^#Nq?|!xlO=bhZ43dzKD+hn~Uo=$OP2>iFsz!z?TdmsG3$GP=i&Se>K|Cvoil|VS z*Tu2k=PA|%LreUg4J2nR9ZGE`jjvPM@`$8KqkmbtVJLY>PM_$Aw-He#gTUrb1Qe_jZ-}N?^j3_|gMyPnFmj zidedr-KqPbviI(D40)p?5Oz8F(NzbIbhhQD8d&upVTViB%(h|(Vn?@b>o>7EF3HQs zm&?u;^po3&U;{3=YjlqIcjwY!t;UGaw8JK(Cs0EB9Ml*D$JKEJAN_LpVlE$+Sdd+P zLOE(djcb+@vf2Lv=RCe?rLv0%ME%?meiFi(QTul0!DY8iqkwloa)h~SC6NG)*p zCjfe^&s~a^X!xRj?zyTlzv2Uh zD5SB=osYsMjwEVtZA=m3;aXajieb%v717B=Pf5e%u~Z`b9So#(j2~eI;Xq5HAxonj z+iZd*5JYpcKJ0}rZ&Xf()NqF0UR)XkIOXxb{nbX;OutIYf>p0Wy3{_LLvZ^Lq=i#I z701Kia7Os~LiH3oZ>4(jWoWkqM-HZ7=273B*pQvOF=cDfKUl=%+vGMD=vjdCGJTe&@j7PCNX)Zygcdl z(>)Xp>;WhEm~`QG4G4l@rdGJoyvA9eUtOS<>nlr*dMPTMh)PG<4B4cQIb*}Ycr>qI zGE8w>8VBj??u5O$iu3@Tv}`VX%8!bXt9nurOoeg4ONxE5;bm(W2m#SuzHoj`tXgQ` zHFQ9FfKql4_Xy*e?2H``P|JL}l^G&}E?Rr_W7y777A)*jJZNWu#4SHhg-f*%6M`tx 
z*ZN(9Xhs#}Yd|WJKquXZeBOIw*fGId`Y4(zfZ$|i$Jk~V2Kt~>Br~VoSkprcg zNrA=8v-`J#$1+9_GcT-HO!+>om3WsHDcO8eaQ6a8rWyyg{GgVfzOJ*Fh~R=#wJ5LO zSR(uImGrEdGhEqqi=)E~cK}cs2}w2Qw~K3Y^#Y+iWvUI}JY()uA_l>hu1Z|I?Ykyc z8}4fFXm2$s^wcd~x%xVw#quv=YF+4^IJFJ-=sxM4mz@))>EjGW_$g_h&(q*LP1V6{^KMCYdXtA!96<;V(n$ zu(HQ?uHem-W<>P6{l=LP)6-D*BDn@%TsE;#Na2w-DDld|Bew!={ZygE=6A=gUgJT0 z{|rrqE*^g!kg~~=@M_799%?ei6PBWMN~?$noZrFo6BnqTp1Ry#^m{)aUI0ZyxZf4~ zQMuKSQr>{{CR=Y@xbZ{Joh!)xf|~bS<#{*rs?YO!JxWv?8ykDU%!S|8TW3tI`n#xE zwiM=!4271i09Am{cPiL}noa6EO`}M{yXWaA{yE?s9A+xx^?yk9xPWQRV59R%QwxH_8-lDPU}9Qnp4E zT>HX|PtYknh&SWrsYtJMvQotPQC!0eAEIiR`_Tz4O3&>Znnr{j-nR?j4Ai==IeQVP zB49;)nHiF#fs`Hk*0b77116!DaE&2u`pH>y$B6LiOQ2t>n(S$b-?!IqwVY6@40bV- zy`P1Y{nSd@+vuNlfmA3l>Tf<=8UzpANwRtL;StKzg4ct~^VghUGA0>p%i#60bdJ<7 zZ?-&TBH-0RJI|j=o6#PCVT*hge)0N9q_Q2DK`TqntSzcs8#DR^uc?=BQcT0EP^r=W zEIzL{;IZ=^Rrie;CC4jz!Jd7kVTW3hyQ5nZ7D(xb90pLidIbyZM+zq`>lKtWO&o0j z9es%)HqPZmu@ZUxJ$6zf?I>znxOexUsWEcS!={eOd^dJN4$5J=@AIvw@uD{9q9sBK z`;?rA%7m!Jpdk)xaGnx0Rkk+qng!&2y&bt;8ecrRy3v2!@{d*~chBsu&iE-gJrfxd zA6vY@HN+`j2>K?mVEFHZAPl6668X7`Qw1T61B+63b^`bp>GN?M30pl*m&ThVY8f|P z+{e%eXcEXcV#A8XAEJ6|qWGZ&H{9Tb@(X?KfV){C*(K6;w@UncOHfnwgXu5eRhKBN z@B90`>UH&Bs4#6`BF41O6YojVq$YlAs&pq5Mwg8c-9bplAQ%AXjd)!ve2eDaXYZy)BK$l6< z1OZUx)NwbMA%q(-BZ@sQecj@F+()1Pe1@vn-yMUhP~n^qPsde@EkB8(Rx;BVS(|MA zbfaVA$B&Li`**Pjt^DWf#S!zw2B#Ir#`Gq6E7n@b4|pHkqvw{n83A71r?rDxglhQ? 
zE0|+1j;kSB8nH-kppQjY%1?(TTj!|Mt7amK9%{_VO5XitRqO`?fdc5N2qk4@)O)MT zwPe@RWD^_3;y=Vhlqmy=>wET%6$0Z5aG8%VvGGV6OwadrUH)cJQL#k9W zyD6lsnzeT!mhrp(w9L2Eli<-$+OrZ8qK+-lmD5gZQj5A3W)M@jpiN2drwh!g%U+hh zJ~$oT)mt`-j|@Kn`oS{w9&s*~H^L8Fs>+4FLK77FGwSnHHD@?C=@l8M%;wj&$`-D- zNx&xl8pd%enLFnh!R%Rv-n&~nY-f)Z;I5$)JAiVbNVV{8mZ2&w{?9hyq>y8(+7HiQVAPwM47e#rf*8a3uEUUT zXWv}_O~mG-<(s@kpwtlcu}GKLxLD?osdG@D~^tN z{ab(jZp>OElj`e-n!s>zzO)s0Gvpc)-~%q))j6?rn^fv+o9E4g;LH+%qObKJPiNcw zefyV@P*;V6+=t!_j-fI2oNH}CFi%L%g(3rEhJXQbYJEL}#nM%R^x&X;Hi-~8 z1Zu2s(!|9AX+$W&AdzM{PYe=8ioz0f)Ou2i;k@W&C3Z6vpO3Y-DbtV6+`Yux+~y%V zkY#P{nCIeh(@D5Qtwarsz~PTOP8WlLm+i2SEI`LXi*+JX6IJZn(~xH&CM(+_7DoHp9h~Um?&V7xIEgdCTq-MF=TWigq<={O&4s_JBkaC1)*W0g0%YoAu zS`uRZZLB}31(!%19M-lCis(wrOxF3uS{mmFOGJUBP5$ghZR zhgxoIxCUxClXkYE)Tx+sNCo7bp0X#w+S+=uiW`A+!VXlP=$iP>ZTFRA~WoQ3*xy_9gz8B;s`SM$8rwf=4&)%H%FTwDCY zU(PrF_V16W-9^tWpZ50l{a?Q}w!Zgz{4-bSd4^ANXlO4X896b&PO6V4XmC42bwOX7 znyw;uyk5U5-jcwLpnZHD7t<^rijfw}%m;I*!Yedb}?A zn2t|BRq~l1<74(Nf)5Ulh_8Mg9qGRdj@h`<(f&5p1a_%3vzE!02oyfDDN!K?`yd1R5@T%pBP|Wh@z&2@EWpqi2 z+X(+jvm^u_)eAF`tZbW9{{V^*rvF&%abo@bJEHxzqa$=IZm*Xg(Fb(?!|hUpZqP?# zD1l=Gj`S>6?R#D&E(@fIpF~>xZT)*u(|eR#dN}BlTB6nD_U<}eak!O!9&HTypzaG< z@M(4gc~z@|63IRYNBQd0Q(u~FN^9PWs0{#$cZ@>O8YX(PysWIo@Ao@ZYLlW7MET1M zI7w3j{mWN)3dUC5k~gJgO_nunP zaosWR3L)0weLIM|TD3u=_;6_)0I6-fJ$R8|J~iW8|D^DtnunOpDZ)dgGt|$fiBQK> z6zH0qDtitsMs#P<#hiNpFFmLtqdBd4bK=`y70a|kzh=5=He8PPI8FeU?QSMN<5RrM zak}kb*C}p~i|cP5e;2sXI5xVl|6Oa8 z1Lx66`4kYOQG5aoMSoPk8qCM$AhZG$mu}eEg?lNt|M@-qq9csC-Zmeq^jHv$GIp#H z^b(WSA-GJ3J7KG@mz^UZWyR3yyeWGUJwTbsH{dQ*PZ$k?*;-(3<#HpN-!y{cCe=q` zjJb&oqOyqysSj!1!rFe~UY7dcHA7396WCqu@p7`4RJ%+;gzXw7AETsy9%E5xPL=nr z`rh$m4a(jR3ccGr+t}2z!#w)#(L7TF?rbddm45d1<}F7qDX`VaL+*_ z)4Pg0LSEJ0ho(SXc;n_dKyWUI49KC-*HJFOukpn+Qub+St6cRHSUA-b#8x$tf`>~* zmHFZ)(1*`5LW{U?&>FK)zZ~{!afdhl{XA-LV}r}&t1pRkzNDqPp9d#F2mSDaX*j65 z6*l1UNJ^WNv&FTteB2Yq$P9dSeFpK#WTs%*;+r>6SuOUW+^|f+Q2i3_mA_Ic2tJpk z()abE-gb);GQ5aP5JLX6sV@k^K?HT<{;rlEY6j2`mxBH&4LA9_a0sV*1jnCF$DUEZ 
z+=-aJapMNabWQKpwUAepD-mJCw*i1I1H}c)FBGj^E#9;ua`QNr341%PL~l?SEUUVo zi;Eq8R>>$=As^b_-d^WAuqPbtNtR0ly=c7QZO*1nb+_~+^s0Ceh7^Mm>4>?-`^iWb~=wrP3wIJZkr3#uI^R2X0f@kp`-+S+0Tx^t(y}w z|Ep(txlEf>$njELoe%v!XdSn#dqSJ>gT-0SIVakT4TaHfGkMt@y8N)~s%@y&D928} zk7Lnj`IB$tEs%$L<2dM$b}AlYT5^TkpY-%Z_0Y!+sYGJ3n(5_o_`3|vGx+a|p$}19 z+~#tIb`IG54yo#!@k+!0#a`k~`QM{c(361RCH%A8h79_HwX5g2-o3v5B`r}91XMP- z??c(F)Y3){HtsvPfXr4DtmUgA+QafWOM3eiuV_Y4JNwky+AuYZS*Vw&t(pEGAps|$ zMJ;N!w|CiEi8)BBukS3sdrPy1Pfhl5S)2^YFcG4lVuo}QZrK?#lQ-~$^$>5ezfTj8 z!@-YD7$&Mz9e=0I{<`baVdTHrw+D+GyOQyHd!Q=+wz)g4K#xXc&9jq|og3CjD9mE5 zDGqx{AZ3N^;u6B25`VDttCw9q&a?*T^18UJA1RKx;x)Y;EylF1%00D8GBq_d1r`7g z0{8vmQPFI5K5_$cZ`7dWm-)9Jolc@5hS6niuC6|gJ_JL&Vi`w9 ztOW!(G4GGIKX0|QnEa$Xuezja?C$l1KvX{)Si+4UgcYqo(WO9n(J{|vq-t4MSUB2I z@8ZQ1lK`{J4vG6lS5h8kv0~S5(lsFOdOZ^K%ZHl?sGB!`5{C}Df{IQjsuvYvoP_$D z9MLpI2SW%OA`!KIAjdVJeHo%6Cttm!Vq}p2=`LxV-R*ec!=$qzxb9p0*4Uu8!XYGn|T4WKv(d=m}1m@9-}V{^DY2I-D2 znLqqF;;>)7dMM*a@rLiBYs9$xmHkyxbEv5<$K*!gb z6)ZrYeq(OO)qZq}w#5Gozrk9@+45BSlxX5D(kL*o8oa%2^YO9aA+KfwFQYSAl(5x} zm5iMjZ&IOL2?k9Bf{HF)h8Wkp*}D?d0~*pZf_#5eO{{?cp|ufVA+I_Y?>KGCQ^!EY zNa39h`sN4cFw9&iyC)Oia9)UCTKHyDY=ZBU8V5? 
z*OiYwbpi4V(G_|8oQ6&J7Oy;_ozxNe95T3`QS z4N*xsa`+fv+QfuBwrkj_(B8Bj&{TF4U|;=Ag}UQtGa>)2tAF}RA|qZy|MT5bg_RzI zRP=hh{qtE3sK+6zL&};Io99sPhMREQgt+qIHw-RpfXnjoszuiB`euUL4eeoM6+4Ix z#raP6B8G?UF&pURvsqgUxBLx~EMWF*!)8mplR%(j2k zWdo6tbEBrQ0Y0RG_}_q77(3Q4wc|uBXk_H=Wukx$iMZE0!Qb1z(yCywcGHoD!1ZU3 zJ3WLNLR?&3so#Kk{eIU8%w=LHh0BX|%JWuw9siR=u5uu)hWHP#IiIQQg?fM}uZS2c z`J`v!2hnAZho0`m6p_et(b(CA;F2{*l?a{EyaH!zfbQMh0ZG8~K4CqV24(N@3kh8= zQ5IrwPNw2-VXBD{x9&jsE^QsG=n{FzdWCGRF=8%l*JxV~5a^{=U2vYZZ;56Cz&f+ByC22{ zno=Jf7_bJOJi?fvN_pU3I`iEAT;Zv=hmmhj=EfcFOv5YOUAk4M5U=!XcaR)+n-!mQ|I)U zIC(fJVdEKh7Xbokb`JLwPJ1NkImqCEyMYA~OQOl)zIoJZFgk@_=wH+u+12&3L=MmH z)+ns@^aLduV+uOim^1V1N>UGEENwSv(RHnI=ss7lT8v&fp?M`|wj*{#DR#MCc1}&rWg!6Baosc=^g(rHS1Xv=i=u#+T)q*|MzHW4%NgrL(zoC{KQs-(r6);Lrs!$$T>MR za+ol!Ma`l#r<|TVMmZKChY>Pm8MRR4xL6D;!yM;#?~nbr*S-7n`CRYoeO=d^{#b2a zvJ>anm0`CsKl!&mA7y#BS@2mwUK8@<3>;(%f2gjW^HS+bp{zsD0;9SN*%$FY?!dsn zw^gnQ2#VAK{h>>VLY%6vRC~704G&ffv187x4CdITUE|jWu5O;eJVZ@8S%N#rIvvOR z-tHbU29TEHvs6^Ub1p~x3`#*+qvUZVG~Y}VlZn6MANP0T3RXHVvT4LU#LsnC_AWc` z=g?mu?TPem3Dm3IU7ixp3~5W8SO?9mPj{iQtI z$@Axw&w(&x7k#0QhMrUvbV_o`P#?KYqz)b0F*t12caGvl2_tT%wQa7d z7MwshUl}k66S$1b6>dFiOW0fm(&b;ZlwC(2y_E8^Bt1$HtypwL3EnZNG~U$?W+IvGkZ$4vYeey@!%g8X5#?*SdYV`a<2{< zaluYY0|vx5zcWe$uUY!$MSwJT-nFg5|d!I4>#T@q{GQGgt*u(K*FDQ$T2`W z#%65O2H{6j-?s<+ccDCJ`91dyx`QCEDg2hG%$J5A zc~O;Lt?x^+;6IHJZw%y`t72>saI$=2;BQLNyYC*>N)ksadbpo3)*9_cR33sryD=)t zX$W1=Q8^?o5r>sEgC=aRc#465v2lUAx_GWSfsxI3qDX^rGPbT151Dq;v@h3znV?Wf z_^(?Th@4#@HFRrtwyxE|260nWui;$*Aip)V7mO2+K-U!w^s5%D!V1!oMPcLdE7Q5L z4e8{)!#7LYb`sK{jcsk+53dE4evt%OXy9;_k#aW}!yfLQHi$m^a|g(Ir-PJs-J#+$ z{WymC4y6yw>Zz(s81Lut-*8f8bRin;MRm@^v)!rkUQ62}>iWjlv!Q^Z%K;)Sk;eUK z+Sb-K9vo#ZUgLI))GO*ROGO`nXtN3O!rIBL-9(#?>w7{t9~$HKAJcv(=zkkQ!~rwo+TLwR_fB)NTx0Dk_47#sVX zM`(7fJQ-Bt8y@sMoN^EQZ;@v#)DnTdmZ+=8!x8|6I7U& z%8N9?$5gMAFM|H8_Xk5E(5~R=c5oLJq=>Nc znCag@=0p2H+Qe{vzsV`^L~rkCtLdO$c_rb;n^n@ z*TQt@ge%8&F?VDM5r043by9SLQ1K&%DX=cn2I8qWVYm6uF?S_D)06jKmj4E_ZEu_0 
ztmF~g!UdUkU!$U)C+o4Qs;csgQ@R=^-1>x5(KUvX^vlQET7N&1$FOwX*y#hb`}dvR z6(cf|RZ~`W(0R9O$RJQcDt`bfO5#`mfEbdVjI|MCViOjdQg36W$zaooN{^ej9{jo! z7=_YizP!)8Zd^RcE!~5dt}$B~J855gvrh?@0<8&#WwEquKEn9%WXOVk6=3#e*-HbusWAfgpSlD@}{m5bB-xSZ~ z&{O$r7Z>A{s{0Z8zW$ZT;28`PQhZsL)l^j*k!?L9MO*}~X)HrqakkwCp{#H%h)HmD zw)UtMhfgy0jN-^mzo@Ucmy< z7qLd%672BJ>60Lv9uPYqtj?^CJ>WRiqQxky_jl;$u zaNvYvYlho@A?Q#A^>dW|Q)lEDv~WVEH&vq8tWWE|JXDhW`;XoIb?1iaMaCinj}{Z7 zO8m(O?~rI55c?q#j01Ye@>6s$$gT1g!W85CMg0ME=7%=~1q{#Sx!E!A=7QGWnggt) zxjo0kapjhCR?ve7YLUhw02tcWU65uET0%7(^uJ>cqKnf6W5ciZz|d&(+#fgxNPwgh z`Qnkp02wA&;s_b4i^L+oLnW>AE-Ax5l3SXZ?#t!(ozH$B%4lqBhLg?WHh|2e){P~8 zEZP&vvTqhpzS}SqGxIkd>g7;o8E0Zlh{%F`+w9gBwiqY;WoNp zKm4kU7&9eVNxr;R-H@f!CotDxgSwJCPjtW3k@1*0@_{pJ=;(AwQMP$7FpEbZi#er^ zR8-j3WZV+`ww5U`taVGqX=A%#{31C8i1Ei}TvwO=?@Q_8+fq4&&rHJH@KJbi*-*$x ztUw?LMKT9tt-F8;EH=Z+KAhq{-U+yGLATbrES%;S{`B=}C4kET7LVcjh0T-9Y#u!# z^w1{$kg~HTb8Tt*LXz!JByj?NPEv zYaD_eH)ftRf$*aqwbtU9Nlpao%=KJjv3bJv;B%$#dW0=yx@-c(;kFv4KXwUy9Pu!J z-$LtlA5b#8>P!1`4E-8^VUi3z$K6i$uCK4-n@7X-^G{I!>#}puW#`0gEN{(DPAavn z;bv+ARWM6tF615nJA1~jSjqi6%LW*jz~`&Its$GgIld)ng$1;a%r`ELmNc^k^%r}Z zb8|}sNE-}gAe0ZFT@~}{vWf?&xmIKR-MNfVR*Z{Ydxd#nfta{1$Jg zNao0ytt~V+*j-6GCTW1>cI@>1Pd9ll3o4rwHNePENO`MPY=YzwwL(!ID#(tS zaJIUv#Re|kTDFlkH{4U`U6A4Th6y|FK!%1szYS>mQj>Q*d~#7bL{WDa0&X%`{) zaIc>n$Z+}jUIVobU4*6k`R_{Oxg^vZu(9PD6 z5f+P8q*IZW0;56G4}d|6^k3fn@9MYo4E_2y|72p1rDWjI2w&^CGI5D{y3X$!i!`aBzb|E z_%ZWE;+nYIb89JOL}>`cq#dEZK0e(vFDkpglHn8J&zgl^?aB6WM=KJGbV6UXE5H}l$DJZeHSpb!+ z_H0Wm`({)by|}oTDvPq`1RQ=M680-t8$@4+I=xPf(5373EXA1V zAN(KT1q3b<8N|PiT`eD=picG)4fldOyV$rHSH_rrz2pVJoiX2;9NoPw?%Mu8-d;M{ zyCy>hPJ&cuR+U%i=(1i}_MEFB7qpDabrT`-`{2|{ina-FzQU6M473XY zh&B}e3wvyCf>A0b38}2(0)^Jl{%2*BUjJzylX=zberT|YBl>EgoP3S4HA1WRIRC$2 zxR2Beu6}d9{Mfs1B#>98wXZ8}i+{c4lAup29yflJzktdiAUJPpmQy~{8~{j(lR=gS;JpfyH=b+!uNcFxWRF#c!4*~E30C-6TB1re_fa-|&}yh(tYC)4~Gw(QP01Ww)1e^(RU(&FxR2QILKyMEM`wG|nF;snpUSp@sZ> z-?3hY0!v4+T}LAigWpxv6Rc^UrFgjT99wYB=)l0_vUsu-5Efz*p`h0v@gxeoqfz;e 
z{xQtQdl31W!Ca{PLxd&FD<^|%Vy)Cu6Fe+lpVid72W_w?Mnpu!<9`_Lh5w2P9SLkb z_)|I8@2iOwjL~-YOj^{u$b9P$r();N#!3)qYJ8`gxc0Xjhy~kl0Y;z@|CW31JTBNB zz)9IO#^_j11b2)?t9vpC_)~|)3vHVXq^D&%VO5?jO+xxE77&gRZ? zp_m(%AXKd+3`Nqu4%}Ki+IYlVQ4B>PJ4*u8pml9MANf7dTsRr#2APt+b(`?^Mw7lA) zi!dLyl+6v;4EL`NU6&F!YlHJIb-IAav^tnx<x*-dJjP((S2v*V?2BcI3z*U(f=1 zEzzj6J+K#BKkM6@YxH=ZVtC{UA9EBU`vB)#mK7@XevY;CFH~1mkTM`C#k@jUKhJbh^gaxmXGWN)0CTWGW=BQ`QJvT)k*SP*nR~2bZM1JZerHsK@gqlMge|S?gVflTX$^MLLvH;fysD<%gQak%Dtd>&`rDsbqKISRR@HWxbA|UaQ1g)n|MAf zWc5fZd^V9qC@US%WWR$IDSk~hNmJ1#A%{baF}8MB>paRed}#gzbe}K)*+)3Tx2l_G z?4PVvuM-uZD2RF{TR6{XKz~roBC9fE#-oL12Ft}Y6(nKy4XiZyh*TO%gQ`fV^!0zc z8`_ev(sip&5{b0V0&8Nt#vR!N@(oC)mSy2pWFk4tH23+p+!?mQ(~fG zI?te83iEIw7TEctYF(X3LfkP$y)%H0@$~5Fu+qTiNgiKG7wboZqnh2_hpIgou9e1q zIjZ~?(a7lP)YO4pzkZr6cM}Yyi<((kBYY)8gQAmT%KIle(uLy zSnGD@>JmvhiVzw2*)Vl`y348{YjDjmZU4E`fJ4{eoOyKEI5B2ey`?rX)07Fz(;2Msd)33$pS%)<#gQhy&h`qNDouBN7zTFQt%2;Toi_rq;5@&Za{u@!!)8Q3diz@*e{8 z2Fs7VFk@bJHo_p8mXQ1swHu$`**%m&!01?iWJkqkCk*zbi-D(&))9bB&M0>cQZ;+= z?ej()`ULZU9oUH~uT>FpDu|?b;E2u%Tj|Gee^(F1^#iYKM}fyV9S5}rh*V*X9)eDu zSh>Y8Sw4a7DeIwpHZ9D$#i-)PK7h_Pp~*MqZ&pe@+PDFikzVuqoq@~2F@H~lnCJ1G zR~(7kLHZ})|GOuR`Ru$~Uhb0wKhq4A5rDI`R;JVNIo?I&qlwDX=&L+Eo*^?PG?$aG zAEnFBFpAyT$^+dT@ybiu+}!kAKa4>RYEbJ?*cq20Kv&W$oX`6aYMfWwT?$|vc}rvz zke7yRt*WL3Z%&C*JhwLt07kN>tZXRKxys~O-Xj{0g61BQ|60H_W*#+_$b~86MyPm zNvRoz>dwVFXOxf5%!#{H0T&xgVe0-fw=O6PJFp_vZYXu5k|>;E#nvHemKJB!G~SMe zdbA}}(sU?uGh(ZPX+VSXOnG|<*t%G`{PCU1w4J}|;ukuyU&# Date: Mon, 26 Oct 2015 19:27:53 -0400 Subject: [PATCH 131/630] fix #8, more informative error when libmxnet not found --- src/base.jl | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/src/base.jl b/src/base.jl index 5e547de727c1..0988400b9d31 100644 --- a/src/base.jl +++ b/src/base.jl @@ -19,6 +19,12 @@ typealias char_pp Ptr{char_p} const MXNET_LIB = Libdl.find_library(["libmxnet.so","libmxnet.dll"], [joinpath("$(get(ENV,"MXNET_HOME",""))","lib"), joinpath(Pkg.dir("MXNet"),"deps/usr/lib")]) +if isempty(MXNET_LIB) + # touch this 
file, so that after the user properly build libmxnet, the precompiled + # MXNet.ji will be re-compiled to get MXNET_LIB properly. + touch(@__FILE__) + error("Cannot find or load libmxnet.so. Please see the document on how to build it.") +end function __init__() _import_ndarray_functions() From 8bb82e437b5ae1b947e2650139c2b69f13d37a6d Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Oct 2015 22:04:46 -0400 Subject: [PATCH 132/630] use sphinx as documentation system --- .gitignore | 1 + docs/Makefile | 180 +++++++++++++++++ docs/api/ndarray.md | 247 ----------------------- docs/api/symbol.md | 73 ------- docs/build.jl | 10 - docs/conf.py | 277 ++++++++++++++++++++++++++ docs/index.md | 8 - docs/index.rst | 34 ++++ docs/sphinx/julia.py | 23 +++ docs/tutorial/mnist.rst | 252 +++++++++++++++++++++++ docs/tutorials/mnist.md | 150 -------------- docs/user-guide/install.md | 29 --- docs/user-guide/install.rst | 54 +++++ docs/user-guide/overview.md | 267 ------------------------- docs/user-guide/overview.rst | 376 +++++++++++++++++++++++++++++++++++ examples/mnist/mlp.jl | 2 +- src/io.jl | 7 +- src/model.jl | 6 +- 18 files changed, 1209 insertions(+), 787 deletions(-) create mode 100644 docs/Makefile delete mode 100644 docs/api/ndarray.md delete mode 100644 docs/api/symbol.md delete mode 100644 docs/build.jl create mode 100644 docs/conf.py delete mode 100644 docs/index.md create mode 100644 docs/index.rst create mode 100644 docs/sphinx/julia.py create mode 100644 docs/tutorial/mnist.rst delete mode 100644 docs/tutorials/mnist.md delete mode 100644 docs/user-guide/install.md create mode 100644 docs/user-guide/install.rst delete mode 100644 docs/user-guide/overview.md create mode 100644 docs/user-guide/overview.rst diff --git a/.gitignore b/.gitignore index 503353f37bd0..e2b2ea70b3fc 100644 --- a/.gitignore +++ b/.gitignore @@ -7,3 +7,4 @@ data deps/src deps/usr deps/deps.jl +docs/_build diff --git a/docs/Makefile b/docs/Makefile new file mode 100644 index 
000000000000..e1763e330fc7 --- /dev/null +++ b/docs/Makefile @@ -0,0 +1,180 @@ +# Makefile for Sphinx documentation +# + +# You can set these variables from the command line. +SPHINXOPTS = +SPHINXBUILD = sphinx-build +PAPER = +BUILDDIR = _build + +# User-friendly check for sphinx-build +ifeq ($(shell which $(SPHINXBUILD) >/dev/null 2>&1; echo $$?), 1) +$(error The '$(SPHINXBUILD)' command was not found. Make sure you have Sphinx installed, then set the SPHINXBUILD environment variable to point to the full path of the '$(SPHINXBUILD)' executable. Alternatively you can add the directory with the executable to your PATH. If you don't have Sphinx installed, grab it from http://sphinx-doc.org/) +endif + +# Internal variables. +PAPEROPT_a4 = -D latex_paper_size=a4 +PAPEROPT_letter = -D latex_paper_size=letter +ALLSPHINXOPTS = -d $(BUILDDIR)/doctrees $(PAPEROPT_$(PAPER)) $(SPHINXOPTS) . +# the i18n builder cannot share the environment and doctrees with the others +I18NSPHINXOPTS = $(PAPEROPT_$(PAPER)) $(SPHINXOPTS) . 
+ +.PHONY: help clean html dirhtml singlehtml pickle json htmlhelp qthelp devhelp epub latex latexpdf text man changes linkcheck doctest gettext + +help: + @echo "Please use \`make <target>' where <target> is one of" + @echo " html to make standalone HTML files" + @echo " dirhtml to make HTML files named index.html in directories" + @echo " singlehtml to make a single large HTML file" + @echo " pickle to make pickle files" + @echo " json to make JSON files" + @echo " htmlhelp to make HTML files and a HTML help project" + @echo " qthelp to make HTML files and a qthelp project" + @echo " devhelp to make HTML files and a Devhelp project" + @echo " epub to make an epub" + @echo " latex to make LaTeX files, you can set PAPER=a4 or PAPER=letter" + @echo " latexpdf to make LaTeX files and run them through pdflatex" + @echo " latexpdfja to make LaTeX files and run them through platex/dvipdfmx" + @echo " text to make text files" + @echo " man to make manual pages" + @echo " texinfo to make Texinfo files" + @echo " info to make Texinfo files and run them through makeinfo" + @echo " gettext to make PO message catalogs" + @echo " changes to make an overview of all changed/added/deprecated items" + @echo " xml to make Docutils-native XML files" + @echo " pseudoxml to make pseudoxml-XML files for display purposes" + @echo " linkcheck to check all external links for integrity" + @echo " doctest to run all doctests embedded in the documentation (if enabled)" + +clean: + rm -rf $(BUILDDIR)/* + +livehtml: + sphinx-autobuild -b html $(ALLSPHINXOPTS) $(BUILDDIR)/html + +html: + $(SPHINXBUILD) -b html $(ALLSPHINXOPTS) $(BUILDDIR)/html + @echo + @echo "Build finished. The HTML pages are in $(BUILDDIR)/html." + +dirhtml: + $(SPHINXBUILD) -b dirhtml $(ALLSPHINXOPTS) $(BUILDDIR)/dirhtml + @echo + @echo "Build finished. The HTML pages are in $(BUILDDIR)/dirhtml." + +singlehtml: + $(SPHINXBUILD) -b singlehtml $(ALLSPHINXOPTS) $(BUILDDIR)/singlehtml + @echo + @echo "Build finished.
The HTML page is in $(BUILDDIR)/singlehtml." + +pickle: + $(SPHINXBUILD) -b pickle $(ALLSPHINXOPTS) $(BUILDDIR)/pickle + @echo + @echo "Build finished; now you can process the pickle files." + +json: + $(SPHINXBUILD) -b json $(ALLSPHINXOPTS) $(BUILDDIR)/json + @echo + @echo "Build finished; now you can process the JSON files." + +htmlhelp: + $(SPHINXBUILD) -b htmlhelp $(ALLSPHINXOPTS) $(BUILDDIR)/htmlhelp + @echo + @echo "Build finished; now you can run HTML Help Workshop with the" \ + ".hhp project file in $(BUILDDIR)/htmlhelp." + +qthelp: + $(SPHINXBUILD) -b qthelp $(ALLSPHINXOPTS) $(BUILDDIR)/qthelp + @echo + @echo "Build finished; now you can run "qcollectiongenerator" with the" \ + ".qhcp project file in $(BUILDDIR)/qthelp, like this:" + @echo "# qcollectiongenerator $(BUILDDIR)/qthelp/Mocha.qhcp" + @echo "To view the help file:" + @echo "# assistant -collectionFile $(BUILDDIR)/qthelp/Mocha.qhc" + +devhelp: + $(SPHINXBUILD) -b devhelp $(ALLSPHINXOPTS) $(BUILDDIR)/devhelp + @echo + @echo "Build finished." + @echo "To view the help file:" + @echo "# mkdir -p $$HOME/.local/share/devhelp/Mocha" + @echo "# ln -s $(BUILDDIR)/devhelp $$HOME/.local/share/devhelp/Mocha" + @echo "# devhelp" + +epub: + $(SPHINXBUILD) -b epub $(ALLSPHINXOPTS) $(BUILDDIR)/epub + @echo + @echo "Build finished. The epub file is in $(BUILDDIR)/epub." + +latex: + $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex + @echo + @echo "Build finished; the LaTeX files are in $(BUILDDIR)/latex." + @echo "Run \`make' in that directory to run these through (pdf)latex" \ + "(use \`make latexpdf' here to do that automatically)." + +latexpdf: + $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex + @echo "Running LaTeX files through pdflatex..." + $(MAKE) -C $(BUILDDIR)/latex all-pdf + @echo "pdflatex finished; the PDF files are in $(BUILDDIR)/latex." + +latexpdfja: + $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex + @echo "Running LaTeX files through platex and dvipdfmx..." 
+ $(MAKE) -C $(BUILDDIR)/latex all-pdf-ja + @echo "pdflatex finished; the PDF files are in $(BUILDDIR)/latex." + +text: + $(SPHINXBUILD) -b text $(ALLSPHINXOPTS) $(BUILDDIR)/text + @echo + @echo "Build finished. The text files are in $(BUILDDIR)/text." + +man: + $(SPHINXBUILD) -b man $(ALLSPHINXOPTS) $(BUILDDIR)/man + @echo + @echo "Build finished. The manual pages are in $(BUILDDIR)/man." + +texinfo: + $(SPHINXBUILD) -b texinfo $(ALLSPHINXOPTS) $(BUILDDIR)/texinfo + @echo + @echo "Build finished. The Texinfo files are in $(BUILDDIR)/texinfo." + @echo "Run \`make' in that directory to run these through makeinfo" \ + "(use \`make info' here to do that automatically)." + +info: + $(SPHINXBUILD) -b texinfo $(ALLSPHINXOPTS) $(BUILDDIR)/texinfo + @echo "Running Texinfo files through makeinfo..." + make -C $(BUILDDIR)/texinfo info + @echo "makeinfo finished; the Info files are in $(BUILDDIR)/texinfo." + +gettext: + $(SPHINXBUILD) -b gettext $(I18NSPHINXOPTS) $(BUILDDIR)/locale + @echo + @echo "Build finished. The message catalogs are in $(BUILDDIR)/locale." + +changes: + $(SPHINXBUILD) -b changes $(ALLSPHINXOPTS) $(BUILDDIR)/changes + @echo + @echo "The overview file is in $(BUILDDIR)/changes." + +linkcheck: + $(SPHINXBUILD) -b linkcheck $(ALLSPHINXOPTS) $(BUILDDIR)/linkcheck + @echo + @echo "Link check complete; look for any errors in the above output " \ + "or in $(BUILDDIR)/linkcheck/output.txt." + +doctest: + $(SPHINXBUILD) -b doctest $(ALLSPHINXOPTS) $(BUILDDIR)/doctest + @echo "Testing of doctests in the sources finished, look at the " \ + "results in $(BUILDDIR)/doctest/output.txt." + +xml: + $(SPHINXBUILD) -b xml $(ALLSPHINXOPTS) $(BUILDDIR)/xml + @echo + @echo "Build finished. The XML files are in $(BUILDDIR)/xml." + +pseudoxml: + $(SPHINXBUILD) -b pseudoxml $(ALLSPHINXOPTS) $(BUILDDIR)/pseudoxml + @echo + @echo "Build finished. The pseudo-XML files are in $(BUILDDIR)/pseudoxml." 
diff --git a/docs/api/ndarray.md b/docs/api/ndarray.md deleted file mode 100644 index fae68df32c2b..000000000000 --- a/docs/api/ndarray.md +++ /dev/null @@ -1,247 +0,0 @@ -# MXNet.mx - -## Internal - ---- - - -#### _import_ndarray_functions() -Import dynamic functions for NDArrays. The arguments to the functions are typically ordered -as - -```julia -func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) -``` - -unless NDARRAY_ARG_BEFORE_SCALAR is not set. In this case, the scalars are put before the input arguments: - -```julia -func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) -``` - -If `ACCEPT_EMPTY_MUTATE_TARGET` is set. An overloaded function without the output arguments will also be defined: - -```julia -func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) -``` - -Upon calling, the output arguments will be automatically initialized with empty NDArrays. - -Those functions always return the output arguments. If there is only one output (the typical situation), that -object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. 
- - -*source:* -[MXNet/src/ndarray.jl:468](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L468) - ---- - - -#### convert{T<:Real}(t::Type{Array{T<:Real, N}}, arr::MXNet.mx.NDArray) -Convert copy: NDArray -> Julia Array - -*source:* -[MXNet/src/ndarray.jl:237](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L237) - ---- - - -#### copy!(dst::Array{Float32, N}, src::MXNet.mx.NDArray) -Copy data from NDArray to Julia Array - -*source:* -[MXNet/src/ndarray.jl:201](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L201) - ---- - - -#### copy!(dst::MXNet.mx.NDArray, src::MXNet.mx.NDArray) -Copy data between NDArrays - -*source:* -[MXNet/src/ndarray.jl:189](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L189) - ---- - - -#### copy!{T<:Real}(dst::MXNet.mx.NDArray, src::Array{T<:Real, N}) -Copy data from Julia Array to NDArray - -*source:* -[MXNet/src/ndarray.jl:209](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L209) - ---- - - -#### copy(arr::MXNet.mx.NDArray) -Create copy: NDArray -> Julia Array - -*source:* -[MXNet/src/ndarray.jl:219](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L219) - ---- - - -#### copy(arr::MXNet.mx.NDArray, ctx::MXNet.mx.Context) -Create copy: NDArray -> NDArray in a given context - -*source:* -[MXNet/src/ndarray.jl:225](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L225) - ---- - - -#### copy{T<:Real}(arr::Array{T<:Real, N}, ctx::MXNet.mx.Context) -Create copy: Julia Array -> NDArray in a given context - -*source:* -[MXNet/src/ndarray.jl:231](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L231) - ---- - - -#### getindex(arr::MXNet.mx.NDArray, ::Colon) -Shortcut for `slice`. 
**NOTE** the behavior for Julia's built-in index slicing is to create a -copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. - - -*source:* -[MXNet/src/ndarray.jl:177](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L177) - ---- - - -#### load(filename::AbstractString, ::Type{MXNet.mx.NDArray}) -Load NDArrays from binary file. - -**Parameters**: - -* `filename`: the path of the file to load. It could be S3 or HDFS address - if the `libmxnet` is built with the corresponding component enabled. Examples - - * `s3://my-bucket/path/my-s3-ndarray` - * `hdfs://my-bucket/path/my-hdfs-ndarray` - * `/path-to/my-local-ndarray` - -**Returns**: - - Either `Dict{Base.Symbol, NDArray}` or `Vector{NDArray}`. - - -*source:* -[MXNet/src/ndarray.jl:384](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L384) - ---- - - -#### ones{N}(shape::NTuple{N, Int64}) -Create NDArray and initialize with 1 - -*source:* -[MXNet/src/ndarray.jl:118](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L118) - ---- - - -#### save(filename::AbstractString, data::MXNet.mx.NDArray) -Save NDarrays to binary file. - -**Parameters**: - -* `filename`: path to the binary file to write to. -* `data`: an `NDArray`, or a `Vector{NDArray}` or a `Dict{Base.Symbol, NDArray}`. - - -*source:* -[MXNet/src/ndarray.jl:409](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L409) - ---- - - -#### setindex!(arr::MXNet.mx.NDArray, val::Real, ::Colon) -Assign all elements of an NDArray to a scalar - -*source:* -[MXNet/src/ndarray.jl:158](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L158) - ---- - - -#### size(arr::MXNet.mx.NDArray) -Get the shape of an `NDArray`. Note the shape is converted to Julia convention. 
- So the same piece of memory, in Julia (column-major), with shape (K, M, N), will be of the - shape (N, M, K) in the Python (row-major) binding. - - -*source:* -[MXNet/src/ndarray.jl:84](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L84) - ---- - - -#### slice(arr::MXNet.mx.NDArray, ::Colon) -`slice` create a view into a sub-slice of an `NDArray`. Note only slicing at the slowest -changing dimension is supported. In Julia's column-major perspective, this is the last -dimension. For example, given an `NDArray` of shape (2,3,4), `sub(array, 2:3)` will create -a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is -used in data parallelization to split mini-batch into sub-batches for different devices. - - -*source:* -[MXNet/src/ndarray.jl:137](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L137) - ---- - - -#### zeros{N}(shape::NTuple{N, Int64}) -Create zero-ed NDArray of specific shape - -*source:* -[MXNet/src/ndarray.jl:105](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L105) - ---- - - -#### MXNet.mx.NDArray -Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block -of tensor-based computation. - -**Note** since C/C++ use row-major ordering for arrays while Julia follows a -column-major ordering. To keep things consistent, we keep the underlying data -in their original layout, but use *language-native* convention when we talk -about shapes. For example, a mini-batch of 100 MNIST images is a tensor of -C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory -have shape (28,28,1,100). 
- - -*source:* -[MXNet/src/ndarray.jl:32](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L32) - ---- - - -#### @inplace(stmt) -Julia does not support re-definiton of `+=` operator (like `__iadd__` in python), -When one write `a += b`, it gets translated to `a = a+b`. `a+b` will allocate new -memory for the results, and the newly allocated `NDArray` object is then assigned -back to a, while the original contents in a is discarded. This is very inefficient -when we want to do inplace update. - -This macro is a simple utility to implement this behavior. Write - -```julia -@mx.inplace a += b -``` - -will translate into - -```julia -mx.add_to!(a, b) -``` - -which will do inplace adding of the contents of b into a. - - -*source:* -[MXNet/src/ndarray.jl:266](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/ndarray.jl#L266) - diff --git a/docs/api/symbol.md b/docs/api/symbol.md deleted file mode 100644 index a17f0c261fa2..000000000000 --- a/docs/api/symbol.md +++ /dev/null @@ -1,73 +0,0 @@ -# MXNet.mx - -## Internal - ---- - - -#### Group(symbols::MXNet.mx.Symbol...) -Create a symbol that groups symbols together - -*source:* -[MXNet/src/symbol.jl:77](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L77) - ---- - - -#### Variable(name::Union{AbstractString, Symbol}) -Create a symbolic variable with the given name - -*source:* -[MXNet/src/symbol.jl:70](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L70) - ---- - - -#### from_json(repr::AbstractString, ::Type{MXNet.mx.Symbol}) -Load Symbol from a JSON string representation. - -*source:* -[MXNet/src/symbol.jl:240](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L240) - ---- - - -#### get_internals(self::MXNet.mx.Symbol) -Get a new grouped symbol whose output contains all the internal outputs of this symbol. 
- -*source:* -[MXNet/src/symbol.jl:63](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L63) - ---- - - -#### list_auxiliary_states(self::MXNet.mx.Symbol) -List all auxiliary states in the symbool. - -Auxiliary states are special states of symbols that do not corresponds to an argument, -and do not have gradient. But still be useful for the specific operations. -A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. -Most operators do not have Auxiliary states. - - -*source:* -[MXNet/src/symbol.jl:58](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L58) - ---- - - -#### load(filename::AbstractString, ::Type{MXNet.mx.Symbol}) -Load Symbol from a JSON file. - -*source:* -[MXNet/src/symbol.jl:247](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L247) - ---- - - -#### to_json(self::MXNet.mx.Symbol) -Save Symbol into a JSON string - -*source:* -[MXNet/src/symbol.jl:233](https://github.com/dmlc/MXNet.jl/tree/7fa151104fb51d7134da60a5084dfa0d240515f0/src/symbol.jl#L233) - diff --git a/docs/build.jl b/docs/build.jl deleted file mode 100644 index 9576e4112c38..000000000000 --- a/docs/build.jl +++ /dev/null @@ -1,10 +0,0 @@ -using MXNet -using Lexicon - -config = Config(md_permalink = false, mathjax = true) - -doc = Lexicon.metadata(MXNet.mx) -for mod in [:ndarray, :symbol] - save("api/$mod.md", MIME("text/md"), filter(doc, files=["$mod.jl"]), config) -end - diff --git a/docs/conf.py b/docs/conf.py new file mode 100644 index 000000000000..ca57eed31146 --- /dev/null +++ b/docs/conf.py @@ -0,0 +1,277 @@ +# -*- coding: utf-8 -*- +# +# MXNet documentation build configuration file, created by +# sphinx-quickstart on Thu Nov 13 00:43:40 2014. +# +# This file is execfile()d with the current directory set to its +# containing dir. 
+# +# Note that not all possible configuration values are present in this +# autogenerated file. +# +# All configuration values have a default; values that are commented out +# serve to show the default. + +import sys +import os + +# If extensions (or modules to document with autodoc) are in another directory, +# add these directories to sys.path here. If the directory is relative to the +# documentation root, use os.path.abspath to make it absolute, like shown here. +#sys.path.insert(0, os.path.abspath('.')) +sys.path.insert(0, os.path.abspath("sphinx")) +import julia + +# -- General configuration ------------------------------------------------ + +# If your documentation needs a minimal Sphinx version, state it here. +#needs_sphinx = '1.0' + +# Add any Sphinx extension module names here, as strings. They can be +# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom +# ones. +extensions = [ + 'sphinx.ext.mathjax', + 'julia' +] + +# Add any paths that contain templates here, relative to this directory. +templates_path = ['_templates'] + +# The suffix of source filenames. +source_suffix = '.rst' + +# The encoding of source files. +#source_encoding = 'utf-8-sig' + +# The master toctree document. +master_doc = 'index' + +# General information about the project. +project = u'MXNet' +copyright = u'2015, pluskid' + +# The version info for the project you're documenting, acts as replacement for +# |version| and |release|, also used in various other places throughout the +# built documents. +# +# The short X.Y version. +version = '0.0.3' +# The full version, including alpha/beta/rc tags. +release = '0.0.3' + +# The language for content autogenerated by Sphinx. Refer to documentation +# for a list of supported languages. +#language = None + +# There are two options for replacing |today|: either, you set today to some +# non-false value, then it is used: +#today = '' +# Else, today_fmt is used as the format for a strftime call. 
+#today_fmt = '%B %d, %Y' + +# List of patterns, relative to source directory, that match files and +# directories to ignore when looking for source files. +exclude_patterns = ['_build'] + +# The reST default role (used for this markup: `text`) to use for all +# documents. +#default_role = None + +# If true, '()' will be appended to :func: etc. cross-reference text. +#add_function_parentheses = True + +# If true, the current module name will be prepended to all description +# unit titles (such as .. function::). +#add_module_names = True + +# If true, sectionauthor and moduleauthor directives will be shown in the +# output. They are ignored by default. +#show_authors = False + +# The name of the Pygments (syntax highlighting) style to use. +pygments_style = 'sphinx' + +# A list of ignored prefixes for module index sorting. +#modindex_common_prefix = [] + +primary_domain = 'jl' +highlight_language = 'julia' + +# If true, keep warnings as "system message" paragraphs in the built documents. +#keep_warnings = False + + +# -- Options for HTML output ---------------------------------------------- + +# The theme to use for HTML and HTML Help pages. See the documentation for +# a list of builtin theme +html_theme = 'default' + +import os +on_rtd = os.environ.get('READTHEDOCS', None) == 'True' + +if not on_rtd: # only import and set the theme if we're building docs locally + try: + import sphinx_rtd_theme + html_theme = "sphinx_rtd_theme" + html_theme_path = [sphinx_rtd_theme.get_html_theme_path()] + except: + pass + +# Theme options are theme-specific and customize the look and feel of a theme +# further. For a list of options available for each theme, see the +# documentation. +#html_theme_options = {} + +# Add any paths that contain custom themes here, relative to this directory. +#html_theme_path = [] + +# The name for this set of Sphinx documents. If None, it defaults to +# "<project> v<release> documentation". +#html_title = None + +# A shorter title for the navigation bar.
Default is the same as html_title. +#html_short_title = None + +# The name of an image file (relative to this directory) to place at the top +# of the sidebar. +#html_logo = None + +# The name of an image file (within the static path) to use as favicon of the +# docs. This file should be a Windows icon file (.ico) being 16x16 or 32x32 +# pixels large. +#html_favicon = None + +# Add any paths that contain custom static files (such as style sheets) here, +# relative to this directory. They are copied after the builtin static files, +# so a file named "default.css" will overwrite the builtin "default.css". +html_static_path = ['_static'] + +# Add any extra paths that contain custom files (such as robots.txt or +# .htaccess) here, relative to this directory. These files are copied +# directly to the root of the documentation. +#html_extra_path = [] + +# If not '', a 'Last updated on:' timestamp is inserted at every page bottom, +# using the given strftime format. +#html_last_updated_fmt = '%b %d, %Y' + +# If true, SmartyPants will be used to convert quotes and dashes to +# typographically correct entities. +#html_use_smartypants = True + +# Custom sidebar templates, maps document names to template names. +#html_sidebars = {} + +# Additional templates that should be rendered to pages, maps page names to +# template names. +#html_additional_pages = {} + +# If false, no module index is generated. +#html_domain_indices = True + +# If false, no index is generated. +#html_use_index = True + +# If true, the index is split into individual pages for each letter. +#html_split_index = False + +# If true, links to the reST sources are added to the pages. +#html_show_sourcelink = True + +# If true, "Created using Sphinx" is shown in the HTML footer. Default is True. +#html_show_sphinx = True + +# If true, "(C) Copyright ..." is shown in the HTML footer. Default is True. 
+#html_show_copyright = True + +# If true, an OpenSearch description file will be output, and all pages will +# contain a tag referring to it. The value of this option must be the +# base URL from which the finished HTML is served. +#html_use_opensearch = '' + +# This is the file name suffix for HTML files (e.g. ".xhtml"). +#html_file_suffix = None + +# Output file base name for HTML help builder. +htmlhelp_basename = 'MXNetdoc' + + +# -- Options for LaTeX output --------------------------------------------- + +latex_elements = { +# The paper size ('letterpaper' or 'a4paper'). +#'papersize': 'letterpaper', + +# The font size ('10pt', '11pt' or '12pt'). +#'pointsize': '10pt', + +# Additional stuff for the LaTeX preamble. +#'preamble': '', +} + +# Grouping the document tree into LaTeX files. List of tuples +# (source start file, target name, title, +# author, documentclass [howto, manual, or own class]). +latex_documents = [ + ('index', 'MXNet.tex', u'MXNet Documentation', + u'pluskid', 'manual'), +] + +# The name of an image file (relative to this directory) to place at the top of +# the title page. +#latex_logo = None + +# For "manual" documents, if this is true, then toplevel headings are parts, +# not chapters. +#latex_use_parts = False + +# If true, show page references after internal links. +#latex_show_pagerefs = False + +# If true, show URL addresses after external links. +#latex_show_urls = False + +# Documents to append as an appendix to all manuals. +#latex_appendices = [] + +# If false, no module index is generated. +#latex_domain_indices = True + + +# -- Options for manual page output --------------------------------------- + +# One entry per manual page. List of tuples +# (source start file, name, description, authors, manual section). +man_pages = [ + ('index', 'mxnet', u'MXNet Documentation', + [u'pluskid'], 1) +] + +# If true, show URL addresses after external links. 
+#man_show_urls = False + + +# -- Options for Texinfo output ------------------------------------------- + +# Grouping the document tree into Texinfo files. List of tuples +# (source start file, target name, title, author, +# dir menu entry, description, category) +texinfo_documents = [ + ('index', 'MXNet', u'MXNet Documentation', + u'pluskid', 'MXNet', 'One line description of project.', + 'Miscellaneous'), +] + +# Documents to append as an appendix to all manuals. +#texinfo_appendices = [] + +# If false, no module index is generated. +#texinfo_domain_indices = True + +# How to display URL addresses: 'footnote', 'no', or 'inline'. +#texinfo_show_urls = 'footnote' + +# If true, do not generate a @detailmenu in the "Top" node's menu. +#texinfo_no_detailmenu = False diff --git a/docs/index.md b/docs/index.md deleted file mode 100644 index c411cc86fd95..000000000000 --- a/docs/index.md +++ /dev/null @@ -1,8 +0,0 @@ -# MXNet.jl - -MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of features include: - -* Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. -* Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. - -To install MXNet.jl, please follow the [installaton guide](user-guide/install.md). See the navigation menu in the sidebar for an [overview](user-guide/overview.md) of MXNet.jl and tutorials on training neural networks in MXNet.jl. diff --git a/docs/index.rst b/docs/index.rst new file mode 100644 index 000000000000..8d0890e0c6a0 --- /dev/null +++ b/docs/index.rst @@ -0,0 +1,34 @@ +%%%%%%%%%%%%%%%%%%% +MXNet Documentation +%%%%%%%%%%%%%%%%%%% + +`MXNet.jl <https://github.com/dmlc/MXNet.jl>`_ is the `Julia +<http://julialang.org/>`_ package of `dmlc/mxnet +<https://github.com/dmlc/mxnet>`_. MXNet.jl brings flexible and efficient GPU +computing and state-of-the-art deep learning to Julia. 
Some highlights of its features +include: + +- Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. +- Flexible symbolic manipulation to compose and construct state-of-the-art deep learning models. + + +.. toctree:: + :maxdepth: 2 + :caption: Tutorials + + tutorial/mnist + +.. toctree:: + :maxdepth: 2 + :caption: User's Guide + + user-guide/install + user-guide/overview + +Indices and tables +================== + +* :ref:`genindex` +* :ref:`modindex` +* :ref:`search` + diff --git a/docs/sphinx/julia.py b/docs/sphinx/julia.py new file mode 100644 index 000000000000..49d6af95b545 --- /dev/null +++ b/docs/sphinx/julia.py @@ -0,0 +1,23 @@ +# Julia domain for Sphinx (stolen from StrPack.jl) +# http://sphinx.pocoo.org/domains.html + +import re +import sphinx.domains.python + +sphinx.domains.python.py_sig_re = re.compile( + r'''^ ([\w.]*\.)? # class name(s) + ([^\s(]+) \s* # thing name + (?: \((.*)\) # optional: arguments + (?:\s* -> \s* (.*))? # return annotation + )? $ # and nothing more + ''', re.VERBOSE | re.UNICODE) + +class JuliaDomain(sphinx.domains.python.PythonDomain): + """Julia language domain.""" + name = 'jl' + label = 'Julia' + +JuliaDomain.directives['type'] = JuliaDomain.directives['class'] + +def setup(app): + app.add_domain(JuliaDomain) diff --git a/docs/tutorial/mnist.rst b/docs/tutorial/mnist.rst new file mode 100644 index 000000000000..2e5d087a5242 --- /dev/null +++ b/docs/tutorial/mnist.rst @@ -0,0 +1,252 @@ +Digit Recognition on MNIST +========================== + +In this tutorial, we will work through examples of training a simple multi-layer +perceptron and then a convolutional neural network (the LeNet architecture) on +the `MNIST handwritten digit dataset <http://yann.lecun.com/exdb/mnist/>`_. The +code for this tutorial can be found in `examples/mnist +<https://github.com/dmlc/MXNet.jl/tree/master/examples/mnist>`_. + +Simple 3-layer MLP +------------------ + +This is a tiny 3-layer MLP that can easily be trained on a CPU. The script starts with + +.. 
code-block:: julia + + using MXNet + +to load the ``MXNet`` module. Then we are ready to define the network +architecture via the :doc:`symbolic API </user-guide/overview>`. We start with +a placeholder ``data`` symbol, + +.. code-block:: julia + + data = mx.Variable(:data) + +and then cascade fully-connected layers and activation functions: + +.. code-block:: julia + + fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) + act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) + fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) + act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) + fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) + +Note that in each composition we take the previous symbol as the ``data`` argument, forming a feedforward chain. The architecture looks like + +.. code-block:: julia + + Input --> 128 units (ReLU) --> 64 units (ReLU) --> 10 units + +where the last 10 units correspond to the 10 output classes (digits 0,...,9). We +then add a final ``Softmax`` operation to turn the 10-dimensional prediction into proper probability values for the 10 classes: + +.. code-block:: julia + + mlp = mx.Softmax(data = fc3, name=:softmax) + +As we can see, the MLP is just a chain of layers. For this case, we can also use +the ``mx.chain`` macro. The same architecture above can be defined as + +.. code-block:: julia + + mlp = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=128) => + mx.Activation(name=:relu1, act_type=:relu) => + mx.FullyConnected(name=:fc2, num_hidden=64) => + mx.Activation(name=:relu2, act_type=:relu) => + mx.FullyConnected(name=:fc3, num_hidden=10) => + mx.Softmax(name=:softmax) + +After defining the architecture, we are ready to load the MNIST data. MXNet.jl +provides built-in data providers for the MNIST dataset, which can automatically +download the dataset into ``Pkg.dir("MXNet")/data/mnist`` if necessary. 
We wrap +the code to construct the data provider into ``mnist-data.jl`` so that it can be shared by both the MLP example and the LeNet ConvNets example. + +.. code-block:: julia + + batch_size = 100 + include("mnist-data.jl") + train_provider, eval_provider = get_mnist_providers(batch_size) + +If you need to write your own data providers for a customized data format, please refer to **TODO**: pointer to data provider API. + +Given the architecture and data, we can instantiate a *model* to do the actual +training. ``mx.FeedForward`` is the built-in model that is suitable for most feed-forward architectures. When constructing the model, we also specify the *context* on which the computation should be carried out. Because this is a really tiny MLP, we will just run on a single CPU device. + +.. code-block:: julia + + model = mx.FeedForward(mlp, context=mx.cpu()) + +You can use ``mx.gpu()`` instead; or, if a list of devices (e.g. ``[mx.gpu(0), +mx.gpu(1)]``) is provided, data parallelization will be used automatically. But for this tiny example, using a GPU device might not help. + +The last thing we need to specify is the optimization algorithm (a.k.a. *optimizer*) to use. We use the basic SGD with a fixed learning rate of 0.1 and a momentum of 0.9: + +.. code-block:: julia + + optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) + +Now we can do the training. Here the ``n_epoch`` parameter specifies that we +want to train for 20 epochs. We also supply ``eval_data`` to monitor the accuracy on the validation set. + +.. code-block:: julia + + mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) + +Here is a sample output: + +.. code-block:: text + + INFO: Start training on [CPU0] + INFO: Initializing parameters... + INFO: Creating KVStore... + INFO: == Epoch 001 ========== + INFO: ## Training summary + INFO: :accuracy = 0.7554 + INFO: time = 1.3165 seconds + INFO: ## Validation summary + INFO: :accuracy = 0.9502 + ... 
+ INFO: == Epoch 020 ========== + INFO: ## Training summary + INFO: :accuracy = 0.9949 + INFO: time = 0.9287 seconds + INFO: ## Validation summary + INFO: :accuracy = 0.9775 + + +Convolutional Neural Networks +----------------------------- + +In the second example, we show a slightly more complicated architecture that +involves convolution and pooling. This architecture for MNIST is usually +called [LeNet]_. The first part of the architecture is listed below: + +.. code-block:: julia + + # input + data = mx.Variable(:data) + + # first conv + conv1 = @mx.chain mx.Convolution(data=data, kernel=(5,5), num_filter=20) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) + + # second conv + conv2 = @mx.chain mx.Convolution(data=conv1, kernel=(5,5), num_filter=50) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) + +We basically defined two convolution modules. Each convolution module is +actually a chain of ``Convolution``, ``tanh`` activation and then max ``Pooling`` operations. + +Each sample in the MNIST dataset is a 28x28 single-channel grayscale image. In +the tensor format used by ``NDArray``, a batch of 100 samples is a tensor of +shape ``(28,28,1,100)``. The convolution and pooling operate along the spatial +axes, so ``kernel=(5,5)`` indicates a square region of width 5 and height 5. +The rest of the architecture is as follows: + +.. code-block:: julia + + # first fully-connected + fc1 = @mx.chain mx.Flatten(data=conv2) => + mx.FullyConnected(num_hidden=500) => + mx.Activation(act_type=:tanh) + + # second fully-connected + fc2 = mx.FullyConnected(data=fc1, num_hidden=10) + + # softmax loss + lenet = mx.Softmax(data=fc2, name=:softmax) + +Note that a fully-connected operator expects the input to be a matrix. However, the +results from spatial convolution and pooling are 4D tensors. 
So we explicitly +used a ``Flatten`` operator to flatten the tensor, before connecting it to the +``FullyConnected`` operator. + +The remaining steps are the same as in the previous MLP example. As before, we can now load the MNIST dataset: + +.. code-block:: julia + + batch_size = 100 + include("mnist-data.jl") + train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) + +Note that we specified ``flat=false`` to tell the data provider to provide 4D tensors instead of 2D matrices, because the convolution operators need correct spatial shape information. We then construct a feedforward model on a GPU, and train it. + +.. code-block:: julia + + #-------------------------------------------------------------------------------- + # fit model + model = mx.FeedForward(lenet, context=mx.gpu()) + + # optimizer + optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) + + # fit parameters + mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) + +And here is a sample of the output: + +.. code-block:: text + + INFO: == Epoch 001 ========== + INFO: ## Training summary + INFO: :accuracy = 0.6750 + INFO: time = 4.9814 seconds + INFO: ## Validation summary + INFO: :accuracy = 0.9712 + ... + INFO: == Epoch 020 ========== + INFO: ## Training summary + INFO: :accuracy = 1.0000 + INFO: time = 4.0086 seconds + INFO: ## Validation summary + INFO: :accuracy = 0.9915 + + +.. [LeNet] LeCun, Y.; Bottou, L.; Bengio, Y.; Haffner, P., + *Gradient-based learning applied to document recognition*, + Proceedings of the IEEE, vol.86, no.11, pp.2278-2324, + Nov 1998. + +Predicting with a trained model +------------------------------- + +Predicting with a trained model is very simple. By calling ``mx.predict`` with the +model and a data provider, we get the model output as a Julia Array: + +.. 
code-block:: julia + + probs = mx.predict(model, eval_provider) + +The following code shows a naive way of collecting all the labels from the data +provider and computing the prediction accuracy manually: + +.. code-block:: julia + + # collect all labels from eval data + labels = Array[] + for batch in eval_provider + push!(labels, copy(mx.get_label(batch))) + end + labels = cat(1, labels...) + + # Now we compute the accuracy + correct = 0 + for i = 1:length(labels) + # labels are 0...9 + if indmax(probs[:,i]) == labels[i]+1 + correct += 1 + end + end + println(mx.format("Accuracy on eval set: {1:.2f}%", 100correct/length(labels))) + +Alternatively, when the dataset is huge, one can provide a callback to +``mx.predict``; the callback function will then be invoked with the outputs of +each mini-batch. The callback could, for example, write the data to disk for +future inspection. In this case, no value is returned from ``mx.predict``. See +also **TODO** provide link to prediction API. diff --git a/docs/tutorials/mnist.md b/docs/tutorials/mnist.md deleted file mode 100644 index ecf7bab8f631..000000000000 --- a/docs/tutorials/mnist.md +++ /dev/null @@ -1,150 +0,0 @@ -In this tutorial, we will work through examples of training a simple multi-layer perceptron and then a convolutional neural network (the LeNet architecture) on the [MNIST handwritten digit dataset](http://yann.lecun.com/exdb/mnist/). The code for this tutorial could be found in [`Pkg.dir("MXNet")`/examples/mnist/](https://github.com/dmlc/MXNet.jl/tree/master/examples/mnist). - -# Simple 3-layer MLP - -This is a tiny 3-layer MLP that could be easily trained on CPU. The script starts with -```julia -using MXNet -``` -to load the `MXNet` module. Then we are ready to define the network architecture via the [symbolic API](../user-guide/overview.md#symbols-and-composition). 
We start with a placeholder `data` symbol, -```julia -data = mx.Variable(:data) -``` -and then cascading fully-connected layers and activation functions: -```julia -fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) -act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) -fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) -act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) -fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) -``` -Note each composition we take the previous symbol as the `data` argument, forming a feedforward chain. The architecture looks like -``` -Input --> 128 units (ReLU) --> 64 units (ReLU) --> 10 units -``` -where the last 10 units correspond to the 10 output classes (digits 0,...,9). We then add a final `Softmax` operation to turn the 10-dimensional prediction to proper probability values for the 10 classes: -```julia -mlp = mx.Softmax(data = fc3, name=:softmax) -``` -As we can see, the MLP is just a chain of layers. For this case, we can also use the `mx.chain` macro. The same architecture above can be defined as -```julia -mlp = @mx.chain mx.Variable(:data) => - mx.FullyConnected(name=:fc1, num_hidden=128) => - mx.Activation(name=:relu1, act_type=:relu) => - mx.FullyConnected(name=:fc2, num_hidden=64) => - mx.Activation(name=:relu2, act_type=:relu) => - mx.FullyConnected(name=:fc3, num_hidden=10) => - mx.Softmax(name=:softmax) -``` - -After defining the architecture, we are ready to load the MNIST data. MXNet.jl provide built-in data providers for the MNIST dataset, which could automatically download the dataset into `Pkg.dir("MXNet")/data/mnist` if necessary. We wrap the code to construct the data provider into `mnist-data.jl` so that it could be shared by both the MLP example and the LeNet ConvNets example. 
-```julia -batch_size = 100 -include("mnist-data.jl") -train_provider, eval_provider = get_mnist_providers(batch_size) -``` -If you need to write your own data providers for customized data format, please refer to **TODO**: pointer to data provider API. - -Given the architecture and data, we can instantiate an *model* to do the actual training. `mx.FeedForward` is the built-in model that is suitable for most feed-forward architectures. When constructing the model, we also specify the *context* on which the computation should be carried out. Because this is a really tiny MLP, we will just run on a single CPU device. -```julia -model = mx.FeedForward(mlp, context=mx.cpu()) -``` -You can use a `mx.gpu()` or if a list of devices (e.g. `[mx.gpu(0), mx.gpu(1)]`) is provided, data-parallelization will be used automatically. But for this tiny example, using a GPU device might not help. - -The last thing we need to specify is the optimization algorithm (a.k.a. *optimizer*) to use. We use the basic SGD with a fixed learning rate 0.1 and momentum 0.9: -```julia -optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) -``` -Now we can do the training. Here the `n_epoch` parameter specifies that we want to train for 20 epochs. We also supply a `eval_data` to monitor validation accuracy on the validation set. -```julia -mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) -``` -Here is a sample output -``` -INFO: Start training on [CPU0] -INFO: Initializing parameters... -INFO: Creating KVStore... -INFO: == Epoch 001 ========== -INFO: ## Training summary -INFO: :accuracy = 0.7554 -INFO: time = 1.3165 seconds -INFO: ## Validation summary -INFO: :accuracy = 0.9502 -... 
-INFO: == Epoch 020 ========== -INFO: ## Training summary -INFO: :accuracy = 0.9949 -INFO: time = 0.9287 seconds -INFO: ## Validation summary -INFO: :accuracy = 0.9775 -``` - -# Convolutional Neural Networks - -In the second example, we show a slightly more complicated architecture that involves convolution and pooling. This architecture for the MNIST is usually called the *LeNet*. The first part of the architecture is listed below: -```julia -# input -data = mx.Variable(:data) - -# first conv -conv1 = @mx.chain mx.Convolution(data=data, kernel=(5,5), num_filter=20) => - mx.Activation(act_type=:tanh) => - mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) - -# second conv -conv2 = @mx.chain mx.Convolution(data=conv1, kernel=(5,5), num_filter=50) => - mx.Activation(act_type=:tanh) => - mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) -``` -We basically defined two convolution modules. Each convolution module is actually a chain of `Convolution`, `tanh` activation and then max `Pooling` operations. - -Each sample in the MNIST dataset is a 28x28 single-channel grayscale image. In the tensor format used by `NDArray`, a batch of 100 samples is a tensor of shape `(28,28,1,100)`. The convolution and pooling operates in the spatial axis, so `kernel=(5,5)` indicate a square region of 5-width and 5-height. -The rest of the architecture follows as: -```julia -# first fully-connected -fc1 = @mx.chain mx.Flatten(data=conv2) => - mx.FullyConnected(num_hidden=500) => - mx.Activation(act_type=:tanh) - -# second fully-connected -fc2 = mx.FullyConnected(data=fc1, num_hidden=10) - -# softmax loss -lenet = mx.Softmax(data=fc2, name=:softmax) -``` -Note a fully-connected operator expects the input to be a matrix. However, the results from spatial convolution and pooling are 4D tensors. So we explicitly used a `Flatten` operator to flat the tensor, before connecting it to the `FullyConnected` operator. - -The rest of the network is the same as the previous MLP example. 
As before, we can now load the MNIST dataset: -```julia -batch_size = 100 -include("mnist-data.jl") -train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) -``` -Note we specified `flat=false` to tell the data provider to provide 4D tensors instead of 2D matrices because the convolution operators needs correct spatial shape information. We then construct a feedforward model on GPU, and train it. -```julia -#-------------------------------------------------------------------------------- -# fit model -model = mx.FeedForward(lenet, context=mx.gpu()) - -# optimizer -optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) - -# fit parameters -mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) -``` -And here is a sample of running outputs: -``` -INFO: == Epoch 001 ========== -INFO: ## Training summary -INFO: :accuracy = 0.6750 -INFO: time = 4.9814 seconds -INFO: ## Validation summary -INFO: :accuracy = 0.9712 -... -INFO: == Epoch 020 ========== -INFO: ## Training summary -INFO: :accuracy = 1.0000 -INFO: time = 4.0086 seconds -INFO: ## Validation summary -INFO: :accuracy = 0.9915 -``` diff --git a/docs/user-guide/install.md b/docs/user-guide/install.md deleted file mode 100644 index eb4e1ecec80d..000000000000 --- a/docs/user-guide/install.md +++ /dev/null @@ -1,29 +0,0 @@ -# Automatic Installation - -To install MXNet.jl, simply type -```jl -Pkg.add("MXNet") -``` -in the Julia REPL. MXNet.jl is built on top of [libmxnet](https://github.com/dmlc/mxnet). Upon installation, Julia will try to automatically download and build libmxnet. - -The libmxnet source is downloaded to `Pkg.dir("MXNet")/deps/src/mxnet`. The automatic build is using default configurations, with OpenCV, CUDA disabled. -If the compilation failed due to unresolved dependency, or if you want to customize the build, it is recommended to compile and install libmxnet manually. Please see [below](#manual-compilation) for more details. 
- -To use the latest git version of MXNet.jl, use the following command instead -```jl -Pkg.checkout("MXNet") -``` - -# Manual Compilation - -It is possible to compile libmxnet separately and point MXNet.jl to a the existing library in case automatic compilation fails due to unresolved dependencies in an un-standard environment; Or when one want to work with a seperate, maybe customized libmxnet. - -To build libmxnet, please refer to [the installation guide of libmxnet](http://mxnet.readthedocs.org/en/latest/build.html). After successfully installing libmxnet, set the `MXNET_HOME` environment variable to the location of libmxnet. In other words, the compiled `libmxnet.so` should be found in `$MXNET_HOME/lib`. - -When the `MXNET_HOME` environment variable is detected and the corresponding `libmxnet.so` could be loaded successfully, MXNet.jl will skip automatic building during installation and use the specified libmxnet instead. - -Basically, MXNet.jl will search `libmxnet.so` or `libmxnet.dll` in the following paths (and in that order): - -* `$MXNET_HOME/lib`: customized libmxnet builds -* `Pkg.dir("MXNet")/deps/usr/lib`: automatic builds -* Any system wide library search path diff --git a/docs/user-guide/install.rst b/docs/user-guide/install.rst new file mode 100644 index 000000000000..43f882928d39 --- /dev/null +++ b/docs/user-guide/install.rst @@ -0,0 +1,54 @@ +Installation Guide +================== + +Automatic Installation +---------------------- + +To install MXNet.jl, simply type + +.. code-block:: julia + + Pkg.add("MXNet") + +in the Julia REPL. To use the latest git version of MXNet.jl, use the following command instead: + +.. code-block:: julia + + Pkg.checkout("MXNet") + +MXNet.jl is built on top of `libmxnet +<https://github.com/dmlc/mxnet>`_. Upon installation, Julia will try to +automatically download and build libmxnet. + +The libmxnet source is downloaded to ``Pkg.dir("MXNet")/deps/src/mxnet``. The +automatic build uses the default configuration, with OpenCV and CUDA disabled. 
+If the compilation fails due to unresolved dependencies, or if you want to +customize the build, it is recommended to compile and install libmxnet manually. +Please see `Manual Compilation`_ below for more details. + + +Manual Compilation +------------------ + +It is possible to compile libmxnet separately and point MXNet.jl to the existing library, either when automatic compilation fails due to unresolved dependencies in a non-standard environment, or when one wants to work with a separate, possibly customized libmxnet. + +To build libmxnet, please refer to `the installation guide of libmxnet +<http://mxnet.readthedocs.org/en/latest/build.html>`_. After successfully +installing libmxnet, set the ``MXNET_HOME`` environment variable to the location +of libmxnet. In other words, the compiled ``libmxnet.so`` should be found in +``$MXNET_HOME/lib``. + +.. note:: + + The constant ``MXNET_HOME`` is pre-compiled in the MXNet.jl package cache. If you + update the environment variable after installing MXNet.jl, make sure to + update the pre-compilation cache by running ``Base.compilecache("MXNet")``. + +When the ``MXNET_HOME`` environment variable is detected and the corresponding +``libmxnet.so`` can be loaded successfully, MXNet.jl will skip automatic building during installation and use the specified libmxnet instead. + +Basically, MXNet.jl will search for ``libmxnet.so`` or ``libmxnet.dll`` in the following paths (and in that order): + +* ``$MXNET_HOME/lib``: customized libmxnet builds +* ``Pkg.dir("MXNet")/deps/usr/lib``: automatic builds +* Any system-wide library search path diff --git a/docs/user-guide/overview.md b/docs/user-guide/overview.md deleted file mode 100644 index 7689b3fba921..000000000000 --- a/docs/user-guide/overview.md +++ /dev/null @@ -1,267 +0,0 @@ -# MXNet.jl Namespace - -Most the functions and types in MXNet.jl are organized in a flat namespace. Because many some functions are conflicting with existing names in the Julia Base module, we wrap them all in a `mx` module. 
The convention of accessing the MXNet.jl interface is the to use the `mx.` prefix explicitly: -```julia -using MXNet - -x = mx.zeros(2,3) # MXNet NDArray -y = zeros(eltype(x), size(x)) # Julia Array -copy!(y, x) # Overloaded function in Julia Base -z = mx.ones(size(x), mx.gpu()) # MXNet NDArray on GPU -mx.copy!(z, y) # Same as copy!(z, y) -``` -Note functions like `size`, `copy!` that is extensively overloaded for various types works out of the box. But functions like `zeros` and `ones` will be ambiguous, so we always use the `mx.` prefix. If you prefer, the `mx.` prefix can be used explicitly for all MXNet.jl functions, including `size` and `copy!` as shown in the last line. - -# High Level Interface - -## Symbols and Composition - -The way we build deep learning models in MXNet.jl is to use the powerful symbolic composition system. It is like [Theano](http://deeplearning.net/software/theano/), except that we avoided long expression compiliation time by providing *larger* neural network related building blocks to guarantee computation performance. See also [this note](http://mxnet.readthedocs.org/en/latest/program_model.html) for the design and trade-off of the MXNet symbolic composition system. - -The basic type is `mx.Symbol`. The following is a trivial example of composing two symbols with the `+` operation. -```julia -A = mx.Variable(:A) -B = mx.Variable(:B) -C = A + B -``` -We get a new *symbol* by composing existing *symbols* by some *operations*. A hierarchical architecture of a deep neural network could be realized by recursive composition. For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of 128 units and a ReLU activation function. 
-```julia -net = mx.Variable(:data) -net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) -net = mx.Activation(data=net, name=:relu1, act_type=:relu) -net = mx.FullyConnected(data=net, name=:fc2, num_hidden=64) -net = mx.Softmax(data=net, name=:out) -``` -Each time we take the previous symbol, and compose with an operation. Unlike the simple `+` example above, the *operations* here are "bigger" ones, that correspond to common computation layers in deep neural networks. - -Each of those operation takes one or more input symbols for composition, with optional hyper-parameters (e.g. `num_hidden`, `act_type`) to further customize the composition results. - -When applying those operations, we can also specify a `name` for the result symbol. This is convenient if we want to refer to this symbol later on. If not supplied, a name will be automatically generated. - -Each symbol takes some arguments. For example, in the `+` case above, to compute the value of `C`, we will need to know the values of the two inputs `A` and `B`. For neural networks, the arguments are primarily two categories: *inputs* and *parameters*. *inputs* are data and labels for the networks, while *parameters* are typically trainable *weights*, *bias*, *filters*. - -When composing symbols, their arguments accumulates. We can list all the arguments by -```julia -julia> mx.list_arguments(net) -6-element Array{Symbol,1}: - :data # Input data, name from the first data variable - :fc1_weight # Weights of the fully connected layer named :fc1 - :fc1_bias # Bias of the layer :fc1 - :fc2_weight # Weights of the layer :fc2 - :fc2_bias # Bias of the layer :fc2 - :out_label # Input label, required by the softmax layer named :out -``` -Note the names of the arguments are generated according to the provided name for each layer. 
We can also specify those names explicitly: -```julia -net = mx.Variable(:data) -w = mx.Variable(:myweight) -net = mx.FullyConnected(data=data, weight=w, name=:fc1, num_hidden=128) -mx.list_arguments(net) -# => -# 3-element Array{Symbol,1}: -# :data -# :myweight -# :fc1_bias -``` -The simple fact is that a `Variable` is just a placeholder `mx.Symbol`. In composition, we can use arbitrary symbols for arguments. For example: -```julia -net = mx.Variable(:data) -net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) -net2 = mx.Variable(:data2) -net2 = mx.FullyConnected(data=net2, name=:net2, num_hidden=128) -mx.list_arguments(net2) -# => -# 3-element Array{Symbol,1}: -# :data2 -# :net2_weight -# :net2_bias -composed_net = net2(data2=net, name=:composed) -mx.list_arguments(composed_net) -# => -# 5-element Array{Symbol,1}: -# :data -# :fc1_weight -# :fc1_bias -# :net2_weight -# :net2_bias -``` -Note we use a composed symbol, `net` as the argument `data2` for `net2` to get a new symbol, which we named `:composed`. It also shows that a symbol itself is a call-able object, which can be invoked to fill in missing arguments and get more complicated symbol compositions. - -## Shape Inference - -Given enough information, the shapes of all arguments in a composed symbol could be inferred automatically. For example, given the input shape, and some hyper-parameters like `num_hidden`, the shapes for the weights and bias in a neural network could be inferred. -```julia -net = mx.Variable(:data) -net = mx.FullyConnected(data=net, name=:fc1, num_hidden=10) -arg_shapes, out_shapes, aux_shapes = mx.infer_shape(net, data=(10, 64)) -``` -The returned shapes corresponds to arguments with the same order as returned by `mx.list_arguments`. The `out_shapes` are shapes for outputs, and `aux_shapes` can be safely ignored for now. 
-```julia -for (n,s) in zip(mx.list_arguments(net), arg_shapes) - println("$n => $s") -end -# => -# data => (10,64) -# fc1_weight => (10,10) -# fc1_bias => (10,) -for (n,s) in zip(mx.list_outputs(net), out_shapes) - println("$n => $s") -end -# => -# fc1_output => (10,64) -``` - -## Binding and Executing - -In order to execute the computation graph specified a composed symbol, we will *bind* the free variables to concrete values, specified as `mx.NDArray`s. This will create an `mx.Executor` on a given `mx.Context`. A context describes the computation devices (CPUs, GPUs, etc.) and an executor will carry out the computation (forward/backward) specified in the corresponding symbolic composition. -```julia -A = mx.Variable(:A) -B = mx.Variable(:B) -C = A .* B -a = mx.ones(3) * 4 -b = mx.ones(3) * 2 -c_exec = mx.bind(C, context=mx.cpu(), args=Dict(:A => a, :B => b)) - -mx.forward(c_exec) -copy(c_exec.outputs[1]) # copy turns NDArray into Julia Array -# => -# 3-element Array{Float32,1}: -# 8.0 -# 8.0 -# 8.0 -``` -For neural networks, it is easier to use `simple_bind`. By providing the shape for input arguments, it will perform a shape inference for the rest of the arguments and create the `NDArray`s automatically. In practice, the binding and executing steps are hidden under the `Model` interface. - -**TODO** Provide pointers to model tutorial and further details about binding and symbolic API. - -# Low Level Interface - -## NDArrays - -`NDArray`s are basic building blocks of the actual computations in MXNet. It is like a Julia `Array` object, with some important differences listed here: - -* The actual data could live on different `Context` (e.g. GPUs). For some contexts, iterating into the elements one by one is very slow, thus indexing into `NDArray` is not supported in general. The easiest way to inspect the contents of an `NDArray` is to use the `copy` function to copy the contents as a Julia `Array`. 
-* Operations on `NDArray`s (including basic arithmetics and neural network related operators) are executed in parallel with automatic dependency tracking to ensure correctness. -* There is no generics in `NDArray`, the `eltype` is always `mx.MX_float`. Because for applications in machine learning, single precision floating point numbers are typical a best choice balancing between precision, speed and portability. Also since libmxnet is designed to support multiple languages as front-ends, it is much simpler to implement with a fixed data type. - -While most of the computation is hidden in libmxnet by operators corresponding to various neural network layers. Getting familiar with the `NDArray` API is useful for implementing `Optimizer`s or customized operators in Julia directly. - -The followings are common ways to create `NDArray` objects: - -* `mx.empty(shape[, context])`: create on uninitialized array of a given shape on a specific device. For example, `mx.empty(2,3)`, `mx.((2,3), mx.gpu(2))`. -* `mx.zeros(shape[, context])` and `mx.ones(shape[, context])`: similar to the Julia's built-in `zeros` and `ones`. -* `mx.copy(jl_arr, context)`: copy the contents of a Julia `Array` to a specific device. - -Most of the convenient functions like `size`, `length`, `ndims`, `eltype` on array objects should work out-of-the-box. Although indexing is not supported, it is possible to take *slices*: -```julia -a = mx.ones(2,3) -b = mx.slice(a, 1:2) -b[:] = 2 -println(copy(a)) -# => -# Float32[2.0 2.0 1.0 -# 2.0 2.0 1.0] -``` -A slice is a sub-region sharing the same memory with the original `NDArray` object. A slice is always a contiguous piece of memory, so only slicing on the *last* dimension is supported. The example above also shows a way to set the contents of an `NDArray`. 
-```julia -a = mx.empty(2,3) -a[:] = 0.5 # set all elements to a scalar -a[:] = rand(size(a)) # set contents with a Julia Array -copy!(a, rand(size(a))) # set value by copying a Julia Array -b = mx.empty(size(a)) -b[:] = a # copying and assignment between NDArrays -``` -Note due to the intrinsic limitation design of the Julia language, a normal assignment -```julia -a = b -``` -does **not** mean copying the contents of `b` to `a`. Instead, it just make the variable `a` pointing to a new object, which is `b`. Similarly, inplace arithmetics does not work as expected: -```julia -a = mx.ones(2) -r = a # keep a reference to a -b = mx.ones(2) -a += b # translates to a = a + b -println(copy(a)) -# => Float32[2.0f0,2.0f0] -println(copy(r)) -# => Float32[1.0f0,1.0f0] -``` -As we can see, `a` has expected value, but instead of inplace updating, a new `NDArray` is created and `a` is set to point to this new object. If we look at `r`, which still reference to the old `a`, its content has not changed. There is currently no way in Julia to overload the operators like `+=` to get customized behavior. - -Instead, you will need to write `a[:] = a+b`, or if you want *real* inplace `+=` operation, MXNet.jl provides a simple macro `@mx.inplace`: -```julia -@mx.inplace a += b -macroexpand(:(@mx.inplace a += b)) -# => :(MXNet.mx.add_to!(a,b)) -``` -As we can see, it translate the `+=` operator to an explicit `add_to!` function call, which invokes into libmxnet to add the contents of `b` into `a` directly. For example, the following is the update rule in the SGD `Optimizer` (both `grad` and `weight` are `NDArray` objects): -```julia -@inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) -``` -Note there is no much magic in `mx.inplace`: it only does a shallow translation. In the SGD update rule example above, the computation like scaling the gradient by `grad_scale` and adding the weight decay all create temporary `NDArray` objects. 
To mitigate this issue, libmxnet has a customized memory allocator designed specifically to handle this kind of situations. The following snippet does a simple benchmark on allocating temp `NDArray`s vs. pre-allocating: -```julia -using Benchmark -using MXNet - -N_REP = 1000 -SHAPE = (128, 64) -CTX = mx.cpu() -LR = 0.1 - -function inplace_op() - weight = mx.zeros(SHAPE, CTX) - grad = mx.ones(SHAPE, CTX) - - # pre-allocate temp objects - grad_lr = mx.empty(SHAPE, CTX) - - for i = 1:N_REP - copy!(grad_lr, grad) - @mx.inplace grad_lr .*= LR - @mx.inplace weight -= grad_lr - end - return weight -end - -function normal_op() - weight = mx.zeros(SHAPE, CTX) - grad = mx.ones(SHAPE, CTX) - - for i = 1:N_REP - weight[:] -= LR * grad - end - return weight -end - -# make sure the results are the same -@assert(maximum(abs(copy(normal_op() - inplace_op()))) < 1e-6) - -println(compare([inplace_op, normal_op], 100)) -``` -The comparison on my laptop shows that `normal_op` while allocating a lot of temp `NDArray`s in the loop (the performance gets worse when increasing `N_REP`), is only about twice slower than the pre-allocated one. - -| Row | Function | Average | Relative | Replications | -|-----|--------------|-----------|----------|--------------| -| 1 | "inplace_op" | 0.0074854 | 1.0 | 100 | -| 2 | "normal_op" | 0.0174202 | 2.32723 | 100 | - -So it will usually not be a big problem unless you are at the bottleneck of the computation. - -## Distributed Key-value Store - -The type `KVStore` and related methods are used for data sharing across different devices or machines. It provides a simple and efficient integer-`NDArray` key-value storage system that each device can pull or push. - -The following example shows how to create a `local` `KVStore`, initialize a value and then pull it back. 
-```julia -kv = mx.KVStore(:local) -shape = (2,3) -key = 3 - -mx.init!(kv, key, mx.ones(shape)*2) -a = mx.empty(shape) -mx.pull!(kv, key, a) # pull value into a -println(copy(a)) -# => -# Float32[2.0 2.0 2.0 -# 2.0 2.0 2.0] -``` diff --git a/docs/user-guide/overview.rst b/docs/user-guide/overview.rst new file mode 100644 index 000000000000..2fb2738008cd --- /dev/null +++ b/docs/user-guide/overview.rst @@ -0,0 +1,376 @@ +Overview +======== + +MXNet.jl Namespace +------------------ + +Most of the functions and types in MXNet.jl are organized in a flat namespace. +Because many functions conflict with existing names in the Julia +Base module, we wrap them all in a ``mx`` module. The convention of accessing +the MXNet.jl interface is to use the ``mx.`` prefix explicitly: + +.. code-block:: julia + + using MXNet + + x = mx.zeros(2,3) # MXNet NDArray + y = zeros(eltype(x), size(x)) # Julia Array + copy!(y, x) # Overloaded function in Julia Base + z = mx.ones(size(x), mx.gpu()) # MXNet NDArray on GPU + mx.copy!(z, y) # Same as copy!(z, y) + +Note that functions like ``size`` and ``copy!``, which are extensively overloaded for +various types, work out of the box. But functions like ``zeros`` and ``ones`` +will be ambiguous, so we always use the ``mx.`` prefix. If you prefer, the +``mx.`` prefix can be used explicitly for all MXNet.jl functions, including +``size`` and ``copy!`` as shown in the last line. + +Low Level Interface +------------------- + +NDArrays +~~~~~~~~ + +``NDArray`` is the basic building blocks of the actual computations in MXNet. It +is like a Julia ``Array`` object, with some important differences listed here: + +* The actual data could live on different ``Context`` (e.g. GPUs). For some + contexts, iterating into the elements one by one is very slow, thus indexing + into ``NDArray`` is not supported in general. The easiest way to inspect the + contents of an ``NDArray`` is to use the ``copy`` function to copy the + contents as a Julia ``Array``.
+* Operations on ``NDArray`` (including basic arithmetics and neural network related operators) are executed in parallel with automatic dependency tracking to ensure correctness. +* There is no generics in ``NDArray``, the ``eltype`` is always ``mx.MX_float``. Because for applications in machine learning, single precision floating point numbers are typical a best choice balancing between precision, speed and portability. Also since libmxnet is designed to support multiple languages as front-ends, it is much simpler to implement with a fixed data type. + +While most of the computation is hidden in libmxnet by operators corresponding +to various neural network layers. Getting familiar with the ``NDArray`` API is +useful for implementing ``Optimizer`` or customized operators in Julia directly. + +The followings are common ways to create ``NDArray`` objects: + +* ``mx.empty(shape[, context])``: create on uninitialized array of a given shape + on a specific device. For example, ``mx.empty(2,3)`, `mx.((2,3), mx.gpu(2))``. +* ``mx.zeros(shape[, context])`` and ``mx.ones(shape[, context])``: similar to + the Julia's built-in ``zeros`` and ``ones``. +* ``mx.copy(jl_arr, context)``: copy the contents of a Julia ``Array`` to a specific device. + +Most of the convenient functions like ``size``, ``length``, ``ndims``, ``eltype`` on array objects should work out-of-the-box. Although indexing is not supported, it is possible to take *slices*: + +.. code-block:: julia + + a = mx.ones(2,3) + b = mx.slice(a, 1:2) + b[:] = 2 + println(copy(a)) + # => + # Float32[2.0 2.0 1.0 + # 2.0 2.0 1.0] + +A slice is a sub-region sharing the same memory with the original ``NDArray`` +object. A slice is always a contiguous piece of memory, so only slicing on the +*last* dimension is supported. The example above also shows a way to set the +contents of an ``NDArray``. + +.. 
code-block:: julia + + a = mx.empty(2,3) + a[:] = 0.5 # set all elements to a scalar + a[:] = rand(size(a)) # set contents with a Julia Array + copy!(a, rand(size(a))) # set value by copying a Julia Array + b = mx.empty(size(a)) + b[:] = a # copying and assignment between NDArrays + +Note due to the intrinsic design of the Julia language, a normal assignment + +.. code-block:: julia + + a = b + +does **not** mean copying the contents of ``b`` to ``a``. Instead, it just make +the variable ``a`` pointing to a new object, which is ``b``. Similarly, inplace arithmetics does not work as expected: + +.. code-block:: julia + + a = mx.ones(2) + r = a # keep a reference to a + b = mx.ones(2) + a += b # translates to a = a + b + println(copy(a)) + # => Float32[2.0f0,2.0f0] + println(copy(r)) + # => Float32[1.0f0,1.0f0] + +As we can see, ``a`` has expected value, but instead of inplace updating, a new +``NDArray`` is created and ``a`` is set to point to this new object. If we look +at ``r``, which still reference to the old ``a``, its content has not changed. +There is currently no way in Julia to overload the operators like ``+=`` to get customized behavior. + +Instead, you will need to write ``a[:] = a+b``, or if you want *real* inplace +``+=`` operation, MXNet.jl provides a simple macro ``@mx.inplace``: + +.. code-block:: julia + + @mx.inplace a += b + macroexpand(:(@mx.inplace a += b)) + # => :(MXNet.mx.add_to!(a,b)) + +As we can see, it translate the ``+=`` operator to an explicit ``add_to!`` +function call, which invokes into libmxnet to add the contents of ``b`` into +``a`` directly. For example, the following is the update rule in the SGD +``Optimizer`` (both ``grad`` and ``weight`` are ``NDArray`` objects): + +.. code-block:: julia + + @inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) + +Note there is no much magic in ``mx.inplace``: it only does a shallow +translation. 
In the SGD update rule example above, the computation like scaling +the gradient by ``grad_scale`` and adding the weight decay all create temporary +``NDArray`` objects. To mitigate this issue, libmxnet has a customized memory +allocator designed specifically to handle this kind of situations. The following +snippet does a simple benchmark on allocating temp ``NDArray`` vs. pre-allocating: + +.. code-block:: julia + + using Benchmark + using MXNet + + N_REP = 1000 + SHAPE = (128, 64) + CTX = mx.cpu() + LR = 0.1 + + function inplace_op() + weight = mx.zeros(SHAPE, CTX) + grad = mx.ones(SHAPE, CTX) + + # pre-allocate temp objects + grad_lr = mx.empty(SHAPE, CTX) + + for i = 1:N_REP + copy!(grad_lr, grad) + @mx.inplace grad_lr .*= LR + @mx.inplace weight -= grad_lr + end + return weight + end + + function normal_op() + weight = mx.zeros(SHAPE, CTX) + grad = mx.ones(SHAPE, CTX) + + for i = 1:N_REP + weight[:] -= LR * grad + end + return weight + end + + # make sure the results are the same + @assert(maximum(abs(copy(normal_op() - inplace_op()))) < 1e-6) + + println(compare([inplace_op, normal_op], 100)) + +The comparison on my laptop shows that ``normal_op`` while allocating a lot of +temp ``NDArray`` in the loop (the performance gets worse when increasing +``N_REP``), is only about twice slower than the pre-allocated one. + ++-----+--------------+-----------+----------+--------------+ +| Row | Function | Average | Relative | Replications | ++=====+==============+===========+==========+==============+ +| 1 | "inplace_op" | 0.0074854 | 1.0 | 100 | ++-----+--------------+-----------+----------+--------------+ +| 2 | "normal_op" | 0.0174202 | 2.32723 | 100 | ++-----+--------------+-----------+----------+--------------+ + +So it will usually not be a big problem unless you are at the bottleneck of the computation. 
+ +Distributed Key-value Store +~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +The type ``KVStore`` and related methods are used for data sharing across +different devices or machines. It provides a simple and efficient +integer - ``NDArray`` key-value storage system that each device can pull or push. + +The following example shows how to create a local ``KVStore``, initialize a value and then pull it back. + +.. code-block:: julia + + kv = mx.KVStore(:local) + shape = (2,3) + key = 3 + + mx.init!(kv, key, mx.ones(shape)*2) + a = mx.empty(shape) + mx.pull!(kv, key, a) # pull value into a + println(copy(a)) + # => + # Float32[2.0 2.0 2.0 + # 2.0 2.0 2.0] + +Intermediate Level Interface +---------------------------- + +Symbols and Composition +~~~~~~~~~~~~~~~~~~~~~~~ + +The way we build deep learning models in MXNet.jl is to use the powerful +symbolic composition system. It is like `Theano +<http://deeplearning.net/software/theano/>`_, except that we avoided long +expression compilation time by providing *larger* neural network related +building blocks to guarantee computation performance. See also `this note +<http://mxnet.readthedocs.org/en/latest/program_model.html>`_ for the design and trade-off of the MXNet symbolic composition system. + +The basic type is ``mx.Symbol``. The following is a trivial example of composing +two symbols with the ``+`` operation. + +.. code-block:: julia + + A = mx.Variable(:A) + B = mx.Variable(:B) + C = A + B + +We get a new *symbol* by composing existing *symbols* by some *operations*. A hierarchical architecture of a deep neural network could be realized by recursive composition. For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of 128 units and a ReLU activation function. + +..
code-block:: julia + + net = mx.Variable(:data) + net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) + net = mx.Activation(data=net, name=:relu1, act_type=:relu) + net = mx.FullyConnected(data=net, name=:fc2, num_hidden=64) + net = mx.Softmax(data=net, name=:out) + +Each time we take the previous symbol, and compose with an operation. Unlike the +simple ``+`` example above, the *operations* here are "bigger" ones, that correspond to common computation layers in deep neural networks. + +Each of those operation takes one or more input symbols for composition, with +optional hyper-parameters (e.g. ``num_hidden``, ``act_type``) to further customize the composition results. + +When applying those operations, we can also specify a ``name`` for the result symbol. This is convenient if we want to refer to this symbol later on. If not supplied, a name will be automatically generated. + +Each symbol takes some arguments. For example, in the ``+`` case above, to +compute the value of ``C``, we will need to know the values of the two inputs +``A`` and ``B``. For neural networks, the arguments are primarily two categories: *inputs* and *parameters*. *inputs* are data and labels for the networks, while *parameters* are typically trainable *weights*, *bias*, *filters*. + +When composing symbols, their arguments accumulates. We can list all the arguments by + +.. code-block:: julia + + julia> mx.list_arguments(net) + 6-element Array{Symbol,1}: + :data # Input data, name from the first data variable + :fc1_weight # Weights of the fully connected layer named :fc1 + :fc1_bias # Bias of the layer :fc1 + :fc2_weight # Weights of the layer :fc2 + :fc2_bias # Bias of the layer :fc2 + :out_label # Input label, required by the softmax layer named :out + +Note the names of the arguments are generated according to the provided name for each layer. We can also specify those names explicitly: + +.. 
code-block:: julia + + net = mx.Variable(:data) + w = mx.Variable(:myweight) + net = mx.FullyConnected(data=net, weight=w, name=:fc1, num_hidden=128) + mx.list_arguments(net) + # => + # 3-element Array{Symbol,1}: + # :data + # :myweight + # :fc1_bias + +The simple fact is that a ``Variable`` is just a placeholder ``mx.Symbol``. In composition, we can use arbitrary symbols for arguments. For example: + +.. code-block:: julia + + net = mx.Variable(:data) + net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) + net2 = mx.Variable(:data2) + net2 = mx.FullyConnected(data=net2, name=:net2, num_hidden=128) + mx.list_arguments(net2) + # => + # 3-element Array{Symbol,1}: + # :data2 + # :net2_weight + # :net2_bias + composed_net = net2(data2=net, name=:composed) + mx.list_arguments(composed_net) + # => + # 5-element Array{Symbol,1}: + # :data + # :fc1_weight + # :fc1_bias + # :net2_weight + # :net2_bias + +Note we use a composed symbol, ``net`` as the argument ``data2`` for ``net2`` to +get a new symbol, which we named ``:composed``. It also shows that a symbol itself is a call-able object, which can be invoked to fill in missing arguments and get more complicated symbol compositions. + +Shape Inference +~~~~~~~~~~~~~~~ + +Given enough information, the shapes of all arguments in a composed symbol could +be inferred automatically. For example, given the input shape, and some +hyper-parameters like ``num_hidden``, the shapes for the weights and bias in a neural network could be inferred. + +.. code-block:: julia + + net = mx.Variable(:data) + net = mx.FullyConnected(data=net, name=:fc1, num_hidden=10) + arg_shapes, out_shapes, aux_shapes = mx.infer_shape(net, data=(10, 64)) + +The returned shapes correspond to arguments with the same order as returned by +``mx.list_arguments``. The ``out_shapes`` are shapes for outputs, and +``aux_shapes`` can be safely ignored for now. + +..
code-block:: julia + + for (n,s) in zip(mx.list_arguments(net), arg_shapes) + println("$n => $s") + end + # => + # data => (10,64) + # fc1_weight => (10,10) + # fc1_bias => (10,) + for (n,s) in zip(mx.list_outputs(net), out_shapes) + println("$n => $s") + end + # => + # fc1_output => (10,64) + + +Binding and Executing +~~~~~~~~~~~~~~~~~~~~~ + +In order to execute the computation graph specified a composed symbol, we will +*bind* the free variables to concrete values, specified as ``mx.NDArray``. This +will create an ``mx.Executor`` on a given ``mx.Context``. A context describes the computation devices (CPUs, GPUs, etc.) and an executor will carry out the computation (forward/backward) specified in the corresponding symbolic composition. + +.. code-block:: julia + + A = mx.Variable(:A) + B = mx.Variable(:B) + C = A .* B + a = mx.ones(3) * 4 + b = mx.ones(3) * 2 + c_exec = mx.bind(C, context=mx.cpu(), args=Dict(:A => a, :B => b)) + + mx.forward(c_exec) + copy(c_exec.outputs[1]) # copy turns NDArray into Julia Array + # => + # 3-element Array{Float32,1}: + # 8.0 + # 8.0 + # 8.0 + +For neural networks, it is easier to use ``simple_bind``. By providing the shape +for input arguments, it will perform a shape inference for the rest of the +arguments and create the ``NDArray`` automatically. In practice, the binding and +executing steps are hidden under the ``Model`` interface. + +**TODO** Provide pointers to model tutorial and further details about binding and symbolic API. + + +High Level Interface +-------------------- + +The high level interface include model training and prediction API, etc. 
diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 6e40c00b6b15..03be2f7d336b 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -43,7 +43,7 @@ probs = mx.predict(model, eval_provider) # collect all labels from eval data labels = Array[] for batch in eval_provider - push!(labels, copy(mx.get_label(batch)[1])) + push!(labels, copy(mx.get_label(batch))) end labels = cat(1, labels...) diff --git a/src/io.jl b/src/io.jl index dcbefb145859..c8396c1d7182 100644 --- a/src/io.jl +++ b/src/io.jl @@ -118,7 +118,12 @@ function _get_data_or_label(batch::AbstractDataBatch, provide_func::Function, lo batch_size = get_batch_size(batch.provider) data_arrays_fake_slice = [SlicedNDArray[(1:batch_size, x)] for x in data_arrays] loader(batch, data_arrays_fake_slice) - return data_arrays + + if length(data_arrays) == 1 + return data_arrays[1] + else + return data_arrays + end end function get_data(batch :: AbstractDataBatch) _get_data_or_label(batch, provide_data, load_data!) diff --git a/src/model.jl b/src/model.jl index 80ee36d10674..84b581b00b09 100644 --- a/src/model.jl +++ b/src/model.jl @@ -178,7 +178,11 @@ function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::B push!(o_list, copy(slice(o_nd, 1:batch_size-get_pad(batch)))) end else - callback(self.pred_exec.outputs) + outputs = self.pred_exec.outputs + if length(outputs) == 1 + outputs = outputs[1] + end + callback(outputs) end end From bcc90ef8c6d564706991aa0cd062d74e96498ce3 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Oct 2015 22:06:15 -0400 Subject: [PATCH 133/630] switch from mkdocs to sphinx --- mkdocs.yml | 14 -------------- 1 file changed, 14 deletions(-) delete mode 100644 mkdocs.yml diff --git a/mkdocs.yml b/mkdocs.yml deleted file mode 100644 index 78822e3ada5a..000000000000 --- a/mkdocs.yml +++ /dev/null @@ -1,14 +0,0 @@ -site_name: MXNet.jl -site_author: pluskid -repo_url: https://github.com/dmlc/MXNet.jl -theme: readthedocs -pages: - - Home: 
index.md - - User Guide: - - 'Installation Guide' : 'user-guide/install.md' - - 'Overview' : 'user-guide/overview.md' - - Tutorials: - - 'MNIST': 'tutorials/mnist.md' - - API Documentation: - - 'ndarray': 'api/ndarray.md' - - 'symbol': 'api/symbol.md' From 8d56a9f6284789f84a383d172f8189cdc22ed0b7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Oct 2015 22:38:44 -0400 Subject: [PATCH 134/630] a dead simple embedded sphinx doc system (cf #3) --- docs/api/ndarray.rst | 99 ++++++++++++++++++++++++ docs/build-api.jl | 17 +++++ docs/index.rst | 8 ++ docs/user-guide/overview.rst | 32 ++++---- src/ndarray.jl | 143 +++++++++++++++++++++++++---------- 5 files changed, 244 insertions(+), 55 deletions(-) create mode 100644 docs/api/ndarray.rst create mode 100644 docs/build-api.jl diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst new file mode 100644 index 000000000000..1d6be0498e4a --- /dev/null +++ b/docs/api/ndarray.rst @@ -0,0 +1,99 @@ + +NDArray +======= + + + + +.. class:: NDArray + + Wrapper of the ``NDArray`` type in ``libmxnet``. This is the basic building block + of tensor-based computation. + + .. _ndarray-shape-note: + + .. note:: + + since C/C++ use row-major ordering for arrays while Julia follows a + column-major ordering. To keep things consistent, we keep the underlying data + in their original layout, but use *language-native* convention when we talk + about shapes. For example, a mini-batch of 100 MNIST images is a tensor of + C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory + have shape (28,28,1,100). + + + + +.. function:: context(arr :: NDArray) + + Get the context that this :class:`NDArray` lives on. + + + + +.. function:: + empty(shape :: Tuple, ctx :: Context) + empty(shape :: Tuple) + empty(dim1, dim2, ...) + + Allocate memory for an uninitialized :class:`NDArray` with specific shape. + + + + +Interface functions similar to Julia Arrays +------------------------------------------- + + + + +.. 
function:: + zeros(shape :: Tuple, ctx :: Context) + zeros(shape :: Tuple) + zeros(dim1, dim2, ...) + + Create zero-ed :class:`NDArray` with specific shape. + + + + +.. function:: + ones(shape :: Tuple, ctx :: Context) + ones(shape :: Tuple) + ones(dim1, dim2, ...) + + Create an :class:`NDArray` with specific shape and initialize with 1. + + + + +.. function:: + size(arr :: NDArray) + size(arr :: NDArray, dim :: Int) + + Get the shape of an :class:`NDArray`. The shape is in Julia's column-major convention. See + also the :ref:`notes on NDArray shapes <ndarray-shape-note>`. + + + + +.. function:: length(arr :: NDArray) + + Get the number of elements in an :class:`NDArray`. + + + + +.. function:: ndims(arr :: NDArray) + + Get the number of dimensions of an :class:`NDArray`. Is equivalent to ``length(size(arr))``. + + + + +.. function:: eltype(arr :: NDArray) + + Get the element type of an :class:`NDArray`. Currently the element type is always ``mx.MX_float``. + + + diff --git a/docs/build-api.jl b/docs/build-api.jl new file mode 100644 index 000000000000..9ddf9ff53b5b --- /dev/null +++ b/docs/build-api.jl @@ -0,0 +1,17 @@ +# extract API docs + +function extract_doc(output_filename::AbstractString, input_filenames::AbstractString...) + src_dir = joinpath(Pkg.dir("MXNet"), "src") + api_dir = joinpath(Pkg.dir("MXNet"), "docs", "api") + + mkpath(api_dir) + open(joinpath(api_dir, output_filename), "w") do io + for in_fn in input_filenames + for doc in eachmatch(r"^#=doc\s*$(.*?)^=#\s*$"ms, readall(joinpath(src_dir, in_fn))) + println(io, doc.captures[1], "\n\n") + end + end + end +end + +extract_doc("ndarray.rst", "ndarray.jl") diff --git a/docs/index.rst b/docs/index.rst index 8d0890e0c6a0..6af0d3b6fde7 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -11,6 +11,8 @@ include: - Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes.
- Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. +For more details, see documentation below. Please also check out the `examples +<https://github.com/dmlc/MXNet.jl/tree/master/examples>`_ directory. .. toctree:: :maxdepth: 2 @@ -25,6 +27,12 @@ include: user-guide/install user-guide/overview +.. toctree:: + :maxdepth: 1 + :caption: API Documentation + + api/ndarray + Indices and tables ================== diff --git a/docs/user-guide/overview.rst b/docs/user-guide/overview.rst index 2fb2738008cd..b93de48fed7f 100644 --- a/docs/user-guide/overview.rst +++ b/docs/user-guide/overview.rst @@ -31,22 +31,22 @@ Low Level Interface NDArrays ~~~~~~~~ -``NDArray`` is the basic building blocks of the actual computations in MXNet. It +:class:`NDArray` is the basic building blocks of the actual computations in MXNet. It is like a Julia ``Array`` object, with some important differences listed here: * The actual data could live on different ``Context`` (e.g. GPUs). For some contexts, iterating into the elements one by one is very slow, thus indexing - into ``NDArray`` is not supported in general. The easiest way to inspect the - contents of an ``NDArray`` is to use the ``copy`` function to copy the + into :class:`NDArray` is not supported in general. The easiest way to inspect the + contents of an :class:`NDArray` is to use the ``copy`` function to copy the contents as a Julia ``Array``. -* Operations on ``NDArray`` (including basic arithmetics and neural network related operators) are executed in parallel with automatic dependency tracking to ensure correctness. -* There is no generics in ``NDArray``, the ``eltype`` is always ``mx.MX_float``. Because for applications in machine learning, single precision floating point numbers are typical a best choice balancing between precision, speed and portability. Also since libmxnet is designed to support multiple languages as front-ends, it is much simpler to implement with a fixed data type.
+* Operations on :class:`NDArray` (including basic arithmetics and neural network related operators) are executed in parallel with automatic dependency tracking to ensure correctness. +* There is no generics in :class:`NDArray`, the ``eltype`` is always ``mx.MX_float``. Because for applications in machine learning, single precision floating point numbers are typical a best choice balancing between precision, speed and portability. Also since libmxnet is designed to support multiple languages as front-ends, it is much simpler to implement with a fixed data type. While most of the computation is hidden in libmxnet by operators corresponding -to various neural network layers. Getting familiar with the ``NDArray`` API is +to various neural network layers. Getting familiar with the :class:`NDArray` API is useful for implementing ``Optimizer`` or customized operators in Julia directly. -The followings are common ways to create ``NDArray`` objects: +The followings are common ways to create :class:`NDArray` objects: * ``mx.empty(shape[, context])``: create on uninitialized array of a given shape on a specific device. For example, ``mx.empty(2,3)`, `mx.((2,3), mx.gpu(2))``. @@ -66,10 +66,10 @@ Most of the convenient functions like ``size``, ``length``, ``ndims``, ``eltype` # Float32[2.0 2.0 1.0 # 2.0 2.0 1.0] -A slice is a sub-region sharing the same memory with the original ``NDArray`` +A slice is a sub-region sharing the same memory with the original :class:`NDArray` object. A slice is always a contiguous piece of memory, so only slicing on the *last* dimension is supported. The example above also shows a way to set the -contents of an ``NDArray``. +contents of an :class:`NDArray`. .. code-block:: julia @@ -101,7 +101,7 @@ the variable ``a`` pointing to a new object, which is ``b``. 
Similarly, inplace # => Float32[1.0f0,1.0f0] As we can see, ``a`` has expected value, but instead of inplace updating, a new -``NDArray`` is created and ``a`` is set to point to this new object. If we look +:class:`NDArray` is created and ``a`` is set to point to this new object. If we look at ``r``, which still reference to the old ``a``, its content has not changed. There is currently no way in Julia to overload the operators like ``+=`` to get customized behavior. @@ -117,7 +117,7 @@ Instead, you will need to write ``a[:] = a+b``, or if you want *real* inplace As we can see, it translate the ``+=`` operator to an explicit ``add_to!`` function call, which invokes into libmxnet to add the contents of ``b`` into ``a`` directly. For example, the following is the update rule in the SGD -``Optimizer`` (both ``grad`` and ``weight`` are ``NDArray`` objects): +``Optimizer`` (both ``grad`` and ``weight`` are :class:`NDArray` objects): .. code-block:: julia @@ -126,9 +126,9 @@ function call, which invokes into libmxnet to add the contents of ``b`` into Note there is no much magic in ``mx.inplace``: it only does a shallow translation. In the SGD update rule example above, the computation like scaling the gradient by ``grad_scale`` and adding the weight decay all create temporary -``NDArray`` objects. To mitigate this issue, libmxnet has a customized memory +:class:`NDArray` objects. To mitigate this issue, libmxnet has a customized memory allocator designed specifically to handle this kind of situations. The following -snippet does a simple benchmark on allocating temp ``NDArray`` vs. pre-allocating: +snippet does a simple benchmark on allocating temp :class:`NDArray` vs. pre-allocating: .. code-block:: julia @@ -171,7 +171,7 @@ snippet does a simple benchmark on allocating temp ``NDArray`` vs. 
pre-allocatin println(compare([inplace_op, normal_op], 100)) The comparison on my laptop shows that ``normal_op`` while allocating a lot of -temp ``NDArray`` in the loop (the performance gets worse when increasing +temp :class:`NDArray` in the loop (the performance gets worse when increasing ``N_REP``), is only about twice slower than the pre-allocated one. +-----+--------------+-----------+----------+--------------+ @@ -189,7 +189,7 @@ Distributed Key-value Store The type ``KVStore`` and related methods are used for data sharing across different devices or machines. It provides a simple and efficient -integer - ``NDArray`` key-value storage system that each device can pull or push. +integer - :class:`NDArray` key-value storage system that each device can pull or push. The following example shows how to create a local ``KVStore``, initialize a value and then pull it back. @@ -364,7 +364,7 @@ will create an ``mx.Executor`` on a given ``mx.Context``. A context describes th For neural networks, it is easier to use ``simple_bind``. By providing the shape for input arguments, it will perform a shape inference for the rest of the -arguments and create the ``NDArray`` automatically. In practice, the binding and +arguments and create the :class:`NDArray` automatically. In practice, the binding and executing steps are hidden under the ``Model`` interface. **TODO** Provide pointers to model tutorial and further details about binding and symbolic API. 
diff --git a/src/ndarray.jl b/src/ndarray.jl index 2156ce76be14..b2d42fda355f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,3 +1,8 @@ +#=doc +NDArray +======= +=# + # create a NDArray handle of specific shape function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) h_ref = Ref{MX_handle}(0) @@ -19,16 +24,23 @@ end ################################################################################ # NDArray Type ################################################################################ -"""Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block -of tensor-based computation. - -**Note** since C/C++ use row-major ordering for arrays while Julia follows a -column-major ordering. To keep things consistent, we keep the underlying data -in their original layout, but use *language-native* convention when we talk -about shapes. For example, a mini-batch of 100 MNIST images is a tensor of -C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory -have shape (28,28,1,100). -""" +#=doc +.. class:: NDArray + + Wrapper of the ``NDArray`` type in ``libmxnet``. This is the basic building block + of tensor-based computation. + + .. _ndarray-shape-note: + + .. note:: + + since C/C++ use row-major ordering for arrays while Julia follows a + column-major ordering. To keep things consistent, we keep the underlying data + in their original layout, but use *language-native* convention when we talk + about shapes. For example, a mini-batch of 100 MNIST images is a tensor of + C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory + have shape (28,28,1,100). 
+=# type NDArray handle :: MX_NDArrayHandle writable :: Bool @@ -55,6 +67,11 @@ Base.cconvert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) ################################################################################ # NDArray functions exported to the users ################################################################################ +#=doc +.. function:: context(arr :: NDArray) + + Get the context that this :class:`NDArray` lives on. +=# function context(arr :: NDArray) ref_typeid = Ref{Cint}(0) ref_devid = Ref{Cint}(0) @@ -63,6 +80,14 @@ function context(arr :: NDArray) return Context(ref_typeid[], ref_devid[]) end +#=doc +.. function:: + empty(shape :: Tuple, ctx :: Context) + empty(shape :: Tuple) + empty(dim1, dim2, ...) + + Allocate memory for an uninitialized :class:`NDArray` with specific shape. +=# function empty{N}(shape :: NTuple{N, Int}) empty(shape, cpu()) end @@ -73,35 +98,19 @@ function empty(shape :: Int...) empty(shape) end -#------------------------------------------------------------ -# Interface functions similar to Julia Arrays -#------------------------------------------------------------ -import Base: size, length, ndims, eltype -"""Get the shape of an `NDArray`. Note the shape is converted to Julia convention. - So the same piece of memory, in Julia (column-major), with shape (K, M, N), will be of the - shape (N, M, K) in the Python (row-major) binding. -""" -function size(arr :: NDArray) - ref_ndim = Ref{MX_uint}(0) - ref_shape = Ref{Ptr{MX_uint}}(0) - @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), - arr, ref_ndim, ref_shape) - tuple(map(Int, flipdim(pointer_to_array(ref_shape[], ref_ndim[]),1))...) 
-end -function size(arr :: NDArray, dim :: Int) - size(arr)[dim] -end -function length(arr :: NDArray) - prod(size(arr)) -end -function ndims(arr :: NDArray) - length(size(arr)) -end -function eltype(arr :: NDArray) - MX_float -end +#=doc +Interface functions similar to Julia Arrays +------------------------------------------- +=# + +#=doc +.. function:: + zeros(shape :: Tuple, ctx :: Context) + zeros(shape :: Tuple) + zeros(dim1, dim2, ...) -"Create zero-ed NDArray of specific shape" + Create zero-ed :class:`NDArray` with specific shape. +=# function zeros{N}(shape :: NTuple{N, Int}) zeros(shape, cpu()) end @@ -114,7 +123,14 @@ function zeros(shape :: Int...) zeros(shape) end -"Create NDArray and initialize with 1" +#=doc +.. function:: + ones(shape :: Tuple, ctx :: Context) + ones(shape :: Tuple) + ones(dim1, dim2, ...) + + Create an :class:`NDArray` with specific shape and initialize with 1. +=# function ones{N}(shape :: NTuple{N, Int}) ones(shape, cpu()) end @@ -127,6 +143,55 @@ function ones(shape :: Int...) ones(shape) end +import Base: size, length, ndims, eltype + +#=doc +.. function:: + size(arr :: NDArray) + size(arr :: NDArray, dim :: Int) + + Get the shape of an :class:`NDArray`. The shape is in Julia's column-major convention. See + also the :ref:`notes on NDArray shapes <ndarray-shape-note>`. +=# +function size(arr :: NDArray) + ref_ndim = Ref{MX_uint}(0) + ref_shape = Ref{Ptr{MX_uint}}(0) + @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), + arr, ref_ndim, ref_shape) + tuple(map(Int, flipdim(pointer_to_array(ref_shape[], ref_ndim[]),1))...) +end +function size(arr :: NDArray, dim :: Int) + size(arr)[dim] +end + +#=doc +.. function:: length(arr :: NDArray) + + Get the number of elements in an :class:`NDArray`. +=# +function length(arr :: NDArray) + prod(size(arr)) +end + +#=doc +.. function:: ndims(arr :: NDArray) + + Get the number of dimensions of an :class:`NDArray`. Is equivalent to ``length(size(arr))``. 
+=# +function ndims(arr :: NDArray) + length(size(arr)) +end + +#=doc +.. function:: eltype(arr :: NDArray) + + Get the element type of an :class:`NDArray`. Currently the element type is always ``mx.MX_float``. +=# +function eltype(arr :: NDArray) + MX_float +end + + import Base: slice """`slice` create a view into a sub-slice of an `NDArray`. Note only slicing at the slowest changing dimension is supported. In Julia's column-major perspective, this is the last From f1f869fac31a06d02df7ab0e06236e54c3584563 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Oct 2015 23:33:10 -0400 Subject: [PATCH 135/630] API document for NDArrays --- docs/api/ndarray.rst | 237 ++++++++++++++++++++++++++++++++++++++ src/ndarray.jl | 267 +++++++++++++++++++++++++++++++++---------- 2 files changed, 446 insertions(+), 58 deletions(-) diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index 1d6be0498e4a..6bf6b5defb29 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -97,3 +97,240 @@ Interface functions similar to Julia Arrays + +.. function:: slice(arr :: NDArray, start:stop) + + Create a view into a sub-slice of an :class:`NDArray`. Note only slicing at the slowest + changing dimension is supported. In Julia's column-major perspective, this is the last + dimension. For example, given an :class:`NDArray` of shape (2,3,4), ``slice(array, 2:3)`` will create + a :class:`NDArray` of shape (2,3,2), sharing the data with the original array. This operation is + used in data parallelization to split mini-batch into sub-batches for different devices. + + + + +.. function:: setindex!(arr :: NDArray, val, idx) + + Assign values to an :class:`NDArray`. Elementwise assignment is not implemented, only the following + scenarios are supported + + - ``arr[:] = val``: whole array assignment, ``val`` could be a scalar or an array (Julia ``Array`` + or :class:`NDArray`) of the same shape. 
+ - ``arr[start:stop] = val``: assignment to a *slice*, ``val`` could be a scalar or an array of + the same shape to the slice. See also :func:`slice`. + + + + +.. function:: getindex(arr :: NDArray, idx) + + Shortcut for :func:`slice`. A typical use is to write + + .. code-block:: julia + + arr[:] += 5 + + which translates into + + .. code-block:: julia + + arr[:] = arr[:] + 5 + + which further translates into + + .. code-block:: julia + + setindex!(arr, getindex(arr, Colon()) + 5, Colon()) + + .. note:: + + The behavior is quite different from indexing into Julia's ``Array``. For example, ``arr[2:5]`` + creates a **copy** of the sub-array for Julia ``Array``, while for :class:`NDArray`, this is + a *slice* that shares the memory. + + + + +Copying functions +----------------- + + + + +.. function:: + copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) + + Copy contents of ``src`` into ``dst``. + + + + +.. function:: + copy(arr :: NDArray) + copy(arr :: NDArray, ctx :: Context) + copy(arr :: Array, ctx :: Context) + + Create a copy of an array. When no :class:`Context` is given, create a Julia ``Array``. + Otherwise, create an :class:`NDArray` on the specified context. + + + + +.. function:: convert(::Type{Array{T}}, arr :: NDArray) + + Convert an :class:`NDArray` into a Julia ``Array`` of specific type. + + + + +Basic arithmetics +----------------- + + + + +.. function:: @inplace + + Julia does not support redefinition of the ``+=`` operator (like ``__iadd__`` in Python). + When one writes ``a += b``, it gets translated to ``a = a+b``. ``a+b`` will allocate new + memory for the results, and the newly allocated :class:`NDArray` object is then assigned + back to ``a``, while the original contents of ``a`` are discarded. This is very inefficient + when we want to do inplace update. + + This macro is a simple utility to implement this behavior. Write + + .. code-block:: julia + + @mx.inplace a += b + + will translate into + + .. 
code-block:: julia + + mx.add_to!(a, b) + + which will do inplace adding of the contents of ``b`` into ``a``. + + + + +.. function:: add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) + + Add a bunch of arguments into ``dst``. Inplace updating. + + + + +.. function:: + +(args...) + .+(args...) + + Summation. Multiple arguments of either scalar or :class:`NDArray` could be + added together. Note at least the first or second argument needs to be an :class:`NDArray` to + avoid ambiguity of built-in summation. + + + + +.. function:: sub_from!(dst :: NDArray, args :: Union{Real, NDArray}...) + + Subtract a bunch of arguments from ``dst``. Inplace updating. + + + + +.. function:: + -(arg0, arg1) + -(arg0) + .-(arg0, arg1) + + Subtraction ``arg0 - arg1``, of scalar types or :class:`NDArray`. Or create + the negative of ``arg0``. + + + + +.. function:: mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) + + Elementwise multiplication into ``dst`` of either a scalar or an :class:`NDArray` of the same shape. + Inplace updating. + + + + +.. function:: + .*(arg0, arg1) + + Elementwise multiplication of ``arg0`` and ``arg``, could be either scalar or :class:`NDArray`. + + + + +.. function:: + *(arg0, arg1) + + Currently only multiplication a scalar with an :class:`NDArray` is implemented. Matrix multiplication + is to be added soon. + + + + +.. function:: div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) + + Elementwise divide a scalar or an :class:`NDArray` of the same shape from ``dst``. Inplace updating. + + + + +.. function:: ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) + + Elementwise dividing an :class:`NDArray` by a scalar or another :class:`NDArray` of the same shape. + + + + +.. function:: /(arg0 :: NDArray, arg :: Real) + + Divide an :class:`NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. + + + + +IO +-- + + + + +.. function:: load(filename, ::Type{NDArray}) + + Load NDArrays from binary file. 
+ + :param AbstractString filename: the path of the file to load. It could be S3 or HDFS address. + :return: Either ``Dict{Base.Symbol, NDArray}`` or ``Vector{NDArray}``. + + If the ``libmxnet`` is built with the corresponding component enabled. Examples + + * ``s3://my-bucket/path/my-s3-ndarray`` + * ``hdfs://my-bucket/path/my-hdfs-ndarray`` + * ``/path-to/my-local-ndarray`` + + + + +.. function:: save(filename :: AbstractString, data) + + Save NDarrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built + with corresponding support. + + :param filename: path to the binary file to write to. + :param data: an :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. + + + + +libmxnet APIs +------------- + + + diff --git a/src/ndarray.jl b/src/ndarray.jl index b2d42fda355f..6db7546349f3 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -193,12 +193,15 @@ end import Base: slice -"""`slice` create a view into a sub-slice of an `NDArray`. Note only slicing at the slowest -changing dimension is supported. In Julia's column-major perspective, this is the last -dimension. For example, given an `NDArray` of shape (2,3,4), `sub(array, 2:3)` will create -a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is -used in data parallelization to split mini-batch into sub-batches for different devices. -""" +#=doc +.. function:: slice(arr :: NDArray, start:stop) + + Create a view into a sub-slice of an :class:`NDArray`. Note only slicing at the slowest + changing dimension is supported. In Julia's column-major perspective, this is the last + dimension. For example, given an :class:`NDArray` of shape (2,3,4), ``slice(array, 2:3)`` will create + a :class:`NDArray` of shape (2,3,2), sharing the data with the original array. This operation is + used in data parallelization to split mini-batch into sub-batches for different devices. 
+=# function slice(arr :: NDArray, ::Colon) arr end @@ -219,7 +222,18 @@ function slice(arr :: NDArray, slice::UnitRange{Int}) end import Base: setindex! -"Assign all elements of an NDArray to a scalar" + +#=doc +.. function:: setindex!(arr :: NDArray, val, idx) + + Assign values to an :class:`NDArray`. Elementwise assignment is not implemented, only the following + scenarios are supported + + - ``arr[:] = val``: whole array assignment, ``val`` could be a scalar or an array (Julia ``Array`` + or :class:`NDArray`) of the same shape. + - ``arr[start:stop] = val``: assignment to a *slice*, ``val`` could be a scalar or an array of + the same shape to the slice. See also :func:`slice`. +=# function setindex!(arr :: NDArray, val :: Real, ::Colon) @assert(arr.writable) _set_value(val, arr) @@ -235,6 +249,33 @@ function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, id setindex!(slice(arr, idx), val, Colon()) end +#=doc +.. function:: getindex(arr :: NDArray, idx) + + Shortcut for :func:`slice`. A typical use is to write + + .. code-block:: julia + + arr[:] += 5 + + which translates into + + .. code-block:: julia + + arr[:] = arr[:] + 5 + + which further translates into + + .. code-block:: julia + + setindex!(arr, getindex(arr, Colon()) + 5, Colon()) + + .. note:: + + The behavior is quite different from indexing into Julia's ``Array``. For example, ``arr[2:5]`` + creates a **copy** of the sub-array for Julia ``Array``, while for :class:`NDArray`, this is + a *slice* that shares the memory. +=# import Base: getindex """Shortcut for `slice`. **NOTE** the behavior for Julia's built-in index slicing is to create a copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. 
@@ -246,11 +287,17 @@ function getindex(arr :: NDArray, idx::UnitRange{Int}) slice(arr, idx) end -#------------------------------------------------------------ -# Copying functions -#------------------------------------------------------------ +#=doc +Copying functions +----------------- +=# import Base: copy!, copy, convert -"Copy data between NDArrays" +#=doc +.. function:: + copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) + + Copy contents of ``src`` into ``dst``. +=# function copy!(dst :: NDArray, src :: NDArray) @assert(dst.writable) if dst.handle == src.handle @@ -262,15 +309,16 @@ function copy!(dst :: NDArray, src :: NDArray) return dst end -"Copy data from NDArray to Julia Array" function copy!(dst :: Array{MX_float}, src :: NDArray) @assert size(dst) == size(src) @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{MX_float}, Csize_t), src, pointer(dst), length(dst)) return dst end +function copy!{T<:Real}(dst :: Array{T}, src :: NDArray) + copy!(dst, copy(src)) +end -"Copy data from Julia Array to NDArray" function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) @assert dst.writable @assert size(dst) == size(src) @@ -280,54 +328,72 @@ function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) return dst end -"Create copy: NDArray -> Julia Array" +#=doc +.. function:: + copy(arr :: NDArray) + copy(arr :: NDArray, ctx :: Context) + copy(arr :: Array, ctx :: Context) + + Create a copy of an array. When no :class:`Context` is given, create a Julia ``Array``. + Otherwise, create an :class:`NDArray` on the specified context. 
+=# +# Create copy: NDArray -> Julia Array function copy(arr :: NDArray) j_arr = Array(MX_float, size(arr)) copy!(j_arr, arr) end -"Create copy: NDArray -> NDArray in a given context" +# Create copy: NDArray -> NDArray in a given context function copy(arr :: NDArray, ctx :: Context) dst = NDArray(_ndarray_alloc(size(arr), ctx, true)) copy!(dst, arr) end -"Create copy: Julia Array -> NDArray in a given context" +# Create copy: Julia Array -> NDArray in a given context function copy{T<:Real}(arr :: Array{T}, ctx :: Context) dst = empty(size(arr), ctx) copy!(dst, arr) end -"Convert copy: NDArray -> Julia Array" +#=doc +.. function:: convert(::Type{Array{T}}, arr :: NDArray) + + Convert an :class:`NDArray` into a Julia ``Array`` of specific type. +=# +# Convert copy: NDArray -> Julia Array function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) convert(t, copy(arr)) end -#------------------------------------------------------------ -# Basic arithmetics -#------------------------------------------------------------ -""" -Julia does not support re-definiton of `+=` operator (like `__iadd__` in python), -When one write `a += b`, it gets translated to `a = a+b`. `a+b` will allocate new -memory for the results, and the newly allocated `NDArray` object is then assigned -back to a, while the original contents in a is discarded. This is very inefficient -when we want to do inplace update. +#=doc +Basic arithmetics +----------------- +=# -This macro is a simple utility to implement this behavior. Write +#=doc +.. function:: @inplace -```julia -@mx.inplace a += b -``` + Julia does not support redefinition of the ``+=`` operator (like ``__iadd__`` in Python). + When one writes ``a += b``, it gets translated to ``a = a+b``. ``a+b`` will allocate new + memory for the results, and the newly allocated :class:`NDArray` object is then assigned + back to ``a``, while the original contents of ``a`` are discarded. This is very inefficient + when we want to do inplace update. 
-will translate into + This macro is a simple utility to implement this behavior. Write -```julia -mx.add_to!(a, b) -``` + .. code-block:: julia -which will do inplace adding of the contents of b into a. -""" + @mx.inplace a += b + + will translate into + + .. code-block:: julia + + mx.add_to!(a, b) + + which will do inplace adding of the contents of ``b`` into ``a``. +=# macro inplace(stmt) if stmt.head == :+= || stmt.head == :.+= Expr(:call, :add_to!, esc(stmt.args[1]), esc(stmt.args[2])) @@ -342,6 +408,11 @@ macro inplace(stmt) end end +#=doc +.. function:: add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) + + Add a bunch of arguments into ``dst``. Inplace updating. +=# function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) @assert dst.writable for arg in args @@ -354,7 +425,15 @@ function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) return dst end -# We fix the first arg to be NDArray to avoid ambiguity +#=doc +.. function:: + +(args...) + .+(args...) + + Summation. Multiple arguments of either scalar or :class:`NDArray` could be + added together. Note at least the first or second argument needs to be an :class:`NDArray` to + avoid ambiguity of built-in summation. +=# import Base: +, .+ function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) ret = copy(arg0, context(arg0)) @@ -363,7 +442,18 @@ end function .+(arg0 :: NDArray, args :: Union{Real, NDArray}...) +(arg0, args...) end +function +(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...) + +(arg1, arg0, args...) +end +function .+(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...) + .+(arg1, arg0, args...) +end + +#=doc +.. function:: sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) + Subtract ``arg`` (a scalar or an :class:`NDArray`) from ``dst``. Inplace updating. 
+=# function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) @@ -372,6 +462,16 @@ function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) _minus(dst, arg, dst) end end + +#=doc +.. function:: + -(arg0, arg1) + -(arg0) + .-(arg0, arg1) + + Subtraction ``arg0 - arg1``, of scalar types or :class:`NDArray`. Or create + the negative of ``arg0``. +=# import Base: -, .- function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) @@ -380,10 +480,25 @@ end function .-(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) -(arg0, arg1) end +function -(arg0 :: Real, arg1 :: NDArray) + ret = -arg1 + add_to!(ret, arg0) + return ret +end +function .-(arg0 :: Real, arg1 :: NDArray) + -(arg0, arg1) +end + function -(arg0 :: NDArray) _mul_scalar(arg0, -1.0) end +#=doc +.. function:: mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) + + Elementwise multiplication into ``dst`` of either a scalar or an :class:`NDArray` of the same shape. + Inplace updating. +=# function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) @@ -393,6 +508,13 @@ function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) end return dst end + +#=doc +.. function:: + .*(arg0, arg1) + + Elementwise multiplication of ``arg0`` and ``arg``, could be either scalar or :class:`NDArray`. +=# import Base: .*, * function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) @@ -401,8 +523,14 @@ end function .*(arg0 :: Real, arg :: NDArray) .*(arg, arg0) end -# unlike *, we only allow type Real in arguments, because array-array * operator -# means matrix multiplication in Julia + +#=doc +.. function:: + *(arg0, arg1) + + Currently only multiplication a scalar with an :class:`NDArray` is implemented. Matrix multiplication + is to be added soon. 
+=# function *(arg0 :: NDArray, arg :: Real) ret = copy(arg0, context(arg0)) mul_to!(ret, arg) @@ -411,6 +539,11 @@ function *(arg0 :: Real, arg :: NDArray) *(arg, arg0) end +#=doc +.. function:: div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) + + Elementwise divide a scalar or an :class:`NDArray` of the same shape from ``dst``. Inplace updating. +=# function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) @@ -419,33 +552,45 @@ function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) _div(dst, arg, dst) end end + import Base: ./, / +#=doc +.. function:: ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) + + Elementwise dividing an :class:`NDArray` by a scalar or another :class:`NDArray` of the same shape. +=# function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) div_from!(ret, arg) end + +#=doc +.. function:: /(arg0 :: NDArray, arg :: Real) + + Divide an :class:`NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. +=# function /(arg0 :: NDArray, arg :: Real) ./(arg0, arg) end -#------------------------------------------------------------ -# IO -#------------------------------------------------------------ -"""Load NDArrays from binary file. - -**Parameters**: +#=doc +IO +-- +=# +#=doc +.. function:: load(filename, ::Type{NDArray}) -* `filename`: the path of the file to load. It could be S3 or HDFS address - if the `libmxnet` is built with the corresponding component enabled. Examples + Load NDArrays from binary file. - * `s3://my-bucket/path/my-s3-ndarray` - * `hdfs://my-bucket/path/my-hdfs-ndarray` - * `/path-to/my-local-ndarray` + :param AbstractString filename: the path of the file to load. It could be S3 or HDFS address. + :return: Either ``Dict{Base.Symbol, NDArray}`` or ``Vector{NDArray}``. -**Returns**: + If the ``libmxnet`` is built with the corresponding component enabled. 
Examples - Either `Dict{Base.Symbol, NDArray}` or `Vector{NDArray}`. -""" + * ``s3://my-bucket/path/my-s3-ndarray`` + * ``hdfs://my-bucket/path/my-hdfs-ndarray`` + * ``/path-to/my-local-ndarray`` +=# function load(filename::AbstractString, ::Type{NDArray}) out_size = Ref{MX_uint}(0) out_hdrs = Ref{Ptr{MX_handle}}(0) @@ -464,13 +609,15 @@ function load(filename::AbstractString, ::Type{NDArray}) end end -"""Save NDarrays to binary file. +#=doc +.. function:: save(filename :: AbstractString, data) -**Parameters**: + Save NDarrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built + with corresponding support. -* `filename`: path to the binary file to write to. -* `data`: an `NDArray`, or a `Vector{NDArray}` or a `Dict{Base.Symbol, NDArray}`. -""" + :param filename: path to the binary file to write to. + :param data: an :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. +=# function save(filename::AbstractString, data::NDArray) save(filename, [data]) end @@ -487,6 +634,10 @@ function save(filename::AbstractString, data::Dict{Base.Symbol,NDArray}) filename, length(names), arrays, names) end +#=doc +libmxnet APIs +------------- +=# ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ From ac39fd6c2ceb153b9862bbd6c00e3c8ccb70f408 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 27 Oct 2015 00:10:13 -0400 Subject: [PATCH 136/630] libmxnet API for ndarrays --- docs/api/ndarray.rst | 279 +++++++++++++++++++++++++++++++++++++++++++ docs/build-api.jl | 59 ++++++++- src/ndarray.jl | 162 ++++++++++++++----------- src/util.jl | 5 +- 4 files changed, 425 insertions(+), 80 deletions(-) diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index 6bf6b5defb29..c8b9aeb6dc6a 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -334,3 +334,282 @@ 
libmxnet APIs + +The libmxnet APIs are automatically imported from ``libmxnet.so``. The functions listed +here operate on :class:`NDArray` objects. The arguments to the functions are typically ordered +as + +.. code-block:: julia + + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) + +unless ``NDARRAY_ARG_BEFORE_SCALAR`` is not set. In this case, the scalars are put before the input arguments: + +.. code-block:: julia + + func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) + + +If ``ACCEPT_EMPTY_MUTATE_TARGET`` is set, an overloaded function without the output arguments will also be defined: + +.. code-block:: julia + + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) + +Upon calling, the output arguments will be automatically initialized with empty NDArrays. + +Those functions always return the output arguments. If there is only one output (the typical situation), that +object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. + +Public APIs +^^^^^^^^^^^ +.. function:: choose_element(...) + + Choose one element from each line(row for python, column for R/Julia) in lhs according to index indicated by rhs + + :param NDArray lhs: Left operand to the function. + + + :param NDArray rhs: Right operand to the function. + + + + + +.. function:: clip(...) + + Clip ndarray elements to range (a_min, a_max) + + :param NDArray src: Source input + + + :param real_t a_min: Minimum value + + + :param real_t a_max: Maximum value + + + + + +.. function:: dot(...) + + Calculate 2D matrix multiplication + + :param NDArray lhs: Left operand to the function. + + + :param NDArray rhs: Right operand to the function. + + + + + +.. function:: sqrt(...) + + Take square root of the src + + :param NDArray src: Source input to the function + + + + + +.. function:: square(...) 
+ + Take square of the src + + :param NDArray src: Source input to the function + + + + +Internal APIs +^^^^^^^^^^^^^ + +.. note:: + + Document and signatures for internal API functions might be incomplete. + +.. function:: _copyto(...) + + + + :param NDArray src: Source input to the function. + + + + + +.. function:: _div(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param NDArray rhs: Right operand to the function. + + + + + +.. function:: _div_scalar(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param real_t rhs: Right operand to the function. + + + + + +.. function:: _minus(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param NDArray rhs: Right operand to the function. + + + + + +.. function:: _minus_scalar(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param real_t rhs: Right operand to the function. + + + + + +.. function:: _mul(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param NDArray rhs: Right operand to the function. + + + + + +.. function:: _mul_scalar(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param real_t rhs: Right operand to the function. + + + + + +.. function:: _onehot_encode(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param NDArray rhs: Right operand to the function. + + + + + +.. function:: _plus(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param NDArray rhs: Right operand to the function. + + + + + +.. function:: _plus_scalar(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param real_t rhs: Right operand to the function. + + + + + +.. function:: _random_gaussian(...) + + + + + + + +.. function:: _random_uniform(...) + + + + + + + +.. function:: _rdiv_scalar(...) + + + + :param NDArray lhs: Left operand to the function. + + + :param real_t rhs: Right operand to the function. + + + + + +.. function:: _rminus_scalar(...) 
+ + + + :param NDArray lhs: Left operand to the function. + + + :param real_t rhs: Right operand to the function. + + + + + +.. function:: _set_value(...) + + + + :param real_t src: Source input to the function. + + + + + + + + diff --git a/docs/build-api.jl b/docs/build-api.jl index 9ddf9ff53b5b..82d5d320674b 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -1,17 +1,66 @@ # extract API docs +using MXNet + +const SRC_DIR = joinpath(Pkg.dir("MXNet"), "src") +const API_DIR = joinpath(Pkg.dir("MXNet"), "docs", "api") function extract_doc(output_filename::AbstractString, input_filenames::AbstractString...) - src_dir = joinpath(Pkg.dir("MXNet"), "src") - api_dir = joinpath(Pkg.dir("MXNet"), "docs", "api") - mkpath(api_dir) - open(joinpath(api_dir, output_filename), "w") do io + mkpath(API_DIR) + open(joinpath(API_DIR, output_filename), "w") do io for in_fn in input_filenames - for doc in eachmatch(r"^#=doc\s*$(.*?)^=#\s*$"ms, readall(joinpath(src_dir, in_fn))) + for doc in eachmatch(r"^#=doc\s*$(.*?)^=#\s*$"ms, readall(joinpath(SRC_DIR, in_fn))) println(io, doc.captures[1], "\n\n") end end end end +function sort_api_names(names) + names = collect(names) + names_pub = filter(x -> !startswith(string(x), '_'), names) + names_pri = filter(x -> startswith(string(x), '_'), names) + return (sort(names_pub), sort(names_pri)) +end + +function embed_mxnet_api(output_filename::AbstractString, key::AbstractString, generator::Function) + output_filename = joinpath(API_DIR, output_filename) + contents = readall(output_filename) + open(output_filename, "w") do io + docs = generator(gen_docs=true) + function gen_doc(fname) + doc = replace(docs[fname], r"^"m, " ") + """ + .. function:: $fname(...) 
+ + $doc + + """ + end + + names_pub, names_pri = sort_api_names(keys(docs)) + docs_pub = join(map(gen_doc, names_pub), "\n\n") + docs_pri = join(map(gen_doc, names_pri), "\n\n") + docstrings = """ + Public APIs + ^^^^^^^^^^^ + """ * docs_pub + + docstrings *= """ + + Internal APIs + ^^^^^^^^^^^^^ + + .. note:: + + Document and signatures for internal API functions might be incomplete. + + """ * docs_pri + + key = mx.format(mx.DOC_EMBED_ANCHOR, key) + println(io, replace(contents, key, docstrings)) + end +end + extract_doc("ndarray.rst", "ndarray.jl") +embed_mxnet_api("ndarray.rst", "ndarray", mx._import_ndarray_functions) diff --git a/src/ndarray.jl b/src/ndarray.jl index 6db7546349f3..eb82e06ec294 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -656,32 +656,36 @@ end # functions can overload them import Base: sqrt -""" -Import dynamic functions for NDArrays. The arguments to the functions are typically ordered +#=doc +The libmxnet APIs are automatically imported from ``libmxnet.so``. The functions listed +here operate on :class:`NDArray` objects. The arguments to the functions are typically ordered as -```julia -func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) -``` +.. code-block:: julia + + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) + +unless ``NDARRAY_ARG_BEFORE_SCALAR`` is not set, in which case the scalars are put before the input arguments: + +.. code-block:: julia + + func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) -unless NDARRAY_ARG_BEFORE_SCALAR is not set. In this case, the scalars are put before the input arguments: -```julia -func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) -``` +If ``ACCEPT_EMPTY_MUTATE_TARGET`` is set, an overloaded function without the output arguments will also be defined: -If `ACCEPT_EMPTY_MUTATE_TARGET` is set. An overloaded function without the output arguments will also be defined: +.. 
code-block:: julia -```julia -func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) -``` + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) Upon calling, the output arguments will be automatically initialized with empty NDArrays. Those functions always return the output arguments. If there is only one output (the typical situation), that -object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. -""" -function _import_ndarray_functions() +object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. + +**autogen:EMBED:ndarray:EMBED:autogen** +=# +function _import_ndarray_functions(;gen_docs=false) n_ref = Ref{MX_uint}(0) h_ref = Ref{Ptr{MX_handle}}(0) @mxcall(:MXListFunctions, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) @@ -689,6 +693,10 @@ function _import_ndarray_functions() n_funcs = n_ref[] h_funcs = pointer_to_array(h_ref[], n_funcs) + if gen_docs + docs = Dict{Base.Symbol, AbstractString}() + end + for i = 1:n_funcs func_handle = h_funcs[i] @@ -708,66 +716,74 @@ function _import_ndarray_functions() func_name = symbol(bytestring(ref_name[])) - #---------------------------------------- - # get function specification - ref_n_use_vars = Ref{MX_uint}(0) - ref_n_scalars = Ref{MX_uint}(0) - ref_n_mut_vars = Ref{MX_uint}(0) - ref_type_mask = Ref{Cint}(0) - @mxcall(:MXFuncDescribe, - (MX_handle, Ref{MX_uint}, Ref{MX_uint}, Ref{MX_uint}, Ref{Cint}), - func_handle, ref_n_use_vars, ref_n_scalars, ref_n_mut_vars, ref_type_mask) - - #---------------------------------------- - # prepare function definition - n_used_vars = ref_n_use_vars[] - n_scalars = ref_n_scalars[] - n_mutate_vars = ref_n_mut_vars[] - type_mask = ref_type_mask[] - accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 - arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 - - # general ndarray function - if arg_before_scalar - args = vcat([Expr(:(::), 
symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - else - args = vcat([Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - end - - _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...) - _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...) - _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...) - stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars) - if n_mutate_vars == 1 - stmt_ret = :(return out1) + if gen_docs + # generate document only + f_desc = bytestring(ref_desc[]) * "\n\n" + f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) + docs[func_name] = f_desc else - stmt_ret = Expr(:return, Expr(:tuple, [symbol("out$i") for i=1:n_mutate_vars]...)) - end - - func_body = Expr(:block, stmt_call, stmt_ret) - func_head = Expr(:call, func_name, args...) - - func_def = Expr(:function, func_head, func_body) - eval(func_def) - - if accept_empty_mutate - args0 = args[1:n_used_vars+n_scalars] - func_head0 = Expr(:call, func_name, args0...) - _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] - stmt_call0 = Expr(:call, func_name, args0..., _mut_vars0...) - func_body0 = Expr(:block, stmt_call0) - func_head0 = Expr(:call, func_name, args0...) 
- - func_def0 = Expr(:function, func_head0, func_body0) - eval(func_def0) + #---------------------------------------- + # get function specification + ref_n_use_vars = Ref{MX_uint}(0) + ref_n_scalars = Ref{MX_uint}(0) + ref_n_mut_vars = Ref{MX_uint}(0) + ref_type_mask = Ref{Cint}(0) + @mxcall(:MXFuncDescribe, + (MX_handle, Ref{MX_uint}, Ref{MX_uint}, Ref{MX_uint}, Ref{Cint}), + func_handle, ref_n_use_vars, ref_n_scalars, ref_n_mut_vars, ref_type_mask) + + #---------------------------------------- + # prepare function definition + n_used_vars = ref_n_use_vars[] + n_scalars = ref_n_scalars[] + n_mutate_vars = ref_n_mut_vars[] + type_mask = ref_type_mask[] + accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 + arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 + + # general ndarray function + if arg_before_scalar + args = vcat([Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], + [Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], + [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) + else + args = vcat([Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], + [Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], + [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) + end + + _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...) + _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...) + _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...) + stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars) + if n_mutate_vars == 1 + stmt_ret = :(return out1) + else + stmt_ret = Expr(:return, Expr(:tuple, [symbol("out$i") for i=1:n_mutate_vars]...)) + end + + func_body = Expr(:block, stmt_call, stmt_ret) + func_head = Expr(:call, func_name, args...) 
+ + func_def = Expr(:function, func_head, func_body) + eval(func_def) + + if accept_empty_mutate + args0 = args[1:n_used_vars+n_scalars] + func_head0 = Expr(:call, func_name, args0...) + _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] + stmt_call0 = Expr(:call, func_name, args0..., _mut_vars0...) + func_body0 = Expr(:block, stmt_call0) + func_head0 = Expr(:call, func_name, args0...) + + func_def0 = Expr(:function, func_head0, func_body0) + eval(func_def0) + end end + end - # TODO: add doc string - # eval(:(@doc($doc_str, $func_name))) + if gen_docs + return docs end end diff --git a/src/util.jl b/src/util.jl index 1c52fdf3f2c3..b3997dbaff45 100644 --- a/src/util.jl +++ b/src/util.jl @@ -46,6 +46,7 @@ end ################################################################################ # Internal Utilities ################################################################################ +const DOC_EMBED_ANCHOR = "**autogen:EMBED:{1}:EMBED:autogen**" function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{char_pp}, arg_descs::Ref{char_pp}, remove_dup::Bool=true) param_keys = Set{AbstractString}() @@ -63,7 +64,7 @@ function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{ch arg_type = bytestring(arg_types[i]) arg_desc = bytestring(arg_descs[i]) - push!(docstrings, "* `$arg_name`: $arg_type\n\n $arg_desc\n\n") + push!(docstrings, ":param $arg_type $arg_name: $arg_desc\n\n") end - return "**Parameters**\n\n$(join(docstrings, "\n"))" + return join(docstrings, "\n") end From e7ec661e5530a212e722d940b78d94d7bdb11026 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 27 Oct 2015 00:19:54 -0400 Subject: [PATCH 137/630] automatic build API for symbols --- docs/api/symbol.rst | 436 ++++++++++++++++++++++++++++++++++++++++++++ docs/build-api.jl | 10 +- docs/index.rst | 1 + src/symbol.jl | 41 +++-- 4 files changed, 475 insertions(+), 13 deletions(-) create mode 100644 docs/api/symbol.rst diff --git 
a/docs/api/symbol.rst b/docs/api/symbol.rst new file mode 100644 index 000000000000..9feae90c681f --- /dev/null +++ b/docs/api/symbol.rst @@ -0,0 +1,436 @@ + +libmxnet APIs +------------- + +Public APIs +^^^^^^^^^^^ +.. function:: Activation(...) + + Apply activation function to input. + + :param Symbol data: Input data to activation function. + + + :param {'relu', 'sigmoid', 'tanh'}, required act_type: Activation function to be applied. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: BatchNorm(...) + + Apply batch normalization to input. + + :param Symbol data: Input data to batch normalization + + + :param float, optional, default=1e-10 eps: Epsilon to prevent div 0 + + + :param float, optional, default=0.1 momentum: Momentum for moving average + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: BlockGrad(...) + + Get output from a symbol and pass 0 gradient back + + :param Symbol data: Input data. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: Concat(...) + + Perform an feature concat on channel dim (dim 1) over all the inputs. + + This function support variable length positional :class:`Symbol` inputs. + + :param int, required num_args: Number of inputs to be concated. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: Convolution(...) + + Apply convolution to input then add a bias. + + :param Symbol data: Input data to the ConvolutionOp. + + + :param Symbol weight: Weight matrix. + + + :param Symbol bias: Bias parameter. 
+ + + :param Shape(tuple), required kernel: convolution kernel size: (y, x) + + + :param Shape(tuple), optional, default=(1, 1) stride: convolution stride: (y, x) + + + :param Shape(tuple), optional, default=(0, 0) pad: pad for convolution: (y, x) + + + :param int (non-negative), required num_filter: convolution filter(channel) number + + + :param int (non-negative), optional, default=1 num_group: number of groups partition + + + :param long (non-negative), optional, default=512 workspace: Tmp workspace for convolution (MB) + + + :param boolean, optional, default=False no_bias: Whether to disable bias parameter. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: Dropout(...) + + Apply dropout to input + + :param Symbol data: Input data to dropout. + + + :param float, optional, default=0.5 p: Fraction of the input that gets dropped out at training time + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: ElementWiseSum(...) + + Perform an elementwise sum over all the inputs. + + This function support variable length positional :class:`Symbol` inputs. + + :param int, required num_args: Number of inputs to be sumed. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: Flatten(...) + + Flatten input + + :param Symbol data: Input data to flatten. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: FullyConnected(...) + + Apply matrix multiplication to input then add a bias. + + :param Symbol data: Input data to the FullyConnectedOp. + + + :param Symbol weight: Weight matrix. + + + :param Symbol bias: Bias parameter. 
+ + + :param int, required num_hidden: Number of hidden nodes of the output. + + + :param boolean, optional, default=False no_bias: Whether to disable bias parameter. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: LRN(...) + + Apply convolution to input then add a bias. + + :param Symbol data: Input data to the ConvolutionOp. + + + :param float, optional, default=0.0001 alpha: value of the alpha variance scaling parameter in the normalization formula + + + :param float, optional, default=0.75 beta: value of the beta power parameter in the normalization formula + + + :param float, optional, default=2 knorm: value of the k parameter in normalization formula + + + :param int (non-negative), required nsize: normalization window width in elements. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: LeakyReLU(...) + + Apply activation function to input. + + :param Symbol data: Input data to activation function. + + + :param {'leaky', 'prelu', 'rrelu'},optional, default='leaky' act_type: Activation function to be applied. + + + :param float, optional, default=0.25 slope: Init slope for the activation. (For leaky only) + + + :param float, optional, default=0.125 lower_bound: Lower bound of random slope. (For rrelu only) + + + :param float, optional, default=0.334 upper_bound: Upper bound of random slope. (For rrelu only) + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: LinearRegressionOutput(...) + + Use linear regression for final output, this is used on final output of a net. + + :param Symbol data: Input data to function. + + + :param Symbol label: Input label to function. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. 
+ + :return: The constructed :class:`Symbol`. + + + + + +.. function:: LogisticRegressionOutput(...) + + Use Logistic regression for final output, this is used on final output of a net. + Logistic regression is suitable for binary classification or probability prediction tasks. + + :param Symbol data: Input data to function. + + + :param Symbol label: Input label to function. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: Pooling(...) + + Perform spatial pooling on inputs. + + :param Symbol data: Input data to the pooling operator. + + + :param Shape(tuple), required kernel: pooling kernel size: (y, x) + + + :param {'avg', 'max', 'sum'}, required pool_type: Pooling type to be applied. + + + :param Shape(tuple), optional, default=(1, 1) stride: stride: for pooling (y, x) + + + :param Shape(tuple), optional, default=(0, 0) pad: pad for pooling: (y, x) + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: Reshape(...) + + Reshape input to target shape + + :param Symbol data: Input data to reshape. + + + :param Shape(tuple), required target_shape: Target new shape + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: SliceChannel(...) + + Slice channel into many outputs with equally divided channel + + :param int, required num_outputs: Number of outputs to be sliced. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: Softmax(...) + + Perform a softmax transformation on input. + + :param Symbol data: Input data to softmax. 
+ + + :param float, optional, default=1 grad_scale: Scale the gradient by a float factor + + + :param boolean, optional, default=False multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: sqrt(...) + + Take square root of the src + + :param Symbol src: Source symbolic input to the function + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: square(...) + + Take square of the src + + :param Symbol src: Source symbolic input to the function + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + +Internal APIs +^^^^^^^^^^^^^ + +.. note:: + + Document and signatures for internal API functions might be incomplete. + +.. function:: _Div(...) + + Perform an elementwise div. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: _Minus(...) + + Perform an elementwise minus. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: _Mul(...) + + Perform an elementwise mul. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. + + + + + +.. function:: _Plus(...) + + Perform an elementwise plus. + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: The constructed :class:`Symbol`. 
+ + + + + + + + diff --git a/docs/build-api.jl b/docs/build-api.jl index 82d5d320674b..b70cbd94615b 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -4,8 +4,10 @@ using MXNet const SRC_DIR = joinpath(Pkg.dir("MXNet"), "src") const API_DIR = joinpath(Pkg.dir("MXNet"), "docs", "api") +################################################################################# +# Document Builders +################################################################################# function extract_doc(output_filename::AbstractString, input_filenames::AbstractString...) - mkpath(API_DIR) open(joinpath(API_DIR, output_filename), "w") do io for in_fn in input_filenames @@ -62,5 +64,11 @@ function embed_mxnet_api(output_filename::AbstractString, key::AbstractString, g end end +################################################################################# +# Build Documents +################################################################################# extract_doc("ndarray.rst", "ndarray.jl") embed_mxnet_api("ndarray.rst", "ndarray", mx._import_ndarray_functions) + +extract_doc("symbol.rst", "symbol.jl") +embed_mxnet_api("symbol.rst", "symbol", mx._import_atomic_symbol_creators) diff --git a/docs/index.rst b/docs/index.rst index 6af0d3b6fde7..adc4ef8d658c 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -32,6 +32,7 @@ For more details, see documentation below. 
Please also checkout the `examples :caption: API Documentation api/ndarray + api/symbol Indices and tables ================== diff --git a/src/symbol.jl b/src/symbol.jl index a1f008c29cd3..635b4a494c6b 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -253,10 +253,16 @@ function save(filename :: AbstractString, sym :: Symbol) @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), sym, filename) end +#=doc +libmxnet APIs +------------- + +**autogen:EMBED:symbol:EMBED:autogen** +=# ################################################################################ # Atomic Symbol functions dynamically imported from libmxnet ################################################################################ -function _define_atomic_symbol_creator(hdr :: MX_handle) +function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) ref_name = Ref{char_p}(0) ref_desc = Ref{char_p}(0) ref_kv_nargs = Ref{char_p}(0) @@ -274,13 +280,16 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) kv_nargs_s = bytestring(ref_kv_nargs[]) kv_nargs = symbol(kv_nargs_s) - f_desc = bytestring(ref_desc[]) * "\n\n" - if !isempty(kv_nargs_s) - f_desc *= "This function support variable length positional `Symbol` inputs.\n\n" + if gen_docs + f_desc = bytestring(ref_desc[]) * "\n\n" + if !isempty(kv_nargs_s) + f_desc *= "This function support variable length positional :class:`Symbol` inputs.\n\n" + end + f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) + f_desc *= ":param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional.\n\n" + f_desc *= ":return: The constructed :class:`Symbol`.\n\n" + return (func_name, f_desc) end - f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= "* `name`: Julia Symbol (e.g. `:my_symbol`), optional.\n\n The name of the symbol.\n\n" - f_desc *= "**Returns**\n\n`symbol`: `mx.Symbol`\n\n The constructed symbol." # function $func_name(args...; kwargs...) 
func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) @@ -349,12 +358,9 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) func_def = Expr(:function, func_head, Expr(:block, func_body)) eval(func_def) - - # add doc string - eval(:(@doc($f_desc, $func_name))) end -function _import_atomic_symbol_creators() +function _import_atomic_symbol_creators(;gen_docs=false) n_ref = Ref{MX_uint}(0) h_ref = Ref{Ptr{MX_handle}}(0) @mxcall(:MXSymbolListAtomicSymbolCreators, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) @@ -362,9 +368,20 @@ function _import_atomic_symbol_creators() n_creators = n_ref[] h_creators = pointer_to_array(h_ref[], n_creators) + if gen_docs + docs = Dict{Base.Symbol, AbstractString}() + end + for i = 1:n_creators creator_hdr = h_creators[i] - _define_atomic_symbol_creator(creator_hdr) + ret = _define_atomic_symbol_creator(creator_hdr, gen_docs=gen_docs) + if gen_docs + docs[ret[1]] = ret[2] + end + end + + if gen_docs + return docs end end From 9c87c61dde1ac236ed55658e70fa7673d6e357ed Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 27 Oct 2015 00:26:31 -0400 Subject: [PATCH 138/630] fix mal-formatted param type in sphinx syntax --- docs/api/ndarray.rst | 66 ++++++++--------- docs/api/symbol.rst | 165 +++++++++++++++++++++++-------------------- src/symbol.jl | 16 +++-- src/util.jl | 2 +- 4 files changed, 135 insertions(+), 114 deletions(-) diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index c8b9aeb6dc6a..3f8404afd7e5 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -367,10 +367,10 @@ Public APIs Choose one element from each line(row for python, column for R/Julia) in lhs according to index indicated by rhs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param NDArray rhs: Right operand to the function. + :param rhs: ``NDArray``. Right operand to the function. 
@@ -380,13 +380,13 @@ Public APIs Clip ndarray elements to range (a_min, a_max) - :param NDArray src: Source input + :param src: ``NDArray``. Source input - :param real_t a_min: Minimum value + :param a_min: ``real_t``. Minimum value - :param real_t a_max: Maximum value + :param a_max: ``real_t``. Maximum value @@ -396,10 +396,10 @@ Public APIs Calcuate 2D matrix multiplication - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param NDArray rhs: Right operand to the function. + :param rhs: ``NDArray``. Right operand to the function. @@ -409,7 +409,7 @@ Public APIs Take square root of the src - :param NDArray src: Source input to the function + :param src: ``NDArray``. Source input to the function @@ -419,7 +419,7 @@ Public APIs Take square of the src - :param NDArray src: Source input to the function + :param src: ``NDArray``. Source input to the function @@ -435,7 +435,7 @@ Internal APIs - :param NDArray src: Source input to the function. + :param src: ``NDArray``. Source input to the function. @@ -445,10 +445,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param NDArray rhs: Right operand to the function. + :param rhs: ``NDArray``. Right operand to the function. @@ -458,10 +458,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param real_t rhs: Right operand to the function. + :param rhs: ``real_t``. Right operand to the function. @@ -471,10 +471,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param NDArray rhs: Right operand to the function. + :param rhs: ``NDArray``. Right operand to the function. @@ -484,10 +484,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. 
- :param real_t rhs: Right operand to the function. + :param rhs: ``real_t``. Right operand to the function. @@ -497,10 +497,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param NDArray rhs: Right operand to the function. + :param rhs: ``NDArray``. Right operand to the function. @@ -510,10 +510,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param real_t rhs: Right operand to the function. + :param rhs: ``real_t``. Right operand to the function. @@ -523,10 +523,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param NDArray rhs: Right operand to the function. + :param rhs: ``NDArray``. Right operand to the function. @@ -536,10 +536,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param NDArray rhs: Right operand to the function. + :param rhs: ``NDArray``. Right operand to the function. @@ -549,10 +549,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param real_t rhs: Right operand to the function. + :param rhs: ``real_t``. Right operand to the function. @@ -578,10 +578,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param real_t rhs: Right operand to the function. + :param rhs: ``real_t``. Right operand to the function. @@ -591,10 +591,10 @@ Internal APIs - :param NDArray lhs: Left operand to the function. + :param lhs: ``NDArray``. Left operand to the function. - :param real_t rhs: Right operand to the function. + :param rhs: ``real_t``. Right operand to the function. @@ -604,7 +604,7 @@ Internal APIs - :param real_t src: Source input to the function. 
+ :param src: ``real_t``. Source input to the function. diff --git a/docs/api/symbol.rst b/docs/api/symbol.rst index 9feae90c681f..a645d9a13dff 100644 --- a/docs/api/symbol.rst +++ b/docs/api/symbol.rst @@ -1,4 +1,17 @@ +.. class:: Symbol + + Symbol is the basic building block of the symbolic graph in MXNet.jl. + + .. note:: + + Throughout this documentation, ``Symbol`` always refers to this :class:`Symbol` type. + When we refer to Julia's built-in symbol type (e.g. ``typeof(:foo)``), we always + say ``Base.Symbol``. + + + + libmxnet APIs ------------- @@ -8,12 +21,12 @@ Public APIs Apply activation function to input. - :param Symbol data: Input data to activation function. + :param data: ``Symbol``. Input data to activation function. - :param {'relu', 'sigmoid', 'tanh'}, required act_type: Activation function to be applied. + :param act_type: ``{'relu', 'sigmoid', 'tanh'}, required``. Activation function to be applied. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -25,15 +38,15 @@ Public APIs Apply batch normalization to input. - :param Symbol data: Input data to batch normalization + :param data: ``Symbol``. Input data to batch normalization - :param float, optional, default=1e-10 eps: Epsilon to prevent div 0 + :param eps: ``float, optional, default=1e-10``. Epsilon to prevent div 0 - :param float, optional, default=0.1 momentum: Momentum for moving average + :param momentum: ``float, optional, default=0.1``. Momentum for moving average - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -45,9 +58,9 @@ Public APIs Get output from a symbol and pass 0 gradient back - :param Symbol data: Input data. + :param data: ``Symbol``. Input data. 
- :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -61,9 +74,9 @@ Public APIs This function support variable length positional :class:`Symbol` inputs. - :param int, required num_args: Number of inputs to be concated. + :param num_args: ``int, required``. Number of inputs to be concated. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -75,36 +88,36 @@ Public APIs Apply convolution to input then add a bias. - :param Symbol data: Input data to the ConvolutionOp. + :param data: ``Symbol``. Input data to the ConvolutionOp. - :param Symbol weight: Weight matrix. + :param weight: ``Symbol``. Weight matrix. - :param Symbol bias: Bias parameter. + :param bias: ``Symbol``. Bias parameter. - :param Shape(tuple), required kernel: convolution kernel size: (y, x) + :param kernel: ``Shape(tuple), required``. convolution kernel size: (y, x) - :param Shape(tuple), optional, default=(1, 1) stride: convolution stride: (y, x) + :param stride: ``Shape(tuple), optional, default=(1, 1)``. convolution stride: (y, x) - :param Shape(tuple), optional, default=(0, 0) pad: pad for convolution: (y, x) + :param pad: ``Shape(tuple), optional, default=(0, 0)``. pad for convolution: (y, x) - :param int (non-negative), required num_filter: convolution filter(channel) number + :param num_filter: ``int (non-negative), required``. convolution filter(channel) number - :param int (non-negative), optional, default=1 num_group: number of groups partition + :param num_group: ``int (non-negative), optional, default=1``. 
number of groups partition - :param long (non-negative), optional, default=512 workspace: Tmp workspace for convolution (MB) + :param workspace: ``long (non-negative), optional, default=512``. Tmp workspace for convolution (MB) - :param boolean, optional, default=False no_bias: Whether to disable bias parameter. + :param no_bias: ``boolean, optional, default=False``. Whether to disable bias parameter. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -116,12 +129,12 @@ Public APIs Apply dropout to input - :param Symbol data: Input data to dropout. + :param data: ``Symbol``. Input data to dropout. - :param float, optional, default=0.5 p: Fraction of the input that gets dropped out at training time + :param p: ``float, optional, default=0.5``. Fraction of the input that gets dropped out at training time - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -135,9 +148,9 @@ Public APIs This function support variable length positional :class:`Symbol` inputs. - :param int, required num_args: Number of inputs to be sumed. + :param num_args: ``int, required``. Number of inputs to be sumed. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -149,9 +162,9 @@ Public APIs Flatten input - :param Symbol data: Input data to flatten. + :param data: ``Symbol``. Input data to flatten. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. 
@@ -163,21 +176,21 @@ Public APIs Apply matrix multiplication to input then add a bias. - :param Symbol data: Input data to the FullyConnectedOp. + :param data: ``Symbol``. Input data to the FullyConnectedOp. - :param Symbol weight: Weight matrix. + :param weight: ``Symbol``. Weight matrix. - :param Symbol bias: Bias parameter. + :param bias: ``Symbol``. Bias parameter. - :param int, required num_hidden: Number of hidden nodes of the output. + :param num_hidden: ``int, required``. Number of hidden nodes of the output. - :param boolean, optional, default=False no_bias: Whether to disable bias parameter. + :param no_bias: ``boolean, optional, default=False``. Whether to disable bias parameter. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -189,21 +202,21 @@ Public APIs Apply convolution to input then add a bias. - :param Symbol data: Input data to the ConvolutionOp. + :param data: ``Symbol``. Input data to the ConvolutionOp. - :param float, optional, default=0.0001 alpha: value of the alpha variance scaling parameter in the normalization formula + :param alpha: ``float, optional, default=0.0001``. value of the alpha variance scaling parameter in the normalization formula - :param float, optional, default=0.75 beta: value of the beta power parameter in the normalization formula + :param beta: ``float, optional, default=0.75``. value of the beta power parameter in the normalization formula - :param float, optional, default=2 knorm: value of the k parameter in normalization formula + :param knorm: ``float, optional, default=2``. value of the k parameter in normalization formula - :param int (non-negative), required nsize: normalization window width in elements. + :param nsize: ``int (non-negative), required``. normalization window width in elements. - :param Base.Symbol name: The name of the symbol. (e.g. 
`:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -215,21 +228,21 @@ Public APIs Apply activation function to input. - :param Symbol data: Input data to activation function. + :param data: ``Symbol``. Input data to activation function. - :param {'leaky', 'prelu', 'rrelu'},optional, default='leaky' act_type: Activation function to be applied. + :param act_type: ``{'leaky', 'prelu', 'rrelu'},optional, default='leaky'``. Activation function to be applied. - :param float, optional, default=0.25 slope: Init slope for the activation. (For leaky only) + :param slope: ``float, optional, default=0.25``. Init slope for the activation. (For leaky only) - :param float, optional, default=0.125 lower_bound: Lower bound of random slope. (For rrelu only) + :param lower_bound: ``float, optional, default=0.125``. Lower bound of random slope. (For rrelu only) - :param float, optional, default=0.334 upper_bound: Upper bound of random slope. (For rrelu only) + :param upper_bound: ``float, optional, default=0.334``. Upper bound of random slope. (For rrelu only) - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -241,12 +254,12 @@ Public APIs Use linear regression for final output, this is used on final output of a net. - :param Symbol data: Input data to function. + :param data: ``Symbol``. Input data to function. - :param Symbol label: Input label to function. + :param label: ``Symbol``. Input label to function. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. 
@@ -259,12 +272,12 @@ Public APIs Use Logistic regression for final output, this is used on final output of a net. Logistic regression is suitable for binary classification or probability prediction tasks. - :param Symbol data: Input data to function. + :param data: ``Symbol``. Input data to function. - :param Symbol label: Input label to function. + :param label: ``Symbol``. Input label to function. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -276,21 +289,21 @@ Public APIs Perform spatial pooling on inputs. - :param Symbol data: Input data to the pooling operator. + :param data: ``Symbol``. Input data to the pooling operator. - :param Shape(tuple), required kernel: pooling kernel size: (y, x) + :param kernel: ``Shape(tuple), required``. pooling kernel size: (y, x) - :param {'avg', 'max', 'sum'}, required pool_type: Pooling type to be applied. + :param pool_type: ``{'avg', 'max', 'sum'}, required``. Pooling type to be applied. - :param Shape(tuple), optional, default=(1, 1) stride: stride: for pooling (y, x) + :param stride: ``Shape(tuple), optional, default=(1, 1)``. stride: for pooling (y, x) - :param Shape(tuple), optional, default=(0, 0) pad: pad for pooling: (y, x) + :param pad: ``Shape(tuple), optional, default=(0, 0)``. pad for pooling: (y, x) - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -302,12 +315,12 @@ Public APIs Reshape input to target shape - :param Symbol data: Input data to reshape. + :param data: ``Symbol``. Input data to reshape. - :param Shape(tuple), required target_shape: Target new shape + :param target_shape: ``Shape(tuple), required``. Target new shape - :param Base.Symbol name: The name of the symbol. (e.g. 
`:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -319,9 +332,9 @@ Public APIs Slice channel into many outputs with equally divided channel - :param int, required num_outputs: Number of outputs to be sliced. + :param num_outputs: ``int, required``. Number of outputs to be sliced. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -333,15 +346,15 @@ Public APIs Perform a softmax transformation on input. - :param Symbol data: Input data to softmax. + :param data: ``Symbol``. Input data to softmax. - :param float, optional, default=1 grad_scale: Scale the gradient by a float factor + :param grad_scale: ``float, optional, default=1``. Scale the gradient by a float factor - :param boolean, optional, default=False multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes + :param multi_output: ``boolean, optional, default=False``. If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -353,9 +366,9 @@ Public APIs Take square root of the src - :param Symbol src: Source symbolic input to the function + :param src: ``Symbol``. Source symbolic input to the function - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. 
@@ -367,9 +380,9 @@ Public APIs Take square of the src - :param Symbol src: Source symbolic input to the function + :param src: ``Symbol``. Source symbolic input to the function - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -387,7 +400,7 @@ Internal APIs Perform an elementwise div. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -399,7 +412,7 @@ Internal APIs Perform an elementwise minus. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -411,7 +424,7 @@ Internal APIs Perform an elementwise mul. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -423,7 +436,7 @@ Internal APIs Perform an elementwise plus. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. diff --git a/src/symbol.jl b/src/symbol.jl index 635b4a494c6b..eb29f74594d7 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -1,8 +1,16 @@ export Symbol -################################################################################ -# Symbol Type -################################################################################ +#=doc +.. class:: Symbol + + Symbol is the basic building block of the symbolic graph in MXNet.jl. + + .. 
note:: + + Throughout this documentation, ``Symbol`` always refers to this :class:`Symbol` type. + When we refer to Julia's built-in symbol type (e.g. ``typeof(:foo)``), we always + say ``Base.Symbol``. +=# type Symbol handle :: MX_SymbolHandle end @@ -286,7 +294,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) f_desc *= "This function support variable length positional :class:`Symbol` inputs.\n\n" end f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional.\n\n" + f_desc *= ":param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional.\n\n" f_desc *= ":return: The constructed :class:`Symbol`.\n\n" return (func_name, f_desc) end diff --git a/src/util.jl b/src/util.jl index b3997dbaff45..c51ad598bc5a 100644 --- a/src/util.jl +++ b/src/util.jl @@ -64,7 +64,7 @@ function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{ch arg_type = bytestring(arg_types[i]) arg_desc = bytestring(arg_descs[i]) - push!(docstrings, ":param $arg_type $arg_name: $arg_desc\n\n") + push!(docstrings, ":param $arg_name: ``$arg_type``. $arg_desc\n\n") end return join(docstrings, "\n") end From 091c2349b8a5923f8f0673fe4e4b7ee336be2158 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 27 Oct 2015 00:28:11 -0400 Subject: [PATCH 139/630] add title to symbol doc page --- docs/api/symbol.rst | 6 ++++++ src/symbol.jl | 5 ++++- 2 files changed, 10 insertions(+), 1 deletion(-) diff --git a/docs/api/symbol.rst b/docs/api/symbol.rst index a645d9a13dff..cb73a7d35677 100644 --- a/docs/api/symbol.rst +++ b/docs/api/symbol.rst @@ -1,4 +1,10 @@ +Symbol +====== + + + + .. class:: Symbol Symbol is the basic building block of the symbolic graph in MXNet.jl.
diff --git a/src/symbol.jl b/src/symbol.jl index eb29f74594d7..3c0109c35e17 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -1,4 +1,7 @@ -export Symbol +#=doc +Symbol +====== +=# #=doc .. class:: Symbol From 54e621e79b309d0c0c185858948e7f920a67782a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 27 Oct 2015 00:39:00 -0400 Subject: [PATCH 140/630] prepare for v0.0.3 --- NEWS.md | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/NEWS.md b/NEWS.md index 53c3f2e5418d..84858e3aca13 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,15 @@ +# v0.0.3 (2015.10.27) + +* Model prediction API. +* Model checkpoint loading and saving. +* IJulia Notebook example of using pre-trained imagenet model as classifier. +* Symbol saving and loading. +* NDArray saving and loading. +* Optimizer gradient clipping. +* Model training callback APIs, default checkpoint and speedometer callbacks. +* Julia Array / NDArray data iterator. +* Sphinx documentation system and documents for dynamically imported libmxnet APIs. + # v0.0.2 (2015.10.23) * Fix a bug in build script that causes Julia REPL to exit. From cadee3af2eaef4e41df8b9d3069c3d919066640a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 27 Oct 2015 10:48:01 -0400 Subject: [PATCH 141/630] better type annotation in docs.
--- docs/api/model.rst | 111 +++++++++++++++++++++++ docs/api/ndarray.rst | 104 ++++++++++++++-------- docs/api/symbol.rst | 205 ++++++++++++++++++++++++++---------------- docs/build-api.jl | 2 + docs/index.rst | 1 + src/model.jl | 206 ++++++++++++++++++++++++++++++------------- src/ndarray.jl | 5 +- src/symbol.jl | 2 +- src/util.jl | 2 +- 9 files changed, 462 insertions(+), 176 deletions(-) create mode 100644 docs/api/model.rst diff --git a/docs/api/model.rst b/docs/api/model.rst new file mode 100644 index 000000000000..266e4162ef33 --- /dev/null +++ b/docs/api/model.rst @@ -0,0 +1,111 @@ + +Model +===== + +The model API provides convenient high-level interface to do training and predicting on +a network described using the symbolic API. + + + + +.. class:: AbstractModel + + The abstract super type of all models in MXNet.jl. + + + + +.. class:: FeedForward + + The feedforward model provides convenient interface to train and predict on + feedforward architectures like multi-layer MLP, ConvNets, etc. There is no + explicitly handling of *time index*, but it is relatively easy to implement + unrolled RNN / LSTM under this framework (**TODO**: add example). For models + that handles sequential data explicitly, please use **TODO**... + + + + +.. function:: FeedForward(arch :: Symbol, ctx) + + :param arch: the architecture of the network constructed using the symbolic API. + :param ctx: the devices on which this model should do computation. It could be a single :class:`Context` + or a list of :class:`Context` objects. In the latter case, data parallelization will be used + for training. If no context is provided, the default context ``cpu()`` will be used. + + + + +.. function:: init_model(self, initializer; overwrite=false, input_shapes...) + + Initialize the weights in the model. + + This method will be called automatically when training a model. 
So there is usually no + need to call this method unless one needs to inspect a model with only randomly initialized + weights. + + :param FeedForward self: the model to be initialized. + :param AbstractInitializer initializer: an initializer describing how the weights should be initialized. + :param Bool overwrite: keyword argument, force initialization even when weights already exists. + :param input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. + For example, ``data=(28,28,1,100), label=(100,)``. + + + + +.. function:: + predict(self, data; overwrite=false, callback=nothing) + + Predict using an existing model. The model should be already initialized, or trained or loaded from + a checkpoint. There is an overloaded function that allows to pass the callback as the first argument, + so it is possible to do + + .. code-block:: julia + + predict(model, data) do batch_output + # consume or write batch_output to file + end + + :param FeedForward self: the model. + :param AbstractDataProvider data: the data to perform prediction on. + :param Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory + allocation of the :class:`Executor` depends on the mini-batch size of the test + data provider. If you call predict twice with data provider of the same batch-size, + then the executor can be re-used. Otherwise, if ``overwrite`` is false (default), + an error will be raised; if ``overwrite`` is set to true, a new :class:`Executor` + will be created to replace the old one. + + .. note:: + + Prediction is computationally much less costly than training, so the bottleneck sometimes becomes the IO + for copying mini-batches of data. Since there is no concern about convergence in prediction, it is better + to set the mini-batch size as large as possible (limited by your device memory) if prediction speed is a + concern. 
+ + For the same reason, currently prediction will only use the first device even if multiple devices are + provided to construct the model. + + :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` + + + + +.. function:: train(model :: FeedForward, ...) + + Alias to :func:`fit`. + + + + +.. function:: fit(model :: FeedForward, optimizer, data; kwargs...) + + Train the ``model`` on ``data`` with the ``optimizer``. + + :param FeedForward model: the model to be trained. + :param AbstractOptimizer optimizer: the optimization algorithm to use. + :param AbstractDataProvider data: the training data provider. + :param Int n_epoch: default 10, the number of full data-passes to run. + :param AbstractOptimizer: + + + diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index 3f8404afd7e5..d3ca98574596 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -323,8 +323,9 @@ IO Save NDarrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built with corresponding support. - :param filename: path to the binary file to write to. - :param data: an :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. + :param AbstractString filename: path to the binary file to write to. + :param data: data to save to file. + :type data: :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. @@ -367,10 +368,12 @@ Public APIs Choose one element from each line(row for python, column for R/Julia) in lhs according to index indicated by rhs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``NDArray``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: NDArray @@ -380,13 +383,16 @@ Public APIs Clip ndarray elements to range (a_min, a_max) - :param src: ``NDArray``. Source input + :param src: Source input + :type src: NDArray - :param a_min: ``real_t``. 
Minimum value + :param a_min: Minimum value + :type a_min: real_t - :param a_max: ``real_t``. Maximum value + :param a_max: Maximum value + :type a_max: real_t @@ -396,10 +402,12 @@ Public APIs Calcuate 2D matrix multiplication - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``NDArray``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: NDArray @@ -409,7 +417,8 @@ Public APIs Take square root of the src - :param src: ``NDArray``. Source input to the function + :param src: Source input to the function + :type src: NDArray @@ -419,7 +428,8 @@ Public APIs Take square of the src - :param src: ``NDArray``. Source input to the function + :param src: Source input to the function + :type src: NDArray @@ -435,7 +445,8 @@ Internal APIs - :param src: ``NDArray``. Source input to the function. + :param src: Source input to the function. + :type src: NDArray @@ -445,10 +456,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``NDArray``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: NDArray @@ -458,10 +471,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``real_t``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: real_t @@ -471,10 +486,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``NDArray``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: NDArray @@ -484,10 +501,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. 
+ :type lhs: NDArray - :param rhs: ``real_t``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: real_t @@ -497,10 +516,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``NDArray``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: NDArray @@ -510,10 +531,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``real_t``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: real_t @@ -523,10 +546,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``NDArray``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: NDArray @@ -536,10 +561,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``NDArray``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: NDArray @@ -549,10 +576,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``real_t``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: real_t @@ -578,10 +607,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. + :type lhs: NDArray - :param rhs: ``real_t``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: real_t @@ -591,10 +622,12 @@ Internal APIs - :param lhs: ``NDArray``. Left operand to the function. + :param lhs: Left operand to the function. 
+ :type lhs: NDArray - :param rhs: ``real_t``. Right operand to the function. + :param rhs: Right operand to the function. + :type rhs: real_t @@ -604,7 +637,8 @@ Internal APIs - :param src: ``real_t``. Source input to the function. + :param src: Source input to the function. + :type src: real_t diff --git a/docs/api/symbol.rst b/docs/api/symbol.rst index cb73a7d35677..914535f210de 100644 --- a/docs/api/symbol.rst +++ b/docs/api/symbol.rst @@ -27,12 +27,14 @@ Public APIs Apply activation function to input. - :param data: ``Symbol``. Input data to activation function. + :param data: Input data to activation function. + :type data: Symbol - :param act_type: ``{'relu', 'sigmoid', 'tanh'}, required``. Activation function to be applied. + :param act_type: Activation function to be applied. + :type act_type: {'relu', 'sigmoid', 'tanh'}, required - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -44,15 +46,18 @@ Public APIs Apply batch normalization to input. - :param data: ``Symbol``. Input data to batch normalization + :param data: Input data to batch normalization + :type data: Symbol - :param eps: ``float, optional, default=1e-10``. Epsilon to prevent div 0 + :param eps: Epsilon to prevent div 0 + :type eps: float, optional, default=1e-10 - :param momentum: ``float, optional, default=0.1``. Momentum for moving average + :param momentum: Momentum for moving average + :type momentum: float, optional, default=0.1 - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -64,9 +69,10 @@ Public APIs Get output from a symbol and pass 0 gradient back - :param data: ``Symbol``. Input data. + :param data: Input data. + :type data: Symbol - :param name: ``Base.Symbol``. 
The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -80,9 +86,10 @@ Public APIs This function support variable length positional :class:`Symbol` inputs. - :param num_args: ``int, required``. Number of inputs to be concated. + :param num_args: Number of inputs to be concated. + :type num_args: int, required - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -94,36 +101,46 @@ Public APIs Apply convolution to input then add a bias. - :param data: ``Symbol``. Input data to the ConvolutionOp. + :param data: Input data to the ConvolutionOp. + :type data: Symbol - :param weight: ``Symbol``. Weight matrix. + :param weight: Weight matrix. + :type weight: Symbol - :param bias: ``Symbol``. Bias parameter. + :param bias: Bias parameter. + :type bias: Symbol - :param kernel: ``Shape(tuple), required``. convolution kernel size: (y, x) + :param kernel: convolution kernel size: (y, x) + :type kernel: Shape(tuple), required - :param stride: ``Shape(tuple), optional, default=(1, 1)``. convolution stride: (y, x) + :param stride: convolution stride: (y, x) + :type stride: Shape(tuple), optional, default=(1, 1) - :param pad: ``Shape(tuple), optional, default=(0, 0)``. pad for convolution: (y, x) + :param pad: pad for convolution: (y, x) + :type pad: Shape(tuple), optional, default=(0, 0) - :param num_filter: ``int (non-negative), required``. convolution filter(channel) number + :param num_filter: convolution filter(channel) number + :type num_filter: int (non-negative), required - :param num_group: ``int (non-negative), optional, default=1``. 
number of groups partition + :param num_group: number of groups partition + :type num_group: int (non-negative), optional, default=1 - :param workspace: ``long (non-negative), optional, default=512``. Tmp workspace for convolution (MB) + :param workspace: Tmp workspace for convolution (MB) + :type workspace: long (non-negative), optional, default=512 - :param no_bias: ``boolean, optional, default=False``. Whether to disable bias parameter. + :param no_bias: Whether to disable bias parameter. + :type no_bias: boolean, optional, default=False - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -135,12 +152,14 @@ Public APIs Apply dropout to input - :param data: ``Symbol``. Input data to dropout. + :param data: Input data to dropout. + :type data: Symbol - :param p: ``float, optional, default=0.5``. Fraction of the input that gets dropped out at training time + :param p: Fraction of the input that gets dropped out at training time + :type p: float, optional, default=0.5 - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -154,9 +173,10 @@ Public APIs This function support variable length positional :class:`Symbol` inputs. - :param num_args: ``int, required``. Number of inputs to be sumed. + :param num_args: Number of inputs to be sumed. + :type num_args: int, required - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -168,9 +188,10 @@ Public APIs Flatten input - :param data: ``Symbol``. Input data to flatten. + :param data: Input data to flatten. + :type data: Symbol - :param name: ``Base.Symbol``. 
The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -182,21 +203,26 @@ Public APIs Apply matrix multiplication to input then add a bias. - :param data: ``Symbol``. Input data to the FullyConnectedOp. + :param data: Input data to the FullyConnectedOp. + :type data: Symbol - :param weight: ``Symbol``. Weight matrix. + :param weight: Weight matrix. + :type weight: Symbol - :param bias: ``Symbol``. Bias parameter. + :param bias: Bias parameter. + :type bias: Symbol - :param num_hidden: ``int, required``. Number of hidden nodes of the output. + :param num_hidden: Number of hidden nodes of the output. + :type num_hidden: int, required - :param no_bias: ``boolean, optional, default=False``. Whether to disable bias parameter. + :param no_bias: Whether to disable bias parameter. + :type no_bias: boolean, optional, default=False - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -208,21 +234,26 @@ Public APIs Apply convolution to input then add a bias. - :param data: ``Symbol``. Input data to the ConvolutionOp. + :param data: Input data to the ConvolutionOp. + :type data: Symbol - :param alpha: ``float, optional, default=0.0001``. value of the alpha variance scaling parameter in the normalization formula + :param alpha: value of the alpha variance scaling parameter in the normalization formula + :type alpha: float, optional, default=0.0001 - :param beta: ``float, optional, default=0.75``. value of the beta power parameter in the normalization formula + :param beta: value of the beta power parameter in the normalization formula + :type beta: float, optional, default=0.75 - :param knorm: ``float, optional, default=2``. 
value of the k parameter in normalization formula + :param knorm: value of the k parameter in normalization formula + :type knorm: float, optional, default=2 - :param nsize: ``int (non-negative), required``. normalization window width in elements. + :param nsize: normalization window width in elements. + :type nsize: int (non-negative), required - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -234,21 +265,26 @@ Public APIs Apply activation function to input. - :param data: ``Symbol``. Input data to activation function. + :param data: Input data to activation function. + :type data: Symbol - :param act_type: ``{'leaky', 'prelu', 'rrelu'},optional, default='leaky'``. Activation function to be applied. + :param act_type: Activation function to be applied. + :type act_type: {'leaky', 'prelu', 'rrelu'},optional, default='leaky' - :param slope: ``float, optional, default=0.25``. Init slope for the activation. (For leaky only) + :param slope: Init slope for the activation. (For leaky only) + :type slope: float, optional, default=0.25 - :param lower_bound: ``float, optional, default=0.125``. Lower bound of random slope. (For rrelu only) + :param lower_bound: Lower bound of random slope. (For rrelu only) + :type lower_bound: float, optional, default=0.125 - :param upper_bound: ``float, optional, default=0.334``. Upper bound of random slope. (For rrelu only) + :param upper_bound: Upper bound of random slope. (For rrelu only) + :type upper_bound: float, optional, default=0.334 - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -260,12 +296,14 @@ Public APIs Use linear regression for final output, this is used on final output of a net. - :param data: ``Symbol``. 
Input data to function. + :param data: Input data to function. + :type data: Symbol - :param label: ``Symbol``. Input label to function. + :param label: Input label to function. + :type label: Symbol - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -278,12 +316,14 @@ Public APIs Use Logistic regression for final output, this is used on final output of a net. Logistic regression is suitable for binary classification or probability prediction tasks. - :param data: ``Symbol``. Input data to function. + :param data: Input data to function. + :type data: Symbol - :param label: ``Symbol``. Input label to function. + :param label: Input label to function. + :type label: Symbol - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -295,21 +335,26 @@ Public APIs Perform spatial pooling on inputs. - :param data: ``Symbol``. Input data to the pooling operator. + :param data: Input data to the pooling operator. + :type data: Symbol - :param kernel: ``Shape(tuple), required``. pooling kernel size: (y, x) + :param kernel: pooling kernel size: (y, x) + :type kernel: Shape(tuple), required - :param pool_type: ``{'avg', 'max', 'sum'}, required``. Pooling type to be applied. + :param pool_type: Pooling type to be applied. + :type pool_type: {'avg', 'max', 'sum'}, required - :param stride: ``Shape(tuple), optional, default=(1, 1)``. stride: for pooling (y, x) + :param stride: stride: for pooling (y, x) + :type stride: Shape(tuple), optional, default=(1, 1) - :param pad: ``Shape(tuple), optional, default=(0, 0)``. pad for pooling: (y, x) + :param pad: pad for pooling: (y, x) + :type pad: Shape(tuple), optional, default=(0, 0) - :param name: ``Base.Symbol``. 
The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -321,12 +366,14 @@ Public APIs Reshape input to target shape - :param data: ``Symbol``. Input data to reshape. + :param data: Input data to reshape. + :type data: Symbol - :param target_shape: ``Shape(tuple), required``. Target new shape + :param target_shape: Target new shape + :type target_shape: Shape(tuple), required - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -338,9 +385,10 @@ Public APIs Slice channel into many outputs with equally divided channel - :param num_outputs: ``int, required``. Number of outputs to be sliced. + :param num_outputs: Number of outputs to be sliced. + :type num_outputs: int, required - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -352,15 +400,18 @@ Public APIs Perform a softmax transformation on input. - :param data: ``Symbol``. Input data to softmax. + :param data: Input data to softmax. + :type data: Symbol - :param grad_scale: ``float, optional, default=1``. Scale the gradient by a float factor + :param grad_scale: Scale the gradient by a float factor + :type grad_scale: float, optional, default=1 - :param multi_output: ``boolean, optional, default=False``. If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes + :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes + :type multi_output: boolean, optional, default=False - :param name: ``Base.Symbol``. The name of the symbol. 
(e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -372,9 +423,10 @@ Public APIs Take square root of the src - :param src: ``Symbol``. Source symbolic input to the function + :param src: Source symbolic input to the function + :type src: Symbol - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -386,9 +438,10 @@ Public APIs Take square of the src - :param src: ``Symbol``. Source symbolic input to the function + :param src: Source symbolic input to the function + :type src: Symbol - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -406,7 +459,7 @@ Internal APIs Perform an elementwise div. - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -418,7 +471,7 @@ Internal APIs Perform an elementwise minus. - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -430,7 +483,7 @@ Internal APIs Perform an elementwise mul. - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. :return: The constructed :class:`Symbol`. @@ -442,7 +495,7 @@ Internal APIs Perform an elementwise plus. - :param name: ``Base.Symbol``. The name of the symbol. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. 
:return: The constructed :class:`Symbol`. diff --git a/docs/build-api.jl b/docs/build-api.jl index b70cbd94615b..46adc3fa59ce 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -72,3 +72,5 @@ embed_mxnet_api("ndarray.rst", "ndarray", mx._import_ndarray_functions) extract_doc("symbol.rst", "symbol.jl") embed_mxnet_api("symbol.rst", "symbol", mx._import_atomic_symbol_creators) + +extract_doc("model.rst", "model.jl") diff --git a/docs/index.rst b/docs/index.rst index adc4ef8d658c..58d0e43c38fa 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -31,6 +31,7 @@ For more details, see documentation below. Please also checkout the `examples :maxdepth: 1 :caption: API Documentation + api/model api/ndarray api/symbol diff --git a/src/model.jl b/src/model.jl index 84b581b00b09..f21e42ed6f2e 100644 --- a/src/model.jl +++ b/src/model.jl @@ -1,5 +1,27 @@ +#=doc +Model +===== + +The model API provides convenient high-level interface to do training and predicting on +a network described using the symbolic API. +=# + +#=doc +.. class:: AbstractModel + + The abstract super type of all models in MXNet.jl. +=# abstract AbstractModel +#=doc +.. class:: FeedForward + + The feedforward model provides convenient interface to train and predict on + feedforward architectures like multi-layer MLP, ConvNets, etc. There is no + explicitly handling of *time index*, but it is relatively easy to implement + unrolled RNN / LSTM under this framework (**TODO**: add example). For models + that handles sequential data explicitly, please use **TODO**... +=# type FeedForward <: AbstractModel arch :: Symbol ctx :: Vector{Context} @@ -29,6 +51,14 @@ function _split_inputs(batch_size :: Int, n_split :: Int) return idx end +#=doc +.. function:: FeedForward(arch :: Symbol, ctx) + + :param arch: the architecture of the network constructed using the symbolic API. + :param ctx: the devices on which this model should do computation. 
It could be a single :class:`Context` + or a list of :class:`Context` objects. In the latter case, data parallelization will be used + for training. If no context is provided, the default context ``cpu()`` will be used. +=# function FeedForward(arch :: Symbol; context :: Union{Context, Vector{Context}, Void} = nothing) if isa(context, Void) context = [Context(CPU)] @@ -38,19 +68,21 @@ function FeedForward(arch :: Symbol; context :: Union{Context, Vector{Context}, FeedForward(arch, context) end -"""Initialize the weights in the model. +#=doc +.. function:: init_model(self, initializer; overwrite=false, input_shapes...) -This method will be called automatically when training a model. So there is usually no -need to call this method unless one needs to inspect a model with only randomly initialized -weights. + Initialize the weights in the model. -**Parameters** + This method will be called automatically when training a model. So there is usually no + need to call this method unless one needs to inspect a model with only randomly initialized + weights. -* `self`: the model to be initialized -* `initializer`: an `AbstractInitializer` -* `overwrite`: keyword argument, force initialization even when weights already exists -* `input_shapes`: the shape of all data and label inputs to this model, given as keyword arguments. -""" + :param FeedForward self: the model to be initialized. + :param AbstractInitializer initializer: an initializer describing how the weights should be initialized. + :param Bool overwrite: keyword argument, force initialization even when weights already exists. + :param input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. + For example, ``data=(28,28,1,100), label=(100,)``. +=# function init_model(self :: FeedForward, initializer :: AbstractInitializer; overwrite::Bool=false, input_shapes...) 
# all arg names, including data, label, and parameters arg_names = list_arguments(self.arch) @@ -89,57 +121,6 @@ function init_model(self :: FeedForward, initializer :: AbstractInitializer; ove return (arg_names, param_names, aux_names) end -function _init_model(self :: FeedForward, data :: AbstractDataProvider, initializer :: AbstractInitializer, overwrite :: Bool) - init_model(self, initializer; overwrite=overwrite, [provide_data(data)..., provide_label(data)...]...) -end - -function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) - if num_device == 1 && !ismatch(r"dist", string(kv_type)) - kv = nothing - else - if kv_type == :local - max_size = maximum([prod(size(param)) for (k,param) in arg_params]) - if max_size < 1024 * 1024 * 16 - kv_type = :local_update_cpu - else - kv_type = :local_allreduce_cpu - end - info("Auto-select kvstore type = $kv_type") - end - kv = KVStore(kv_type) - end - - update_on_kvstore = true - if isa(kv, Void) || ismatch(r"local_allreduce", string(get_type(kv))) - update_on_kvstore = false - end - - return (kv, update_on_kvstore) -end - -@defstruct TrainingOptions Any ( - initializer :: AbstractInitializer = UniformInitializer(0.01), - n_epoch :: Int = 10, - eval_data :: Union{Void, AbstractDataProvider} = nothing, - eval_metric :: AbstractEvalMetric = Accuracy(), - kvstore :: Union{Base.Symbol, KVStore} = :local, - force_init :: Bool = false, - callbacks :: Vector{AbstractCallback} = AbstractCallback[], -) - -function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, param::CallbackParams, type_filter::Type) - map(callbacks) do cb - if isa(cb, type_filter) - if type_filter == AbstractEpochCallback - # epoch callback have extra access to the model object - cb(self, param) - else - cb(param) - end - end - end -end - function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_shapes...) 
if !isdefined(self, :pred_exec) || isa(self.pred_exec, Void) || overwrite if !isdefined(self, :arg_params) || !isdefined(self, :aux_params) @@ -158,6 +139,41 @@ function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_sha end end +#=doc +.. function:: + predict(self, data; overwrite=false, callback=nothing) + + Predict using an existing model. The model should be already initialized, or trained or loaded from + a checkpoint. There is an overloaded function that allows to pass the callback as the first argument, + so it is possible to do + + .. code-block:: julia + + predict(model, data) do batch_output + # consume or write batch_output to file + end + + :param FeedForward self: the model. + :param AbstractDataProvider data: the data to perform prediction on. + :param Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory + allocation of the :class:`Executor` depends on the mini-batch size of the test + data provider. If you call predict twice with data provider of the same batch-size, + then the executor can be re-used. Otherwise, if ``overwrite`` is false (default), + an error will be raised; if ``overwrite`` is set to true, a new :class:`Executor` + will be created to replace the old one. + + .. note:: + + Prediction is computationally much less costly than training, so the bottleneck sometimes becomes the IO + for copying mini-batches of data. Since there is no concern about convergence in prediction, it is better + to set the mini-batch size as large as possible (limited by your device memory) if prediction speed is a + concern. + + For the same reason, currently prediction will only use the first device even if multiple devices are + provided to construct the model. 
+ + :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` +=# function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = false) predict(self, data; overwrite = overwrite, callback=callback) end @@ -209,9 +225,77 @@ function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::B return output_arrays end +function _init_model(self :: FeedForward, data :: AbstractDataProvider, initializer :: AbstractInitializer, overwrite :: Bool) + init_model(self, initializer; overwrite=overwrite, [provide_data(data)..., provide_label(data)...]...) +end + +function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) + if num_device == 1 && !ismatch(r"dist", string(kv_type)) + kv = nothing + else + if kv_type == :local + max_size = maximum([prod(size(param)) for (k,param) in arg_params]) + if max_size < 1024 * 1024 * 16 + kv_type = :local_update_cpu + else + kv_type = :local_allreduce_cpu + end + info("Auto-select kvstore type = $kv_type") + end + kv = KVStore(kv_type) + end + + update_on_kvstore = true + if isa(kv, Void) || ismatch(r"local_allreduce", string(get_type(kv))) + update_on_kvstore = false + end + + return (kv, update_on_kvstore) +end + +@defstruct TrainingOptions Any ( + initializer :: AbstractInitializer = UniformInitializer(0.01), + n_epoch :: Int = 10, + eval_data :: Union{Void, AbstractDataProvider} = nothing, + eval_metric :: AbstractEvalMetric = Accuracy(), + kvstore :: Union{Base.Symbol, KVStore} = :local, + force_init :: Bool = false, + callbacks :: Vector{AbstractCallback} = AbstractCallback[], +) + +function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, param::CallbackParams, type_filter::Type) + map(callbacks) do cb + if isa(cb, type_filter) + if type_filter == AbstractEpochCallback + # epoch callback have extra access to the model object + cb(self, param) + else + cb(param) + end + end + 
end +end + +#=doc +.. function:: train(model :: FeedForward, ...) + + Alias to :func:`fit`. +=# function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) fit(self, optimizer, data; kwargs...) end + +#=doc +.. function:: fit(model :: FeedForward, optimizer, data; kwargs...) + + Train the ``model`` on ``data`` with the ``optimizer``. + + :param FeedForward model: the model to be trained. + :param AbstractOptimizer optimizer: the optimization algorithm to use. + :param AbstractDataProvider data: the training data provider. + :param Int n_epoch: default 10, the number of full data-passes to run. + :param AbstractOptimizer: +=# function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) opts = TrainingOptions(; kwargs...) diff --git a/src/ndarray.jl b/src/ndarray.jl index eb82e06ec294..db2b300bdebc 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -615,8 +615,9 @@ end Save NDarrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built with corresponding support. - :param filename: path to the binary file to write to. - :param data: an :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. + :param AbstractString filename: path to the binary file to write to. + :param data: data to save to file. + :type data: :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. =# function save(filename::AbstractString, data::NDArray) save(filename, [data]) diff --git a/src/symbol.jl b/src/symbol.jl index 3c0109c35e17..14adb56f0473 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -297,7 +297,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) f_desc *= "This function support variable length positional :class:`Symbol` inputs.\n\n" end f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param name: ``Base.Symbol``. 
The name of the symbol. (e.g. `:my_symbol`), optional.\n\n" + f_desc *= ":param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional.\n\n" f_desc *= ":return: The constructed :class:`Symbol`.\n\n" return (func_name, f_desc) end diff --git a/src/util.jl b/src/util.jl index c51ad598bc5a..4ca613cbf7d1 100644 --- a/src/util.jl +++ b/src/util.jl @@ -64,7 +64,7 @@ function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{ch arg_type = bytestring(arg_types[i]) arg_desc = bytestring(arg_descs[i]) - push!(docstrings, ":param $arg_name: ``$arg_type``. $arg_desc\n\n") + push!(docstrings, ":param $arg_name: $arg_desc\n:type $arg_name: $arg_type\n\n") end return join(docstrings, "\n") end From 1b62ddf7b4af8b5a0322b13c34a686d4b50feea2 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 27 Oct 2015 11:10:27 -0400 Subject: [PATCH 142/630] more docs. --- docs/api/callback.rst | 27 +++++++++++++++++++++++++++ docs/api/initializer.rst | 27 +++++++++++++++++++++++++++ docs/api/model.rst | 21 ++++++++++++++++++--- docs/api/ndarray.rst | 4 ++-- docs/api/symbol.rst | 4 ++-- docs/build-api.jl | 2 ++ docs/index.rst | 2 ++ src/callback.jl | 23 ++++++++++++++++++++--- src/initializer.jl | 20 ++++++++++++++++++++ src/model.jl | 21 ++++++++++++++++++--- src/ndarray.jl | 4 ++-- src/symbol.jl | 4 ++-- 12 files changed, 142 insertions(+), 17 deletions(-) create mode 100644 docs/api/callback.rst create mode 100644 docs/api/initializer.rst diff --git a/docs/api/callback.rst b/docs/api/callback.rst new file mode 100644 index 000000000000..56ab1fbb7074 --- /dev/null +++ b/docs/api/callback.rst @@ -0,0 +1,27 @@ + +Callbacks in training +===================== + + + + +.. class:: AbstractCallback + + Abstract type of callback functions used in training. + + + + +.. class:: AbstractIterationCallback + + Abstract type of callbacks to be called every mini-batch. + + + + +.. class:: AbstractEpochCallback + + Abstract type of callbacks to be called every epoch. 
+ + + diff --git a/docs/api/initializer.rst b/docs/api/initializer.rst new file mode 100644 index 000000000000..63e1a231b187 --- /dev/null +++ b/docs/api/initializer.rst @@ -0,0 +1,27 @@ + +Built-in Initializers +===================== + + + + +.. class:: AbstractInitializer + + The abstract base class for all initializers. + + + + +.. class:: UniformInitializer + + Initialize weights according to a uniform distribution within the provided scale. + + + + +.. class:: NormalInitializer + + Initialize weights according to a univariate Gaussian distribution. + + + diff --git a/docs/api/model.rst b/docs/api/model.rst index 266e4162ef33..e9a8ee5a0a63 100644 --- a/docs/api/model.rst +++ b/docs/api/model.rst @@ -1,6 +1,6 @@ -Model -===== +Built-in Models and Interface +============================= The model API provides convenient high-level interface to do training and predicting on a network described using the symbolic API. @@ -105,7 +105,22 @@ a network described using the symbolic API. :param AbstractOptimizer optimizer: the optimization algorithm to use. :param AbstractDataProvider data: the training data provider. :param Int n_epoch: default 10, the number of full data-passes to run. - :param AbstractOptimizer: + :param AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for + the validation set. + :param AbstractEvalMetric eval_metric: keyword argument, default :class:`Accuracy`. The metric used + to evaluate the training performance. If ``eval_data`` is provided, the same metric is also + calculated on the validation set. + :param kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients + and parameters when multiple devices are used for training. + :type kvstore: :class:`KVStore` or ``Base.Symbol`` + :param AbstractInitializer initializer: keyword argument, default :class:`UniformInitializer(0.01)`. + :param Bool force_init: keyword argument, default false. 
By default, the random initialization using the + provided ``initializer`` will be skipped if the model weights already exists, maybe from a previous + call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When + this option is set, it will always do random initialization at the beginning of training. + :param callbacks: keyword argument, default ``[]``. Callbacks to be invoked at each epoch or mini-batch, + see :class:`AbstractCallback`. + :type callbacks: ``Vector{AbstractCallback}`` diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index d3ca98574596..8ac5e9bda8f0 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -1,6 +1,6 @@ -NDArray -======= +NDArray API +=========== diff --git a/docs/api/symbol.rst b/docs/api/symbol.rst index 914535f210de..604fadc0f43d 100644 --- a/docs/api/symbol.rst +++ b/docs/api/symbol.rst @@ -1,6 +1,6 @@ -Symbol -====== +Symbolic API +============ diff --git a/docs/build-api.jl b/docs/build-api.jl index 46adc3fa59ce..29f99369d431 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -73,4 +73,6 @@ embed_mxnet_api("ndarray.rst", "ndarray", mx._import_ndarray_functions) extract_doc("symbol.rst", "symbol.jl") embed_mxnet_api("symbol.rst", "symbol", mx._import_atomic_symbol_creators) +extract_doc("initializer.rst", "initializer.jl") +extract_doc("callback.rst", "callback.jl") extract_doc("model.rst", "model.jl") diff --git a/docs/index.rst b/docs/index.rst index 58d0e43c38fa..cf44dc197b2d 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -32,6 +32,8 @@ For more details, see documentation below. 
Please also checkout the `examples :caption: API Documentation api/model + api/callback + api/initializer api/ndarray api/symbol diff --git a/src/callback.jl b/src/callback.jl index 049f19432981..14406add7006 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -1,10 +1,27 @@ -"Abstract type of callback functions used in training" +#=doc +Callbacks in training +===================== +=# + +#=doc +.. class:: AbstractCallback + + Abstract type of callback functions used in training. +=# abstract AbstractCallback -"Abstract type of callbacks to be called every mini-batch" +#=doc +.. class:: AbstractIterationCallback + + Abstract type of callbacks to be called every mini-batch. +=# abstract AbstractIterationCallback <: AbstractCallback -"Abstract type of callbacks to be called every epoch" +#=doc +.. class:: AbstractEpochCallback + + Abstract type of callbacks to be called every epoch. +=# abstract AbstractEpochCallback <: AbstractCallback type CallbackParams diff --git a/src/initializer.jl b/src/initializer.jl index 502baf2189e1..3f830860f586 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -1,3 +1,13 @@ +#=doc +Built-in Initializers +===================== +=# + +#=doc +.. class:: AbstractInitializer + + The abstract base class for all initializers. +=# abstract AbstractInitializer function call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) @@ -32,6 +42,11 @@ function _init_zero(self :: AbstractInitializer, name :: Base.Symbol, array :: N array[:] = 0 end +#=doc +.. class:: UniformInitializer + + Initialize weights according to a uniform distribution within the provided scale. +=# immutable UniformInitializer <: AbstractInitializer scale :: AbstractFloat end @@ -41,6 +56,11 @@ function _init_weight(self :: UniformInitializer, name :: Base.Symbol, array :: rand!(-self.scale, self.scale, array) end +#=doc +.. class:: NormalInitializer + + Initialize weights according to a univariate Gaussian distribution. 
+=# immutable NormalInitializer <: AbstractInitializer μ :: AbstractFloat σ :: AbstractFloat diff --git a/src/model.jl b/src/model.jl index f21e42ed6f2e..f28fd0d9f5af 100644 --- a/src/model.jl +++ b/src/model.jl @@ -1,6 +1,6 @@ #=doc -Model -===== +Built-in Models and Interface +============================= The model API provides convenient high-level interface to do training and predicting on a network described using the symbolic API. @@ -294,7 +294,22 @@ end :param AbstractOptimizer optimizer: the optimization algorithm to use. :param AbstractDataProvider data: the training data provider. :param Int n_epoch: default 10, the number of full data-passes to run. - :param AbstractOptimizer: + :param AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for + the validation set. + :param AbstractEvalMetric eval_metric: keyword argument, default ``Accuracy()``. The metric used + to evaluate the training performance. If ``eval_data`` is provided, the same metric is also + calculated on the validation set. + :param kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients + and parameters when multiple devices are used for training. + :type kvstore: :class:`KVStore` or ``Base.Symbol`` + :param AbstractInitializer initializer: keyword argument, default ``UniformInitializer(0.01)``. + :param Bool force_init: keyword argument, default false. By default, the random initialization using the + provided ``initializer`` will be skipped if the model weights already exists, maybe from a previous + call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When + this option is set, it will always do random initialization at the beginning of training. + :param callbacks: keyword argument, default ``[]``. Callbacks to be invoked at each epoch or mini-batch, + see :class:`AbstractCallback`. 
+ :type callbacks: ``Vector{AbstractCallback}`` =# function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) opts = TrainingOptions(; kwargs...) diff --git a/src/ndarray.jl b/src/ndarray.jl index db2b300bdebc..347346e6751a 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,6 +1,6 @@ #=doc -NDArray -======= +NDArray API +=========== =# # create a NDArray handle of specific shape diff --git a/src/symbol.jl b/src/symbol.jl index 14adb56f0473..4c656cfedacb 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -1,6 +1,6 @@ #=doc -Symbol -====== +Symbolic API +============ =# #=doc From d19f28fc3d14c9c141b2bc9cc9c3e5c899e2d227 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 27 Oct 2015 11:25:01 -0400 Subject: [PATCH 143/630] docs for built-in callbacks --- docs/api/callback.rst | 65 +++++++++++++++++++++++++++++++++++++++++++ docs/api/model.rst | 4 +-- src/callback.jl | 59 ++++++++++++++++++++++++++++++++++++++- 3 files changed, 125 insertions(+), 3 deletions(-) diff --git a/docs/api/callback.rst b/docs/api/callback.rst index 56ab1fbb7074..ac1c8f36b862 100644 --- a/docs/api/callback.rst +++ b/docs/api/callback.rst @@ -25,3 +25,68 @@ Callbacks in training + +.. function:: every_n_iter(callback :: Function, n :: Int; call_on_0 = false) + + A convenient function to construct a callback that runs every ``n`` mini-batches. + + :param Int call_on_0: keyword argument, default false. Unless set, the callback + will **not** be run on iteration 0. + + For example, the :func:`speedometer` callback is defined as + + .. code-block:: julia + + every_n_iter(frequency, call_on_0=true) do param :: CallbackParams + if param.curr_iter == 0 + # reset timer + else + # compute and print speed + end + end + + :seealso: :func:`every_n_epoch`, :func:`speedometer`. + + + + +.. 
function:: speedometer(; frequency=50) + + Create an :class:`AbstractIterationCallback` that measures the training speed + (number of samples processed per second) every k mini-batches. + + :param Int frequency: keyword argument, default 50. The frequency (number of + mini-batches) to measure and report the speed. + + + + +.. function:: every_n_epoch(callback :: Function, n :: Int; call_on_0 = false) + + A convenient function to construct a callback that runs every ``n`` full data-passes. + + :param Bool call_on_0: keyword argument, default false. Unless set, the callback + will **not** be run on epoch 0. Epoch 0 means no training has been performed + yet. This is useful if you want to inspect the randomly initialized model + that has not seen any data yet. + + :seealso: :func:`every_n_iter`. + + + + +.. function:: do_checkpoint(prefix; frequency=1, save_epoch_0=false) + + Create an :class:`AbstractEpochCallback` that saves checkpoints of the model to disk. + The checkpoints can be loaded back later on. + + :param AbstractString prefix: the prefix of the filenames to save the model. The model + architecture will be saved to prefix-symbol.json, while the weights will be saved + to prefix-0012.params, for example, for the 12-th epoch. + :param Int frequency: keyword argument, default 1. The frequency (measured in epochs) to + save checkpoints. + :param Bool save_epoch_0: keyword argument, default false. Whether we should save a + checkpoint for epoch 0 (model initialized but not seen any data yet). + + + diff --git a/docs/api/model.rst b/docs/api/model.rst index e9a8ee5a0a63..7593e6e68f55 100644 --- a/docs/api/model.rst +++ b/docs/api/model.rst @@ -107,13 +107,13 @@ a network described using the symbolic API. :param Int n_epoch: default 10, the number of full data-passes to run. :param AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for the validation set. 
- :param AbstractEvalMetric eval_metric: keyword argument, default :class:`Accuracy`. The metric used + :param AbstractEvalMetric eval_metric: keyword argument, default ``Accuracy()``. The metric used to evaluate the training performance. If ``eval_data`` is provided, the same metric is also calculated on the validation set. :param kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients and parameters when multiple devices are used for training. :type kvstore: :class:`KVStore` or ``Base.Symbol`` - :param AbstractInitializer initializer: keyword argument, default :class:`UniformInitializer(0.01)`. + :param AbstractInitializer initializer: keyword argument, default ``UniformInitializer(0.01)``. :param Bool force_init: keyword argument, default false. By default, the random initialization using the provided ``initializer`` will be skipped if the model weights already exists, maybe from a previous call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When diff --git a/src/callback.jl b/src/callback.jl index 14406add7006..ea890ab2c269 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -37,6 +37,28 @@ type IterationCallback <: AbstractIterationCallback callback :: Function end +#=doc +.. function:: every_n_iter(callback :: Function, n :: Int; call_on_0 = false) + + A convenient function to construct a callback that runs every ``n`` mini-batches. + + :param Int call_on_0: keyword argument, default false. Unless set, the callback + will **not** be run on iteration 0. + + For example, the :func:`speedometer` callback is defined as + + .. code-block:: julia + + every_n_iter(frequency, call_on_0=true) do param :: CallbackParams + if param.curr_iter == 0 + # reset timer + else + # compute and print speed + end + end + + :seealso: :func:`every_n_epoch`, :func:`speedometer`. 
+=# function every_n_iter(callback :: Function, n :: Int; call_on_0 :: Bool = false) IterationCallback(n, call_on_0, callback) end @@ -50,11 +72,20 @@ function Base.call(cb :: IterationCallback, param :: CallbackParams) end end +#=doc +.. function:: speedometer(; frequency=50) + + Create an :class:`AbstractIterationCallback` that measure the training speed + (number of samples processed per second) every k mini-batches. + + :param Int frequency: keyword argument, default 50. The frequency (number of + min-batches) to measure and report the speed. +=# function speedometer(;frequency::Int=50) cl_tic = 0 every_n_iter(frequency, call_on_0=true) do param :: CallbackParams if param.curr_iter == 0 - # reset counter + # reset timer cl_tic = time() else speed = frequency * param.batch_size / (time() - cl_tic) @@ -71,6 +102,18 @@ type EpochCallback <: AbstractEpochCallback callback :: Function end +#=doc +.. function:: every_n_epoch(callback :: Function, n :: Int; call_on_0 = false) + + A convenient function to construct a callback that runs every ``n`` full data-passes. + + :param Int call_on_0: keyword argument, default false. Unless set, the callback + will **not** be run on epoch 0. Epoch 0 means no training has been performed + yet. This is useful if you want to inspect the randomly initialized model + that has not seen any data yet. + + :seealso: :func:`every_n_iter`. +=# function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end @@ -84,6 +127,20 @@ function Base.call(cb :: EpochCallback, model :: Any, param :: CallbackParams) end end +#=doc +.. function:: do_checkpoint(prefix; frequency=1, save_epoch_0=false) + + Create an :class:`AbstractEpochCallback` that save checkpoints of the model to disk. + The checkpoints can be loaded back later on. + + :param AbstractString prefix: the prefix of the filenames to save the model. 
The model + architecture will be saved to prefix-symbol.json, while the weights will be saved + to prefix-0012.params, for example, for the 12-th epoch. + :param Int frequency: keyword argument, default 1. The frequency (measured in epochs) to + save checkpoints. + :param Bool save_epoch_0: keyword argument, default false. Whether we should save a + checkpoint for epoch 0 (model initialized but not seen any data yet). +=# function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) mkpath(dirname(prefix)) every_n_epoch(frequency, call_on_0=save_epoch_0) do model, param From c051c2a456ffb21fa86500e2953ccef9f0cd7305 Mon Sep 17 00:00:00 2001 From: cjb Date: Wed, 28 Oct 2015 14:09:32 +0100 Subject: [PATCH 144/630] fixed joinpath problem in example in README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 8e148c2d7529..2c28bc58f15e 100644 --- a/README.md +++ b/README.md @@ -24,7 +24,7 @@ mlp = @mx.chain mx.Variable(:data) => # data provider batch_size = 100 -include(joinpath(Pkg.dir("MXNet"), "/examples/mnist/mnist-data.jl")) +include(joinpath(Pkg.dir("MXNet"), "examples/mnist/mnist-data.jl")) train_provider, eval_provider = get_mnist_providers(batch_size) # setup model From 0132f19a17b31bd9e40d4aafbdf71fdf30005117 Mon Sep 17 00:00:00 2001 From: cjb Date: Wed, 28 Oct 2015 14:52:29 +0100 Subject: [PATCH 145/630] added ADAM SGD --- src/optimizer.jl | 1 + src/optimizers/adam.jl | 64 ++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 65 insertions(+) create mode 100644 src/optimizers/adam.jl diff --git a/src/optimizer.jl b/src/optimizer.jl index d01f92e7d735..c2c8ba4c28ef 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -30,3 +30,4 @@ end include("optimizers/sgd.jl") +include("optimizers/adam.jl") diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl new file mode 100644 index 000000000000..b555773a49a9 --- /dev/null +++ b/src/optimizers/adam.jl @@ -0,0 +1,64 @@ + 
+@defstruct ADAMOptions Any ( + (lr :: Real = 0.001, lr > 0), + (lr_decay :: Real = 1.0, lr_decay > 0), + (beta1 :: Real = 0.9, beta1 > 0), + (beta2 :: Real = 0.999, beta2 > 0), + (epsilon :: Real = 1e-8, epsilon > 0), + (grad_scale :: Real = 1.0, grad_scale >= 0), + (grad_clip :: Real = 0, grad_clip >= 0) +) + + +type ADAM <: AbstractOptimizer + iter :: Int + batch_size :: Int + opts :: ADAMOptions + + function ADAM(; kwargs...) + opts = ADAMOptions(;kwargs...) + + new(0, 0, opts) + end +end + +type ADAMState + current_lr :: Float64 # current learning rate + mt :: NDArray + vt :: NDArray + beta1Power :: Float64 + beta2Power :: Float64 +end + +function create_state(self :: ADAM, index :: Int, weight :: NDArray) + return ADAMState( self.opts.lr, + zeros(size(weight), context(weight)), + zeros(size(weight), context(weight)), + self.opts.beta1, + self.opts.beta2 ) +end + +function update(self :: ADAM, index :: Int, weight :: NDArray, grad :: NDArray, state :: ADAMState) + lr = state.current_lr + grad_scale = self.opts.grad_scale / self.batch_size + + grad = grad_scale * grad + if self.opts.grad_clip > 0 + grad = clip(grad, -self.opts.grad_clip, self.opts.grad_clip) + end + + state.mt = self.opts.beta1 * state.mt + (1 - self.opts.beta1) * grad + state.vt = self.opts.beta2 * state.vt + (1 - self.opts.beta2) * (grad .* grad) + + mt = state.mt / (1 - state.beta1Power) + vt = state.vt / (1 - state.beta2Power) + + #@show state.beta1Power,state.beta2Power + + state.beta1Power *= self.opts.beta1 + state.beta2Power *= self.opts.beta2 + + @inplace weight .+= -lr * mt ./ (sqrt(vt) + self.opts.epsilon) + + state.current_lr *= self.opts.lr_decay +end From 6e0c5c7a8b5d2bf8d309d3937a762ecf5ce042a8 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 28 Oct 2015 10:11:29 -0400 Subject: [PATCH 146/630] some doc for symbol --- src/symbol.jl | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/src/symbol.jl b/src/symbol.jl index 4c656cfedacb..ed7e2d77c411 100644 --- 
a/src/symbol.jl +++ b/src/symbol.jl @@ -23,11 +23,22 @@ end Base.convert(t::Type{MX_handle}, obj::Symbol) = Base.unsafe_convert(t, obj) Base.cconvert(t::Type{MX_handle}, obj::Symbol) = Base.unsafe_convert(t, obj) +#=doc +.. function:: deepcopy(self :: Symbol) + + Make a deep copy of a symbol. +=# function Base.deepcopy(self :: Symbol) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCopy, (MX_handle, Ref{MX_handle}), self, ref_hdr) return Symbol(MX_SymbolHandle(ref_hdr[])) end + +#=doc +.. function:: copy(self :: Symbol) + + Make a copy of a symbol. The same as making a deep copy. +=# function Base.copy(self :: Symbol) Base.deepcopy(self) end From 762c45e544d431bb1f171b096567af33ca0a2836 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 28 Oct 2015 23:27:47 -0400 Subject: [PATCH 147/630] refactoring and naming convention dmlc/mxnet#407 --- docs/api/callback.rst | 12 +- docs/api/optimizer.rst | 104 ++++++++++++ docs/api/symbol.rst | 14 ++ docs/build-api.jl | 2 + docs/index.rst | 1 + .../Prediction with Pre-trained Model.ipynb | 48 ++++-- src/callback.jl | 57 +++---- src/model.jl | 32 ++-- src/optimizer.jl | 149 +++++++++++++++++- src/optimizers/sgd.jl | 41 ++--- 10 files changed, 360 insertions(+), 100 deletions(-) create mode 100644 docs/api/optimizer.rst diff --git a/docs/api/callback.rst b/docs/api/callback.rst index ac1c8f36b862..2bda7477094f 100644 --- a/docs/api/callback.rst +++ b/docs/api/callback.rst @@ -12,7 +12,7 @@ Callbacks in training -.. class:: AbstractIterationCallback +.. class:: AbstractBatchCallback Abstract type of callbacks to be called every mini-batch. @@ -26,19 +26,19 @@ Callbacks in training -.. function:: every_n_iter(callback :: Function, n :: Int; call_on_0 = false) +.. function:: every_n_batch(callback :: Function, n :: Int; call_on_0 = false) A convenient function to construct a callback that runs every ``n`` mini-batches. :param Int call_on_0: keyword argument, default false. 
Unless set, the callback - will **not** be run on iteration 0. + will **not** be run on batch 0. For example, the :func:`speedometer` callback is defined as .. code-block:: julia - every_n_iter(frequency, call_on_0=true) do param :: CallbackParams - if param.curr_iter == 0 + every_n_batch(frequency, call_on_0=true) do state :: OptimizationState + if state.curr_batch == 0 # reset timer else # compute and print speed @@ -52,7 +52,7 @@ Callbacks in training .. function:: speedometer(; frequency=50) - Create an :class:`AbstractIterationCallback` that measure the training speed + Create an :class:`AbstractBatchCallback` that measures the training speed (number of samples processed per second) every k mini-batches. :param Int frequency: keyword argument, default 50. The frequency (number of diff --git a/docs/api/optimizer.rst b/docs/api/optimizer.rst new file mode 100644 index 000000000000..97b152375bf9 --- /dev/null +++ b/docs/api/optimizer.rst @@ -0,0 +1,104 @@ + +Optimizers +========== + + + + +.. class:: AbstractOptimizer + + Base type for all optimizers. + + + + +.. class:: AbstractLearningRateScheduler + + Base type for all learning rate schedulers. + + + + +.. class:: AbstractMomentumScheduler + + Base type for all momentum schedulers. + + + + +.. class:: OptimizationState + + .. attribute:: batch_size + + The size of the mini-batch used in stochastic training. + + .. attribute:: curr_epoch + + The current epoch count. Epoch 0 means no training yet, during the first + pass through the data, the epoch will be 1; during the second pass, the + epoch count will be 2, and so on. + + .. attribute:: curr_batch + + The current mini-batch count. The batch count is reset during every epoch. + The batch count 0 means the beginning of each epoch, with no mini-batch + seen yet. During the first mini-batch, the mini-batch count will be 1. + + .. attribute:: curr_iter + + The current iteration count. 
One iteration corresponds to one mini-batch, + but unlike the mini-batch count, the iteration count does **not** reset + in each epoch. So it tracks the *total* number of mini-batches seen so far. + + + + +.. function:: get_learning_rate(scheduler, state) + + :param AbstractLearningRateScheduler scheduler: a learning rate scheduler. + :param OptimizationState state: the current state about epoch, mini-batch and iteration count. + :return: the current learning rate. + + + + +.. class:: LearningRate.Fixed + + Fixed learning rate scheduler always returns the same learning rate. + + + + +.. function:: get_momentum(scheduler, state) + + :param AbstractMomentumScheduler scheduler: the momentum scheduler. + :param OptimizationState state: the state about current epoch, mini-batch and iteration count. + :return: the current momentum. + + + + +.. class:: Momentum.Null + + The null momentum scheduler always returns 0 for momentum. It is also used to + explicitly indicate momentum should not be used. + + + + +.. class:: Momentum.Fixed + + Fixed momentum scheduler always returns the same value. + + + + +.. function:: get_updater(optimizer) + + :param AbstractOptimizer optimizer: the underlying optimizer. + + A utility function to create an updater function, that uses its closure to + store all the states needed for each weight. + + + diff --git a/docs/api/symbol.rst b/docs/api/symbol.rst index 604fadc0f43d..457b462982ad 100644 --- a/docs/api/symbol.rst +++ b/docs/api/symbol.rst @@ -18,6 +18,20 @@ Symbolic API +.. function:: deepcopy(self :: Symbol) + + Make a deep copy of a symbol. + + + + +.. function:: copy(self :: Symbol) + + Make a copy of a symbol. The same as making a deep copy. 
+ + + + libmxnet APIs ------------- diff --git a/docs/build-api.jl b/docs/build-api.jl index 29f99369d431..abccd31f1222 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -76,3 +76,5 @@ embed_mxnet_api("symbol.rst", "symbol", mx._import_atomic_symbol_creators) extract_doc("initializer.rst", "initializer.jl") extract_doc("callback.rst", "callback.jl") extract_doc("model.rst", "model.jl") + +extract_doc("optimizer.rst", "optimizer.jl") diff --git a/docs/index.rst b/docs/index.rst index cf44dc197b2d..1176f927174d 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -36,6 +36,7 @@ For more details, see documentation below. Please also checkout the `examples api/initializer api/ndarray api/symbol + api/optimizer Indices and tables ================== diff --git a/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb b/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb index 5359f41b299e..0f0bd945c723 100644 --- a/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb +++ b/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb @@ -22,31 +22,36 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 106, "metadata": { "collapsed": false }, "outputs": [ { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "RGB4 Images.Image with:\n", - " data: 256x256 Array{ColorTypes.RGB4{FixedPointNumbers.UfixedBase{UInt8,8}},2}\n", + " data: 594x629 Array{ColorTypes.RGB4{FixedPointNumbers.UfixedBase{UInt8,8}},2}\n", " properties:\n", " imagedescription: \n", " spatialorder: x y\n", " pixelspacing: 1 1" ] }, - "execution_count": 1, + "execution_count": 106, "metadata": {}, "output_type": "execute_result" } ], "source": [ "using Images, Colors\n", - "img = imread(\"cat.png\")" + "#img = imread(\"cat.png\")\n", + "img = imread(\"/Users/chiyuan/Desktop/bird.png\")\n", + "img = imread(\"/Users/chiyuan/Desktop/bill-gates.jpg\")\n", + 
"#img = imread(\"/Users/chiyuan/Desktop/dog.jpg\")\n", + "#img = imread(\"/Users/chiyuan/Desktop/schoolbus.jpg\")\n", + "#img = imread(\"/Users/chiyuan/Desktop/horse-face-2.jpg\")" ] }, { @@ -58,7 +63,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 107, "metadata": { "collapsed": false }, @@ -68,7 +73,7 @@ "output_type": "stream", "text": [ "Image resized to (224,224,3)\n", - "('Original Image Shape: ', (256, 256, 3))\n" + "('Original Image Shape: ', (629, 594, 3))\n" ] } ], @@ -93,7 +98,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 108, "metadata": { "collapsed": false }, @@ -127,7 +132,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 109, "metadata": { "collapsed": false }, @@ -156,7 +161,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 110, "metadata": { "collapsed": false }, @@ -165,7 +170,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "Egyptian cat\n" + "wig\n" ] } ], @@ -186,7 +191,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 111, "metadata": { "collapsed": false }, @@ -195,11 +200,11 @@ "name": "stdout", "output_type": "stream", "text": [ - " Egyptian cat w.p. 0.415571\n", - " tabby, tabby cat w.p. 0.230575\n", - " lynx, catamount w.p. 0.153771\n", - " tiger cat w.p. 0.129155\n", - " Persian cat w.p. 0.053005\n" + " wig w.p. 0.430989\n", + " feather boa, boa w.p. 0.127852\n", + " fur coat w.p. 0.112760\n", + " hair spray w.p. 0.055442\n", + " cloak w.p. 0.019644\n" ] } ], @@ -213,6 +218,15 @@ " println(mx.format(\"{1:>18} w.p. 
{2:4f}\", l, p))\n", "end" ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [] } ], "metadata": { diff --git a/src/callback.jl b/src/callback.jl index ea890ab2c269..9f3d85b576ff 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -11,11 +11,11 @@ Callbacks in training abstract AbstractCallback #=doc -.. class:: AbstractIterationCallback +.. class:: AbstractBatchCallback Abstract type of callbacks to be called every mini-batch. =# -abstract AbstractIterationCallback <: AbstractCallback +abstract AbstractBatchCallback <: AbstractCallback #=doc .. class:: AbstractEpochCallback @@ -24,33 +24,26 @@ abstract AbstractIterationCallback <: AbstractCallback =# abstract AbstractEpochCallback <: AbstractCallback -type CallbackParams - batch_size :: Int - curr_epoch :: Int - curr_iter :: Int -end -CallbackParams(batch_size::Int) = CallbackParams(batch_size, 0, 0) - -type IterationCallback <: AbstractIterationCallback +type BatchCallback <: AbstractBatchCallback frequency :: Int call_on_0 :: Bool callback :: Function end #=doc -.. function:: every_n_iter(callback :: Function, n :: Int; call_on_0 = false) +.. function:: every_n_batch(callback :: Function, n :: Int; call_on_0 = false) A convenient function to construct a callback that runs every ``n`` mini-batches. :param Int call_on_0: keyword argument, default false. Unless set, the callback - will **not** be run on iteration 0. + will **not** be run on batch 0. For example, the :func:`speedometer` callback is defined as .. code-block:: julia - every_n_iter(frequency, call_on_0=true) do param :: CallbackParams - if param.curr_iter == 0 + every_n_batch(frequency, call_on_0=true) do state :: OptimizationState + if state.curr_batch == 0 # reset timer else # compute and print speed @@ -59,23 +52,23 @@ end :seealso: :func:`every_n_epoch`, :func:`speedometer`. 
=# -function every_n_iter(callback :: Function, n :: Int; call_on_0 :: Bool = false) - IterationCallback(n, call_on_0, callback) +function every_n_batch(callback :: Function, n :: Int; call_on_0 :: Bool = false) + BatchCallback(n, call_on_0, callback) end -function Base.call(cb :: IterationCallback, param :: CallbackParams) - if param.curr_iter == 0 +function Base.call(cb :: BatchCallback, state :: OptimizationState) + if state.curr_batch == 0 if cb.call_on_0 - cb.callback(param) + cb.callback(state) end - elseif param.curr_iter % cb.frequency == 0 - cb.callback(param) + elseif state.curr_batch % cb.frequency == 0 + cb.callback(state) end end #=doc .. function:: speedometer(; frequency=50) - Create an :class:`AbstractIterationCallback` that measure the training speed + Create an :class:`AbstractBatchCallback` that measure the training speed (number of samples processed per second) every k mini-batches. :param Int frequency: keyword argument, default 50. The frequency (number of @@ -83,12 +76,12 @@ end =# function speedometer(;frequency::Int=50) cl_tic = 0 - every_n_iter(frequency, call_on_0=true) do param :: CallbackParams - if param.curr_iter == 0 + every_n_batch(frequency, call_on_0=true) do state :: OptimizationState + if state.curr_batch == 0 # reset timer cl_tic = time() else - speed = frequency * param.batch_size / (time() - cl_tic) + speed = frequency * state.batch_size / (time() - cl_tic) info(format("Speed: {1:>6.2f} samples/sec", speed)) cl_tic = time() end @@ -117,13 +110,13 @@ end function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end -function Base.call(cb :: EpochCallback, model :: Any, param :: CallbackParams) - if param.curr_epoch == 0 +function Base.call(cb :: EpochCallback, model :: Any, state :: OptimizationState) + if state.curr_epoch == 0 if cb.call_on_0 - cb.callback(model, param) + cb.callback(model, state) end - elseif param.curr_epoch % cb.frequency == 0 - 
cb.callback(model, param) + elseif state.curr_epoch % cb.frequency == 0 + cb.callback(model, state) end end @@ -143,7 +136,7 @@ end =# function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) mkpath(dirname(prefix)) - every_n_epoch(frequency, call_on_0=save_epoch_0) do model, param - save_checkpoint(model, prefix, param) + every_n_epoch(frequency, call_on_0=save_epoch_0) do model, state + save_checkpoint(model, prefix, state) end end diff --git a/src/model.jl b/src/model.jl index f28fd0d9f5af..5b42278f8db2 100644 --- a/src/model.jl +++ b/src/model.jl @@ -263,14 +263,15 @@ end callbacks :: Vector{AbstractCallback} = AbstractCallback[], ) -function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, param::CallbackParams, type_filter::Type) +function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, + state::OptimizationState, type_filter::Type) map(callbacks) do cb if isa(cb, type_filter) if type_filter == AbstractEpochCallback # epoch callback have extra access to the model object - cb(self, param) + cb(self, state) else - cb(param) + cb(state) end end end @@ -355,8 +356,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra grad_arrays = [NDArray[exec.grad_arrays[i] for exec in train_execs] for i in param_idx] aux_arrays = [NDArray[exec.aux_arrays[i] for exec in train_execs] for i = 1:length(aux_names)] - optimizer.batch_size = batch_size - cb_param = CallbackParams(batch_size) + op_state = OptimizationState(batch_size) + optimizer.state = op_state if !update_on_kvstore updater = get_updater(optimizer) @@ -388,18 +389,18 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra cpu_label_arrays_full_slice = [SlicedNDArray[(1:batch_size, x)] for x in cpu_label_arrays] # invoke callbacks on epoch 0 - _invoke_callbacks(self, opts.callbacks, cb_param, AbstractEpochCallback) + _invoke_callbacks(self, opts.callbacks, op_state, 
AbstractEpochCallback) # now start training... for i_epoch = 1:opts.n_epoch time_start = time() reset!(opts.eval_metric) - cb_param.curr_epoch = i_epoch - cb_param.curr_iter = 0 + op_state.curr_epoch = i_epoch + op_state.curr_batch = 0 # invoke callbacks on iteration 0 - _invoke_callbacks(self, opts.callbacks, cb_param, AbstractIterationCallback) + _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) for batch in data load_data!(batch, data_arrays) @@ -417,6 +418,10 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra backward(texec) end + op_state.curr_iter += 1 + op_state.curr_batch += 1 + optimizer.state = op_state + # update parameters for idx = 1:length(param_names) # gradient synchronization @@ -445,8 +450,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end # invoke callbacks after finishing each iteration - _invoke_callbacks(self, opts.callbacks, cb_param, AbstractIterationCallback) - cb_param.curr_iter += 1 + _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) # update evaluation metric on training set load_label!(batch, cpu_label_arrays_full_slice) @@ -503,12 +507,12 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra copy!(self.aux_params[name], aux_avg) end end - _invoke_callbacks(self, opts.callbacks, cb_param, AbstractEpochCallback) + _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) end # end of all epochs end -function save_checkpoint(self :: FeedForward, prefix :: AbstractString, param :: CallbackParams) - save_checkpoint(self.arch, self.arg_params, self.aux_params, prefix, param.curr_epoch) +function save_checkpoint(self :: FeedForward, prefix :: AbstractString, state :: OptimizationState) + save_checkpoint(self.arch, self.arg_params, self.aux_params, prefix, state.curr_epoch) end function save_checkpoint(sym :: Symbol, arg_params :: Dict{Base.Symbol, NDArray}, aux_params :: 
Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) diff --git a/src/optimizer.jl b/src/optimizer.jl index c2c8ba4c28ef..07950d82a221 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -1,22 +1,158 @@ +#=doc +Optimizers +========== +=# + + +#=doc +.. class:: AbstractOptimizer + + Base type for all optimizers. +=# abstract AbstractOptimizer +#=doc +.. class:: AbstractLearningRateScheduler + + Base type for all learning rate schedulers. +=# abstract AbstractLearningRateScheduler + +#=doc +.. class:: AbstractMomentumScheduler + + Base type for all momentum schedulers. +=# abstract AbstractMomentumScheduler -type FixedLearningRateScheduler <: AbstractLearningRateScheduler + + +#=doc +.. class:: OptimizationState + + .. attribute:: batch_size + + The size of the mini-batch used in stochastic training. + + .. attribute:: curr_epoch + + The current epoch count. Epoch 0 means no training yet, during the first + pass through the data, the epoch will be 1; during the second pass, the + epoch count will be 2, and so on. + + .. attribute:: curr_batch + + The current mini-batch count. The batch count is reset during every epoch. + The batch count 0 means the beginning of each epoch, with no mini-batch + seen yet. During the first mini-batch, the mini-batch count will be 1. + + .. attribute:: curr_iter + + The current iteration count. One iteration corresponds to one mini-batch, + but unlike the mini-batch count, the iteration count does **not** reset + in each epoch. So it tracks the *total* number of mini-batches seen so far. +=# +type OptimizationState + batch_size :: Int + curr_epoch :: Int + curr_batch :: Int + curr_iter :: Int +end +OptimizationState(batch_size::Int) = OptimizationState(batch_size, 0, 0, 0) + + +#=doc +.. function:: get_learning_rate(scheduler, state) + + :param AbstractLearningRateScheduler scheduler: a learning rate scheduler. + :param OptimizationState state: the current state about epoch, mini-batch and iteration count. 
+ :return: the current learning rate. +=# +function get_learning_rate +end + +################################################################################ +# The learning rate module +module LearningRate +import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate + +#=doc +.. class:: LearningRate.Fixed + + Fixed learning rate scheduler always return the same learning rate. +=# +type Fixed <: AbstractLearningRateScheduler learning_rate :: Float64 end -get_learning_rate(self :: FixedLearningRateScheduler, iter :: Int) = self.learning_rate +get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rate + +end # module LearningRate +################################################################################ +function get_lr_scheduler(scheduler :: Any, lr :: Real) + if isa(scheduler, AbstractLearningRateScheduler) + return scheduler + else + return LearningRate.Fixed(lr) + end +end + + +#=doc +.. function:: get_momentum(scheduler, state) + + :param AbstractMomentumScheduler scheduler: the momentum scheduler. + :param OptimizationState state: the state about current epoch, mini-batch and iteration count. + :return: the current momentum. +=# +function get_momentum +end -type NullMomentumScheduler <: AbstractMomentumScheduler + +################################################################################ +# The Momentum module +module Momentum +import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum + +#=doc +.. class:: Momentum.Null + + The null momentum scheduler always returns 0 for momentum. It is also used to + explicitly indicate momentum should not be used. +=# +type Null <: AbstractMomentumScheduler end -get_momentum(self :: NullMomentumScheduler, iter :: Int) = 0.0 +get_momentum(self :: Null, state :: OptimizationState) = 0.0 -type FixedMomentumScheduler <: AbstractMomentumScheduler +#=doc +.. class:: Momentum.Fixed + + Fixed momentum scheduler always returns the same value. 
+=# +type Fixed <: AbstractMomentumScheduler momentum :: Float64 end -get_momentum(self :: FixedMomentumScheduler, iter :: Int) = self.momentum +get_momentum(self :: Fixed, state :: OptimizationState) = self.momentum +end # module Momentum +################################################################################ +function get_momentum_scheduler(scheduler :: Any, momentum :: Real) + if isa(scheduler, AbstractMomentumScheduler) + return scheduler + elseif momentum == 0 + return Momentum.Null() + else + return Momentum.Fixed(momentum) + end +end + + +#=doc +.. function:: get_updater(optimizer) + :param AbstractOptimizer optimizer: the underlying optimizer. + + A utility function to create an updater function, that uses its closure to + store all the states needed for each weights. +=# function get_updater(optimizer :: AbstractOptimizer) states = Dict{Int,Any}() function updater(index :: Int, grad :: NDArray, weight :: NDArray) @@ -28,6 +164,5 @@ function get_updater(optimizer :: AbstractOptimizer) return updater end - include("optimizers/sgd.jl") include("optimizers/adam.jl") diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index b910e2c3d6b6..9655229b4ace 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -1,36 +1,29 @@ @defstruct SGDOptions Any ( - (lr :: Real = 0.01, lr > 0), - (momentum :: Real = 0.0, momentum >= 0), - (weight_decay :: Real = 0.0001, weight_decay >= 0), - (grad_scale :: Real = 1.0, grad_scale >= 0), - (grad_clip :: Real = 0, grad_clip >= 0), - lr_scheduler :: Any = nothing, - mom_scheduler :: Any = nothing + (lr :: Real = 0.01, lr > 0), + (momentum :: Real = 0.0, momentum >= 0), + (weight_decay :: Real = 0.0001, weight_decay >= 0), + (grad_scale :: Real = 1.0, grad_scale >= 0), + (grad_clip :: Real = 0, grad_clip >= 0), + lr_scheduler :: Any = nothing, + momentum_scheduler :: Any = nothing ) type SGD <: AbstractOptimizer - iter :: Int - batch_size :: Int - opts :: SGDOptions + opts :: SGDOptions + state :: 
OptimizationState function SGD(; kwargs...) opts = SGDOptions(;kwargs...) - if !isa(opts.lr_scheduler, AbstractLearningRateScheduler) - opts.lr_scheduler = FixedLearningRateScheduler(opts.lr) - end - if !isa(opts.mom_scheduler, AbstractMomentumScheduler) - opts.mom_scheduler = opts.momentum > 0 ? - FixedMomentumScheduler(opts.momentum) : - NullMomentumScheduler() - end - - new(0, 0, opts) + opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) + opts.momentum_scheduler = get_momentum_scheduler(opts.momentum_scheduler, opts.momentum) + + new(opts) end end function create_state(self :: SGD, index :: Int, weight :: NDArray) - if isa(self.opts.mom_scheduler, NullMomentumScheduler) + if isa(self.opts.momentum_scheduler, Momentum.Null) return nothing else return zeros(size(weight), context(weight)) @@ -38,8 +31,8 @@ function create_state(self :: SGD, index :: Int, weight :: NDArray) end function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Union{Void, NDArray}) - lr = get_learning_rate(self.opts.lr_scheduler, self.iter) - grad_scale = self.opts.grad_scale / self.batch_size + lr = get_learning_rate(self.opts.lr_scheduler, self.state) + grad_scale = self.opts.grad_scale / self.state.batch_size grad = grad_scale * grad if self.opts.grad_clip > 0 @@ -50,7 +43,7 @@ function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, s @inplace weight += -lr * (grad + self.opts.weight_decay * weight) else mom = state :: NDArray - coef = get_momentum(self.opts.mom_scheduler, self.iter) + coef = get_momentum(self.opts.momentum_scheduler, self.state) @inplace mom .*= coef @inplace mom .+= -lr * (grad + self.opts.weight_decay * weight) @inplace weight .+= mom From a2beae8ee57ba1e664bf4639e226b5a0de2ca5a7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 28 Oct 2015 23:39:42 -0400 Subject: [PATCH 148/630] refactoring of optimizer --- docs/api/optimizer.rst | 28 ++++++++++++++++++++++++++++ src/optimizer.jl | 36 
++++++++++++++++++++++++++++++++++++ src/optimizers/sgd.jl | 10 +++------- 3 files changed, 67 insertions(+), 7 deletions(-) diff --git a/docs/api/optimizer.rst b/docs/api/optimizer.rst index 97b152375bf9..e9f29e4aa07c 100644 --- a/docs/api/optimizer.rst +++ b/docs/api/optimizer.rst @@ -2,6 +2,9 @@ Optimizers ========== +Common interfaces +----------------- + @@ -102,3 +105,28 @@ Optimizers + +Built-in optimizers +------------------- + + + + +.. class:: AbstractOptimizerOptions + + Base class for all optimizer options. + + + + +.. function:: normalized_gradient(opts, state, grad) + + :param AbstractOptimizerOptions opts: options for the optimizer, should contain the field + ``grad_scale`` and ``grad_clip``. + :param OptimizationState state: the current optimization state. + :param NDArray grad: the original gradient. + + Get the properly normalized gradient (re-scaled and clipped if necessary). + + + diff --git a/src/optimizer.jl b/src/optimizer.jl index 07950d82a221..2e6e58ac1429 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -1,6 +1,9 @@ #=doc Optimizers ========== + +Common interfaces +----------------- =# @@ -164,5 +167,38 @@ function get_updater(optimizer :: AbstractOptimizer) return updater end +################################################################################ +#=doc +Built-in optimizers +------------------- +=# + +#=doc +.. class:: AbstractOptimizerOptions + + Base class for all optimizer options. +=# +abstract AbstractOptimizerOptions + +#=doc +.. function:: normalized_gradient(opts, state, grad) + + :param AbstractOptimizerOptions opts: options for the optimizer, should contain the field + ``grad_scale`` and ``grad_clip``. + :param OptimizationState state: the current optimization state. + :param NDArray grad: the original gradient. + + Get the properly normalized gradient (re-scaled and clipped if necessary). 
+=# +function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState, grad::NDArray) + grad_scale = opts.grad_scale / state.batch_size + + grad = grad_scale * grad + if opts.grad_clip > 0 + grad = clip(grad, -opts.grad_clip, opts.grad_clip) + end + return grad +end + include("optimizers/sgd.jl") include("optimizers/adam.jl") diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index 9655229b4ace..abad6770216d 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -1,4 +1,4 @@ -@defstruct SGDOptions Any ( +@defstruct SGDOptions AbstractOptimizerOptions ( (lr :: Real = 0.01, lr > 0), (momentum :: Real = 0.0, momentum >= 0), (weight_decay :: Real = 0.0001, weight_decay >= 0), @@ -32,14 +32,10 @@ end function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Union{Void, NDArray}) lr = get_learning_rate(self.opts.lr_scheduler, self.state) - grad_scale = self.opts.grad_scale / self.state.batch_size - - grad = grad_scale * grad - if self.opts.grad_clip > 0 - grad = clip(grad, -self.opts.grad_clip, self.opts.grad_clip) - end + grad = normalized_gradient(self.opts, self.state, grad) if isa(state, Void) + # vanilla SGD, without momentum @inplace weight += -lr * (grad + self.opts.weight_decay * weight) else mom = state :: NDArray From fe36340e1f4a73ea64ab2069871877b24765baeb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 28 Oct 2015 23:55:26 -0400 Subject: [PATCH 149/630] refactor adam optimizer --- src/optimizer.jl | 10 +++++++--- src/optimizers/adam.jl | 39 +++++++++++++++------------------------ src/optimizers/sgd.jl | 8 ++++---- 3 files changed, 26 insertions(+), 31 deletions(-) diff --git a/src/optimizer.jl b/src/optimizer.jl index 2e6e58ac1429..33a67ebd5896 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -184,19 +184,23 @@ abstract AbstractOptimizerOptions .. 
function:: normalized_gradient(opts, state, grad) :param AbstractOptimizerOptions opts: options for the optimizer, should contain the field - ``grad_scale`` and ``grad_clip``. + ``grad_scale``, ``grad_clip`` and ``weight_decay``. :param OptimizationState state: the current optimization state. - :param NDArray grad: the original gradient. + :param NDArray weight: the trainable weights. + :param NDArray grad: the original gradient of the weights. Get the properly normalized gradient (re-scaled and clipped if necessary). =# -function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState, grad::NDArray) +function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState, + weight::NDArray, grad::NDArray) grad_scale = opts.grad_scale / state.batch_size grad = grad_scale * grad if opts.grad_clip > 0 grad = clip(grad, -opts.grad_clip, opts.grad_clip) end + @inplace grad += opts.weight_decay * weight + return grad end diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index b555773a49a9..d8d1d2377836 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -1,38 +1,38 @@ - -@defstruct ADAMOptions Any ( +@defstruct ADAMOptions AbstractOptimizerOptions ( (lr :: Real = 0.001, lr > 0), - (lr_decay :: Real = 1.0, lr_decay > 0), + (grad_scale :: Real = 1.0, grad_scale >= 0), + (grad_clip :: Real = 0, grad_clip >= 0), + (weight_decay :: Real = 0.00001, weight_decay >= 0), (beta1 :: Real = 0.9, beta1 > 0), (beta2 :: Real = 0.999, beta2 > 0), (epsilon :: Real = 1e-8, epsilon > 0), - (grad_scale :: Real = 1.0, grad_scale >= 0), - (grad_clip :: Real = 0, grad_clip >= 0) + lr_scheduler :: Any = nothing ) type ADAM <: AbstractOptimizer - iter :: Int - batch_size :: Int - opts :: ADAMOptions + opts :: ADAMOptions + state :: OptimizationState function ADAM(; kwargs...) opts = ADAMOptions(;kwargs...) 
- - new(0, 0, opts) + opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) + + new(opts) end end type ADAMState current_lr :: Float64 # current learning rate - mt :: NDArray - vt :: NDArray + mt :: NDArray + vt :: NDArray beta1Power :: Float64 beta2Power :: Float64 end function create_state(self :: ADAM, index :: Int, weight :: NDArray) - return ADAMState( self.opts.lr, - zeros(size(weight), context(weight)), + return ADAMState( get_learning_rate(self.opts.lr_scheduler, self.state), + zeros(size(weight), context(weight)), zeros(size(weight), context(weight)), self.opts.beta1, self.opts.beta2 ) @@ -40,12 +40,7 @@ end function update(self :: ADAM, index :: Int, weight :: NDArray, grad :: NDArray, state :: ADAMState) lr = state.current_lr - grad_scale = self.opts.grad_scale / self.batch_size - - grad = grad_scale * grad - if self.opts.grad_clip > 0 - grad = clip(grad, -self.opts.grad_clip, self.opts.grad_clip) - end + grad = normalized_gradient(self.opts, self.state, weight, grad) state.mt = self.opts.beta1 * state.mt + (1 - self.opts.beta1) * grad state.vt = self.opts.beta2 * state.vt + (1 - self.opts.beta2) * (grad .* grad) @@ -53,12 +48,8 @@ function update(self :: ADAM, index :: Int, weight :: NDArray, grad :: NDArray, mt = state.mt / (1 - state.beta1Power) vt = state.vt / (1 - state.beta2Power) - #@show state.beta1Power,state.beta2Power - state.beta1Power *= self.opts.beta1 state.beta2Power *= self.opts.beta2 @inplace weight .+= -lr * mt ./ (sqrt(vt) + self.opts.epsilon) - - state.current_lr *= self.opts.lr_decay end diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index abad6770216d..84ea55f40f11 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -1,9 +1,9 @@ @defstruct SGDOptions AbstractOptimizerOptions ( (lr :: Real = 0.01, lr > 0), (momentum :: Real = 0.0, momentum >= 0), - (weight_decay :: Real = 0.0001, weight_decay >= 0), (grad_scale :: Real = 1.0, grad_scale >= 0), (grad_clip :: Real = 0, grad_clip >= 0), + 
(weight_decay :: Real = 0.0001, weight_decay >= 0), lr_scheduler :: Any = nothing, momentum_scheduler :: Any = nothing ) @@ -32,16 +32,16 @@ end function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Union{Void, NDArray}) lr = get_learning_rate(self.opts.lr_scheduler, self.state) - grad = normalized_gradient(self.opts, self.state, grad) + grad = normalized_gradient(self.opts, self.state, weight, grad) if isa(state, Void) # vanilla SGD, without momentum - @inplace weight += -lr * (grad + self.opts.weight_decay * weight) + @inplace weight += -lr * grad else mom = state :: NDArray coef = get_momentum(self.opts.momentum_scheduler, self.state) @inplace mom .*= coef - @inplace mom .+= -lr * (grad + self.opts.weight_decay * weight) + @inplace mom .+= -lr * grad @inplace weight .+= mom end end From 1f39e1d90d922b6ca8df07165366039352797231 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 00:05:33 -0400 Subject: [PATCH 150/630] more learning rate scheduler --- src/optimizer.jl | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) diff --git a/src/optimizer.jl b/src/optimizer.jl index 33a67ebd5896..2c784adc13e7 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -89,6 +89,24 @@ type Fixed <: AbstractLearningRateScheduler end get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rate +#=doc +.. class:: LearningRate.Exp + + $$\eta_t = \eta_0\gamma^t$$. Here $$t$$ is the epoch count, or the iteration + count if ``decay_on_iteration`` is set to true. +=# +type Exp <: AbstractLearningRateScheduler + learning_rate :: Float64 + gamma :: Float64 + on_iteration :: Bool +end +function Exp(base_lr::Real; gamma::Real=0.9, decay_on_iteration::Bool=false) + @assert(0 < gamma < 1) + Exp(Float64(base_lr), Float64(gamma), decay_on_iteration) +end +get_learning_rate(self :: Exp, state :: OptimizationState) = + self.learning_rate * self.gamma ^ (self.on_iteration ? 
state.curr_iter : state.curr_epoch) + end # module LearningRate ################################################################################ function get_lr_scheduler(scheduler :: Any, lr :: Real) From e821f9501da6272ceee86384290650b6a63e48c9 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 00:09:50 -0400 Subject: [PATCH 151/630] update equation in sphinx doc --- docs/api/optimizer.rst | 13 +++++++++++-- src/optimizer.jl | 2 +- 2 files changed, 12 insertions(+), 3 deletions(-) diff --git a/docs/api/optimizer.rst b/docs/api/optimizer.rst index e9f29e4aa07c..bc45cf1744ac 100644 --- a/docs/api/optimizer.rst +++ b/docs/api/optimizer.rst @@ -72,6 +72,14 @@ Common interfaces +.. class:: LearningRate.Exp + + :math:`\eta_t = \eta_0\gamma^t`. Here :math:`t` is the epoch count, or the iteration + count if ``decay_on_iteration`` is set to true. + + + + .. function:: get_momentum(scheduler, state) :param AbstractMomentumScheduler scheduler: the momentum scheduler. @@ -122,9 +130,10 @@ Built-in optimizers .. function:: normalized_gradient(opts, state, grad) :param AbstractOptimizerOptions opts: options for the optimizer, should contain the field - ``grad_scale`` and ``grad_clip``. + ``grad_scale``, ``grad_clip`` and ``weight_decay``. :param OptimizationState state: the current optimization state. - :param NDArray grad: the original gradient. + :param NDArray weight: the trainable weights. + :param NDArray grad: the original gradient of the weights. Get the properly normalized gradient (re-scaled and clipped if necessary). diff --git a/src/optimizer.jl b/src/optimizer.jl index 2c784adc13e7..a5f0bfd5ec60 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -92,7 +92,7 @@ get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rat #=doc .. class:: LearningRate.Exp - $$\eta_t = \eta_0\gamma^t$$. Here $$t$$ is the epoch count, or the iteration + :math:`\eta_t = \eta_0\gamma^t`. 
Here :math:`t` is the epoch count, or the iteration count if ``decay_on_iteration`` is set to true. =# type Exp <: AbstractLearningRateScheduler From 04bde14aa923c2b259ad289c734200e721ae1841 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 00:18:41 -0400 Subject: [PATCH 152/630] fix accidental notebook changes --- .../Prediction with Pre-trained Model.ipynb | 48 +++++++------------ 1 file changed, 17 insertions(+), 31 deletions(-) diff --git a/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb b/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb index 0f0bd945c723..9f4f2b8cb1d3 100644 --- a/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb +++ b/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb @@ -22,36 +22,31 @@ }, { "cell_type": "code", - "execution_count": 106, + "execution_count": 1, "metadata": { "collapsed": false }, "outputs": [ { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "RGB4 Images.Image with:\n", - " data: 594x629 Array{ColorTypes.RGB4{FixedPointNumbers.UfixedBase{UInt8,8}},2}\n", + " data: 256x256 Array{ColorTypes.RGB4{FixedPointNumbers.UfixedBase{UInt8,8}},2}\n", " properties:\n", " imagedescription: \n", " spatialorder: x y\n", " pixelspacing: 1 1" ] }, - "execution_count": 106, + "execution_count": 1, "metadata": {}, "output_type": "execute_result" } ], "source": [ "using Images, Colors\n", - "#img = imread(\"cat.png\")\n", - "img = imread(\"/Users/chiyuan/Desktop/bird.png\")\n", - "img = imread(\"/Users/chiyuan/Desktop/bill-gates.jpg\")\n", - "#img = imread(\"/Users/chiyuan/Desktop/dog.jpg\")\n", - "#img = imread(\"/Users/chiyuan/Desktop/schoolbus.jpg\")\n", - "#img = imread(\"/Users/chiyuan/Desktop/horse-face-2.jpg\")" + "img = imread(\"cat.png\")" ] }, { @@ -63,7 +58,7 @@ }, { "cell_type": "code", - "execution_count": 107, + "execution_count": 2, "metadata": { "collapsed": 
false }, @@ -73,7 +68,7 @@ "output_type": "stream", "text": [ "Image resized to (224,224,3)\n", - "('Original Image Shape: ', (629, 594, 3))\n" + "('Original Image Shape: ', (256, 256, 3))\n" ] } ], @@ -98,7 +93,7 @@ }, { "cell_type": "code", - "execution_count": 108, + "execution_count": 3, "metadata": { "collapsed": false }, @@ -132,7 +127,7 @@ }, { "cell_type": "code", - "execution_count": 109, + "execution_count": 4, "metadata": { "collapsed": false }, @@ -161,7 +156,7 @@ }, { "cell_type": "code", - "execution_count": 110, + "execution_count": 5, "metadata": { "collapsed": false }, @@ -170,7 +165,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "wig\n" + "lynx, catamount\n" ] } ], @@ -191,7 +186,7 @@ }, { "cell_type": "code", - "execution_count": 111, + "execution_count": 6, "metadata": { "collapsed": false }, @@ -200,11 +195,11 @@ "name": "stdout", "output_type": "stream", "text": [ - " wig w.p. 0.430989\n", - " feather boa, boa w.p. 0.127852\n", - " fur coat w.p. 0.112760\n", - " hair spray w.p. 0.055442\n", - " cloak w.p. 0.019644\n" + " lynx, catamount w.p. 0.552236\n", + " tabby, tabby cat w.p. 0.118180\n", + " Persian cat w.p. 0.114004\n", + " Egyptian cat w.p. 0.090389\n", + " tiger cat w.p. 0.086328\n" ] } ], @@ -218,15 +213,6 @@ " println(mx.format(\"{1:>18} w.p. {2:4f}\", l, p))\n", "end" ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": true - }, - "outputs": [], - "source": [] } ], "metadata": { From 1dc944e02f334ff90511c68af279648f15fb1243 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 11:00:11 -0400 Subject: [PATCH 153/630] first step of refining the data provider API. 
--- docs/api/io.rst | 134 +++++++++++++++++++++++++++++++++++++ docs/build-api.jl | 2 + docs/index.rst | 5 +- src/io.jl | 163 +++++++++++++++++++++++++++++++--------------- 4 files changed, 249 insertions(+), 55 deletions(-) create mode 100644 docs/api/io.rst diff --git a/docs/api/io.rst b/docs/api/io.rst new file mode 100644 index 000000000000..d3d060fb12f3 --- /dev/null +++ b/docs/api/io.rst @@ -0,0 +1,134 @@ + +Data Providers +============== + +Data providers are wrappers that load external data, be it images, text, or general tensors, +and split it into mini-batches so that the model can consume the data in a uniformed way. + + + + +.. class:: AbstractDataProvider + + The root type for all data provider. A data provider should implement the following interfaces: + + .. function:: get_batch_size(provider) -> Int + + :param AbstractDataProvider provider: the data provider. + :return: the mini-batch size of the provided data. All the provided data should have the + same mini-batch size (i.e. the last dimension). + + .. function:: provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} + + :param AbstractDataProvider provider: the data provider. + :return: a vector of (name, shape) pairs describing the names of the data it provides, and + the corresponding shapes. + + .. function:: provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} + + :param AbstractDataProvider provider: the data provider. + :return: a vector of (name, shape) pairs describing the names of the labels it provides, and + the corresponding shapes. + + The difference between *data* and *label* is that during + training stage, both *data* and *label* will be feeded into the model, while during + prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and + of any shapes. The provided data and label names here should match the input names in a target + :class:`Symbol`. 
+ + A data provider should also implement the Julia iteration interface, in order to allow iterating + through the data set. The provider will be called in the following way: + + .. code-block:: julia + + for batch in provider + data = get_data(provider, batch) + end + + which will be translated by the Julia compiler into + + .. code-block:: julia + + state = Base.start(provider) + while !Base.done(provider, state) + (batch, state) = Base.next(provider, state) + data = get_data(provider, batch) + end + + The detailed interface functions are listed below: + + .. function:: Base.eltype(provider) -> AbstractDataBatch + + :param AbstractDataProvider provider: the data provider. + :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. + + .. function:: Base.start(provider) -> AbstractDataProviderState + + :param AbstractDataProvider provider: the data provider. + + This function is always called before iterating into the dataset. It should initialize + the iterator, reset the index, and do data shuffling if needed. + + .. function:: Base.done(provider, state) -> Bool + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataProviderState state: the state returned by :func:`Base.start` or :func:`Base.next`. + :return: true if there is no more data to iterate in this dataset. + + .. function:: Base.next(provider, state) -> (AbstractDataBatch, AbstractDataProviderState) + + :param AbstractDataProvider provider: the data provider. + :return: the current data batch, and the state for the next iteration. + + Note that sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that + is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this + case, you can safely assume that + + * :func:`Base.start` will always be called, and called only once before the iteration starts. 
+ * :func:`Base.done` will always be called at the beginning of every iteration and always be called once. + * If :func:`Base.done` return true, the iteration will stop, until the next round, again, starting with + a call to :func:`Base.start`. + * :func:`Base.next` will always be called only once in each iteration. It will always be called after + one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will + not be called. + + With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation + of the built-in :class:`MXDataProvider` for example. + + + + +.. class:: AbstractDataProviderState + + Base type for data provider states. + + + + +.. class:: AbstractDataBatch + + Base type for a data mini-batch. It should implement the following interfaces: + + .. function:: count_samples(batch) -> Int + + :param AbstractDataBatch batch: the data batch object. + :return: the number of samples in this batch. This number should be greater than 0, but + less than or equal to the batch size. This is used to indicate at the end of + the data set, there might not be enough samples for a whole mini-batch. + + .. function:: get_data(provider, batch) -> Vector{NDArray} + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :return: a vector of data in this batch, should be in the same order as declared in + :func:`provide_data() `. The last dimension + of each :class:`NDArray` should match the value returned by :func:`count_samples`. + + .. function:: get_label(provider, batch) -> Vector{NDArray} + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :return: a vector of labels in this batch. Similar to :func:`get_data`. 
+ + + diff --git a/docs/build-api.jl b/docs/build-api.jl index abccd31f1222..0d01e4f84ec8 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -78,3 +78,5 @@ extract_doc("callback.rst", "callback.jl") extract_doc("model.rst", "model.jl") extract_doc("optimizer.rst", "optimizer.jl") + +extract_doc("io.rst", "io.jl") diff --git a/docs/index.rst b/docs/index.rst index 1176f927174d..eda80ac1c18d 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -32,11 +32,12 @@ For more details, see documentation below. Please also checkout the `examples :caption: API Documentation api/model - api/callback api/initializer + api/optimizer + api/callback + api/io api/ndarray api/symbol - api/optimizer Indices and tables ================== diff --git a/src/io.jl b/src/io.jl index c8396c1d7182..9f4ad67d735b 100644 --- a/src/io.jl +++ b/src/io.jl @@ -1,76 +1,106 @@ -"""Root type for data provider +#=doc +Data Providers +============== -A data provider provides interface to iterate over a dataset. It should implement the following functions: +Data providers are wrappers that load external data, be it images, text, or general tensors, +and split it into mini-batches so that the model can consume the data in a uniformed way. +=# -```julia -provide_data(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} -provide_label(provider :: AbstractDataProvider) => Vector{Tuple{Base.Symbol, Tuple}} -``` +#=doc +.. class:: AbstractDataProvider -Returns a list of name-shape pairs, indicating the name and shape of the each data stream. For example, -`[(:data, (100,1,28,28))]` or `[(:softmax_label, (100,1))]`. It should also implement the following convenient -function + The root type for all data provider. A data provider should implement the following interfaces: -```julia -get_batch_size(provider :: AbstractDataProvider) => Int -``` + .. function:: get_batch_size(provider) -> Int -which returns the batch size used in this data provider. 
+ :param AbstractDataProvider provider: the data provider. + :return: the mini-batch size of the provided data. All the provided data should have the + same mini-batch size (i.e. the last dimension). -A data provider should implement the standard Julia iteration interface, including `Base.start`, -`Base.next`, `Base.done` and `Base.eltype`. It could safely assume that the interface functions will -always be called like + .. function:: provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} -```julia -for batch in provider - # ... - load_data!(batch, targets) -end -``` + :param AbstractDataProvider provider: the data provider. + :return: a vector of (name, shape) pairs describing the names of the data it provides, and + the corresponding shapes. -which translates into + .. function:: provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} -```julia -state = Base.start(provider) -while !Base.done(provider, state) - (batch, state) = Base.next(provider, state) - # ... - load_data!(batch, targets) -end -``` + :param AbstractDataProvider provider: the data provider. + :return: a vector of (name, shape) pairs describing the names of the labels it provides, and + the corresponding shapes. -In other words, it could safely assume that `Base.next` is always called after `Base.done`. And neither -of those function will be called twice consequtively. The detailed interfaces are list below: + The difference between *data* and *label* is that during + training stage, both *data* and *label* will be fed into the model, while during + prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and + of any shapes. The provided data and label names here should match the input names in a target + :class:`Symbol`. -```julia -Base.start(provider :: AbstractDataProvider) => AbstractDataProviderState -``` + A data provider should also implement the Julia iteration interface, in order to allow iterating + through the data set. 
The provider will be called in the following way: -Initialize or reset the data iteration. + .. code-block:: julia -```julia -Base.next(provider :: AbstractDataProvider, state :: AbstractDataProviderState) - => (AbstractDataBatch, AbstractDataProviderState) -``` + for batch in provider + data = get_data(provider, batch) + end -Return one batch of data. Actual data can be retrieved from the batch by interface functions described -in the document of type `AbstractDataBatch`. + which will be translated by the Julia compiler into -```julia -Base.done(provider :: AbstractDataProvider, state :: AbstractDataProviderState) => Bool -``` + .. code-block:: julia -Return `false` if there is more batch to get. + state = Base.start(provider) + while !Base.done(provider, state) + (batch, state) = Base.next(provider, state) + data = get_data(provider, batch) + end -```julia -Base.eltype(::Type{MyDataProvider}) => MyDataProviderState -``` + The detailed interface functions are listed below: -Return the type of the data provider state. -""" + .. function:: Base.eltype(provider) -> AbstractDataBatch + + :param AbstractDataProvider provider: the data provider. + :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. + + .. function:: Base.start(provider) -> AbstractDataProviderState + + :param AbstractDataProvider provider: the data provider. + + This function is always called before iterating into the dataset. It should initialize + the iterator, reset the index, and do data shuffling if needed. + + .. function:: Base.done(provider, state) -> Bool + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataProviderState state: the state returned by :func:`Base.start` or :func:`Base.next`. + :return: true if there is no more data to iterate in this dataset. + + .. function:: Base.next(provider, state) -> (AbstractDataBatch, AbstractDataProviderState) + + :param AbstractDataProvider provider: the data provider. 
+ :return: the current data batch, and the state for the next iteration. + + Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that + is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this + case, you can safely assume that + + * :func:`Base.start` will always be called, and called only once before the iteration starts. + * :func:`Base.done` will always be called at the beginning of every iteration and always be called once. + * If :func:`Base.done` return true, the iteration will stop, until the next round, again, starting with + a call to :func:`Base.start`. + * :func:`Base.next` will always be called only once in each iteration. It will always be called after + one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will + not be called. + + With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation + of the built-in :class:`MXDataProvider` for example. +=# abstract AbstractDataProvider -"""Root type for states of data provider""" +#=doc +.. class:: AbstractDataProviderState + + Base type for data provider states. +=# abstract AbstractDataProviderState """A tuple of (slice, NDArray). Usually each NDArray resides on a different device, and each @@ -78,6 +108,33 @@ abstract AbstractDataProviderState """ typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} +#=doc +.. class:: AbstractDataBatch + + Base type for a data mini-batch. It should implement the following interfaces: + + .. function:: count_samples(batch) -> Int + + :param AbstractDataBatch batch: the data batch object. + :return: the number of samples in this batch. This number should be greater than 0, but + less than or equal to the batch size. This is used to indicate at the end of + the data set, there might not be enough samples for a whole mini-batch. + + .. 
function:: get_data(provider, batch) -> Vector{NDArray} + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :return: a vector of data in this batch, should be in the same order as declared in + :func:`provide_data() `. The last dimension + of each :class:`NDArray` should match the value returned by :func:`count_samples`. + + .. function:: get_label(provider, batch) -> Vector{NDArray} + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :return: a vector of labels in this batch. Similar to :func:`get_data`. +=# + """Root type for data batch A data batch must implement the following interface function to actually provide the data and label. From 49a5acb3841d2ca8ed63a7ec2e4993e68d0b9602 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 12:46:00 -0400 Subject: [PATCH 154/630] import doc of built-in data provider. --- docs/api/io.rst | 242 +++++++++++++++++++++++++++++++++++++++++++- docs/api/symbol.rst | 92 ++++++++--------- docs/build-api.jl | 28 +++-- src/io.jl | 108 +++++++++++++------- src/symbol.jl | 4 +- 5 files changed, 377 insertions(+), 97 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index d3d060fb12f3..6d4ed63f8553 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -109,7 +109,7 @@ and split it into mini-batches so that the model can consume the data in a unifo Base type for a data mini-batch. It should implement the following interfaces: - .. function:: count_samples(batch) -> Int + .. function:: count_samples(provider, batch) -> Int :param AbstractDataBatch batch: the data batch object. :return: the number of samples in this batch. This number should be greater than 0, but @@ -121,8 +121,11 @@ and split it into mini-batches so that the model can consume the data in a unifo :param AbstractDataProvider provider: the data provider. :param AbstractDataBatch batch: the data batch object. 
:return: a vector of data in this batch, should be in the same order as declared in - :func:`provide_data() `. The last dimension - of each :class:`NDArray` should match the value returned by :func:`count_samples`. + :func:`provide_data() `. + + The last dimension of each :class:`NDArray` should always match the batch_size, even when + :func:`count_samples` returns a value less than the batch size. In this case, + the data provider is free to pad the remaining contents with any value. .. function:: get_label(provider, batch) -> Vector{NDArray} @@ -131,4 +134,237 @@ and split it into mini-batches so that the model can consume the data in a unifo :return: a vector of labels in this batch. Similar to :func:`get_data`. + The following function will be automatically defined. They are primarily useful for debugging + and testing. + + .. function:: get(provider, batch, name) -> NDArray + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param Base.Symbol name: the name of the data to get, should be one of the names + provided in either :func:`provide_data() ` + or :func:`provide_label() `. + :return: the corresponding data array corresponding to that name. + + + + +.. class:: MXDataProvider + + A data provider that wrap built-in data iterators from libmxnet. + + + + +Built-in data providers in libmxnet +----------------------------------- + +.. function:: ImageRecordIter(...) + + Can also be called with the alias ``ImageRecordProvider``. + Create iterator for dataset packed in recordio. + + :param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data. + :param Base.Symbol label_name: keyword argument, default ``:softmax_label``. The name of the label. Could be ``nothing`` if no label is presented in this dataset. + + :param path_imglist: Dataset Param: Path to image list. 
+ :type path_imglist: string, optional, default='' + + + :param path_imgrec: Dataset Param: Path to image record file. + :type path_imgrec: string, optional, default='./data/imgrec.rec' + + + :param label_width: Dataset Param: How many labels for an image. + :type label_width: int, optional, default='1' + + + :param data_shape: Dataset Param: Shape of each instance generated by the DataIter. + :type data_shape: Shape(tuple), required + + + :param preprocess_threads: Backend Param: Number of thread to do preprocessing. + :type preprocess_threads: int, optional, default='4' + + + :param verbose: Auxiliary Param: Whether to output parser information. + :type verbose: boolean, optional, default=True + + + :param num_parts: partition the data into multiple parts + :type num_parts: int, optional, default='1' + + + :param part_index: the index of the part will read + :type part_index: int, optional, default='0' + + + :param shuffle: Augmentation Param: Whether to shuffle data. + :type shuffle: boolean, optional, default=False + + + :param seed: Augmentation Param: Random Seed. + :type seed: int, optional, default='0' + + + :param batch_size: Batch Param: Batch size. + :type batch_size: int (non-negative), required + + + :param round_batch: Batch Param: Use round robin to handle overflow batch. + :type round_batch: boolean, optional, default=True + + + :param prefetch_buffer: Backend Param: Number of prefetched parameters + :type prefetch_buffer: , optional, default=4 + + + :param rand_crop: Augmentation Param: Whether to random crop on the image + :type rand_crop: boolean, optional, default=False + + + :param crop_y_start: Augmentation Param: Where to nonrandom crop on y. + :type crop_y_start: int, optional, default='-1' + + + :param crop_x_start: Augmentation Param: Where to nonrandom crop on x. + :type crop_x_start: int, optional, default='-1' + + + :param max_rotate_angle: Augmentation Param: rotated randomly in [-max_rotate_angle, max_rotate_angle]. 
+ :type max_rotate_angle: int, optional, default='0' + + + :param max_aspect_ratio: Augmentation Param: denotes the max ratio of random aspect ratio augmentation. + :type max_aspect_ratio: float, optional, default=0 + + + :param max_shear_ratio: Augmentation Param: denotes the max random shearing ratio. + :type max_shear_ratio: float, optional, default=0 + + + :param max_crop_size: Augmentation Param: Maximum crop size. + :type max_crop_size: int, optional, default='-1' + + + :param min_crop_size: Augmentation Param: Minimum crop size. + :type min_crop_size: int, optional, default='-1' + + + :param max_random_scale: Augmentation Param: Maxmum scale ratio. + :type max_random_scale: float, optional, default=1 + + + :param min_random_scale: Augmentation Param: Minimum scale ratio. + :type min_random_scale: float, optional, default=1 + + + :param max_img_size: Augmentation Param: Maxmum image size after resizing. + :type max_img_size: float, optional, default=1e+10 + + + :param min_img_size: Augmentation Param: Minimum image size after resizing. + :type min_img_size: float, optional, default=0 + + + :param rotate: Augmentation Param: Rotate angle. + :type rotate: int, optional, default='-1' + + + :param fill_value: Augmentation Param: Maximum value of illumination variation. + :type fill_value: int, optional, default='255' + + + :param mirror: Augmentation Param: Whether to mirror the image. + :type mirror: boolean, optional, default=False + + + :param rand_mirror: Augmentation Param: Whether to mirror the image randomly. + :type rand_mirror: boolean, optional, default=False + + + :param mean_img: Augmentation Param: Mean Image to be subtracted. + :type mean_img: string, optional, default='' + + + :param mean_r: Augmentation Param: Mean value on R channel. + :type mean_r: float, optional, default=0 + + + :param mean_g: Augmentation: Mean value on G channel. + :type mean_g: float, optional, default=0 + + + :param mean_b: Augmentation: Mean value on B channel. 
+ :type mean_b: float, optional, default=0 + + + :param scale: Augmentation Param: Scale in color space. + :type scale: float, optional, default=1 + + + :param max_random_contrast: Augmentation Param: Maximum ratio of contrast variation. + :type max_random_contrast: float, optional, default=0 + + + :param max_random_illumination: Augmentation Param: Maximum value of illumination variation. + :type max_random_illumination: float, optional, default=0 + + :return: the constructed :class:`MXDataProvider`. + + + +.. function:: MNISTIter(...) + + Can also be called with the alias ``MNISTProvider``. + Create iterator for MNIST hand-written digit number recognition dataset. + + :param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data. + :param Base.Symbol label_name: keyword argument, default ``:softmax_label``. The name of the label. Could be ``nothing`` if no label is presented in this dataset. + + :param image: Dataset Param: Mnist image path. + :type image: string, optional, default='./train-images-idx3-ubyte' + + + :param label: Dataset Param: Mnist label path. + :type label: string, optional, default='./train-labels-idx1-ubyte' + + + :param batch_size: Batch Param: Batch Size. + :type batch_size: int, optional, default='128' + + + :param shuffle: Augmentation Param: Whether to shuffle data. + :type shuffle: boolean, optional, default=True + + + :param flat: Augmentation Param: Whether to flat the data into 1D. + :type flat: boolean, optional, default=False + + + :param seed: Augmentation Param: Random Seed. + :type seed: int, optional, default='0' + + + :param silent: Auxiliary Param: Whether to print out data info. 
+ :type silent: boolean, optional, default=False + + + :param num_parts: partition the data into multiple parts + :type num_parts: int, optional, default='1' + + + :param part_index: the index of the part will read + :type part_index: int, optional, default='0' + + + :param prefetch_buffer: Backend Param: Number of prefetched parameters + :type prefetch_buffer: , optional, default=4 + + :return: the constructed :class:`MXDataProvider`. + + + + + diff --git a/docs/api/symbol.rst b/docs/api/symbol.rst index 457b462982ad..2c7df712c2f8 100644 --- a/docs/api/symbol.rst +++ b/docs/api/symbol.rst @@ -48,9 +48,9 @@ Public APIs :param act_type: Activation function to be applied. :type act_type: {'relu', 'sigmoid', 'tanh'}, required - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -71,9 +71,9 @@ Public APIs :param momentum: Momentum for moving average :type momentum: float, optional, default=0.1 - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -86,9 +86,9 @@ Public APIs :param data: Input data. :type data: Symbol - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -103,9 +103,9 @@ Public APIs :param num_args: Number of inputs to be concated. :type num_args: int, required - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. 
+ :return: the constructed :class:`Symbol`. @@ -154,9 +154,9 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=False - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -173,9 +173,9 @@ Public APIs :param p: Fraction of the input that gets dropped out at training time :type p: float, optional, default=0.5 - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -190,9 +190,9 @@ Public APIs :param num_args: Number of inputs to be sumed. :type num_args: int, required - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -205,9 +205,9 @@ Public APIs :param data: Input data to flatten. :type data: Symbol - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -236,9 +236,9 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=False - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -267,9 +267,9 @@ Public APIs :param nsize: normalization window width in elements. 
:type nsize: int (non-negative), required - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -298,9 +298,9 @@ Public APIs :param upper_bound: Upper bound of random slope. (For rrelu only) :type upper_bound: float, optional, default=0.334 - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -317,9 +317,9 @@ Public APIs :param label: Input label to function. :type label: Symbol - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -337,9 +337,9 @@ Public APIs :param label: Input label to function. :type label: Symbol - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -368,9 +368,9 @@ Public APIs :param pad: pad for pooling: (y, x) :type pad: Shape(tuple), optional, default=(0, 0) - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -387,9 +387,9 @@ Public APIs :param target_shape: Target new shape :type target_shape: Shape(tuple), required - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. 
- :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -402,9 +402,9 @@ Public APIs :param num_outputs: Number of outputs to be sliced. :type num_outputs: int, required - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -425,9 +425,9 @@ Public APIs :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -440,9 +440,9 @@ Public APIs :param src: Source symbolic input to the function :type src: Symbol - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -455,9 +455,9 @@ Public APIs :param src: Source symbolic input to the function :type src: Symbol - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -473,9 +473,9 @@ Internal APIs Perform an elementwise div. - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -485,9 +485,9 @@ Internal APIs Perform an elementwise minus. 
- :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -497,9 +497,9 @@ Internal APIs Perform an elementwise mul. - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. @@ -509,9 +509,9 @@ Internal APIs Perform an elementwise plus. - :param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. - :return: The constructed :class:`Symbol`. + :return: the constructed :class:`Symbol`. diff --git a/docs/build-api.jl b/docs/build-api.jl index 0d01e4f84ec8..0aed51a9a022 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -43,21 +43,28 @@ function embed_mxnet_api(output_filename::AbstractString, key::AbstractString, g names_pub, names_pri = sort_api_names(keys(docs)) docs_pub = join(map(gen_doc, names_pub), "\n\n") docs_pri = join(map(gen_doc, names_pri), "\n\n") - docstrings = """ - Public APIs - ^^^^^^^^^^^ - """ * docs_pub + if isempty(names_pri) + docstrings = "" + else + docstrings = """ + Public APIs + ^^^^^^^^^^^ + """ + end + docstrings *= docs_pub - docstrings *= """ + if !isempty(names_pri) + docstrings *= """ - Internal APIs - ^^^^^^^^^^^^^ + Internal APIs + ^^^^^^^^^^^^^ - .. note:: + .. note:: - Document and signatures for internal API functions might be incomplete. + Document and signatures for internal API functions might be incomplete. 
- """ * docs_pri + """ * docs_pri + end key = mx.format(mx.DOC_EMBED_ANCHOR, key) println(io, replace(contents, key, docstrings)) @@ -80,3 +87,4 @@ extract_doc("model.rst", "model.jl") extract_doc("optimizer.rst", "optimizer.jl") extract_doc("io.rst", "io.jl") +embed_mxnet_api("io.rst", "io", mx._import_io_iterators) diff --git a/src/io.jl b/src/io.jl index 9f4ad67d735b..52a0a8680a1f 100644 --- a/src/io.jl +++ b/src/io.jl @@ -103,17 +103,12 @@ abstract AbstractDataProvider =# abstract AbstractDataProviderState -"""A tuple of (slice, NDArray). Usually each NDArray resides on a different device, and each - slice describe which part of a larger piece of data should goto that device. -""" -typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} - #=doc .. class:: AbstractDataBatch Base type for a data mini-batch. It should implement the following interfaces: - .. function:: count_samples(batch) -> Int + .. function:: count_samples(provider, batch) -> Int :param AbstractDataBatch batch: the data batch object. :return: the number of samples in this batch. This number should be greater than 0, but @@ -125,15 +120,37 @@ typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} :param AbstractDataProvider provider: the data provider. :param AbstractDataBatch batch: the data batch object. :return: a vector of data in this batch, should be in the same order as declared in - :func:`provide_data() `. The last dimension - of each :class:`NDArray` should match the value returned by :func:`count_samples`. + :func:`provide_data() `. + + The last dimension of each :class:`NDArray` should always match the batch_size, even when + :func:`count_samples` returns a value less than the batch size. In this case, + the data provider is free to pad the remaining contents with any value. .. function:: get_label(provider, batch) -> Vector{NDArray} :param AbstractDataProvider provider: the data provider. :param AbstractDataBatch batch: the data batch object. :return: a vector of labels in this batch. 
Similar to :func:`get_data`. + + + The following function will be automatically defined. They are primarily useful for debugging + and testing. + + .. function:: get(provider, batch, name) -> NDArray + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param Base.Symbol name: the name of the data to get, should be one of the names + provided in either :func:`provide_data() ` + or :func:`provide_label() `. + :return: the corresponding data array corresponding to that name. =# +abstract AbstractDataBatch + +"""A tuple of (slice, NDArray). Usually each NDArray resides on a different device, and each + slice describe which part of a larger piece of data should goto that device. +""" +typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} """Root type for data batch @@ -167,7 +184,6 @@ Return the number of *dummy samples* in this mini-batch. The Batch type should have a field named `provider` pointing to the underlying provider. Helper functions `get_data` and `get_label` (mainly for debug purpose) will be able to use this. """ -abstract AbstractDataBatch function _get_data_or_label(batch::AbstractDataBatch, provide_func::Function, loader::Function) data_shapes = provide_func(batch.provider) @@ -343,11 +359,11 @@ end ################################################################################ -# MXDataProvider -################################################################################ +#=doc +.. class:: MXDataProvider -"""Wrapper of built-in `libmxnet` data iterators. -""" + A data provider that wrap built-in data iterators from libmxnet. 
+=# type MXDataProvider <: AbstractDataProvider handle :: MX_DataIterHandle data_shape :: Vector{Tuple{Base.Symbol, Tuple}} @@ -375,7 +391,7 @@ function _get_label(handle :: MX_DataIterHandle) end function MXDataProvider(handle :: MX_DataIterHandle; - data_name :: Union{Base.Symbol,Void}=:data, + data_name :: Base.Symbol=:data, label_name :: Union{Base.Symbol,Void}=:softmax_label, kwargs...) # for convenience, we ignore the rest keyword arguments # init iterator, load the first batch and get shapes @@ -387,7 +403,6 @@ function MXDataProvider(handle :: MX_DataIterHandle; else label_shape = Tuple{Base.Symbol, Tuple}[] end - _reset_data_iter(handle) MXDataProvider(handle, data_shape, label_shape, data_shape[1][2][end]) end @@ -399,8 +414,7 @@ get_batch_size(provider::MXDataProvider) = provider.batch_size type MXDataProviderState <: AbstractDataProviderState has_next :: Bool end -type MXDataBatch <: AbstractDataBatch - provider :: MXDataProvider +immutable MXDataBatch <: AbstractDataBatch end function Base.eltype(provider :: MXDataProvider) @@ -418,29 +432,25 @@ function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) return (MXDataBatch(provider), state) end -function _load_general!(batch :: MXDataBatch, loader :: Function, targets :: Vector{Vector{SlicedNDArray}}) - @assert length(targets) == 1 - src = loader(batch.provider.handle) - for (idx, target) in targets[1] - copy!(target, slice(src, idx)) - end -end - -function load_data!(batch :: MXDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - _load_general!(batch, _get_data, targets) +function get_data(provider :: MXDataProvider, batch :: MXDataBatch) + return NDArray[_get_data(provider.handle)] end -function load_label!(batch :: MXDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - _load_general!(batch, _get_label, targets) +function get_label(provider :: MXDataProvider, batch :: MXDataBatch) + return NDArray[_get_label(provider.handle)] end - -function get_pad(batch :: MXDataBatch) 
+function count_samples(provider :: MXDataProvider, batch :: MXDataBatch) ref_pad = Ref{Cint}(0) @mxcall(:MXDataIterGetPadNum, (MX_handle, Ref{Cint}), batch.provider.handle, ref_pad) - return Int(ref_pad[]) + return provider.batch_size - Int(ref_pad[]) end +#=doc +Built-in data providers in libmxnet +----------------------------------- -function _define_data_iter_creator(hdr :: MX_handle) +**autogen:EMBED:io:EMBED:autogen** +=# +function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) ref_name = Ref{char_p}(0) ref_desc = Ref{char_p}(0) ref_narg = Ref{MX_uint}(0) @@ -453,6 +463,22 @@ function _define_data_iter_creator(hdr :: MX_handle) hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) iter_name = symbol(bytestring(ref_name[])) + + if gen_docs + if endswith(string(iter_name), "Iter") + f_desc = "Can also be called with the alias ``$(string(iter_name)[1:end-4] * "Provider")``.\n" + else + f_desc = "" + end + f_desc *= bytestring(ref_desc[]) * "\n\n" + f_desc *= ":param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data.\n" + f_desc *= ":param Base.Symbol label_name: keyword argument, default ``:softmax_label``. " * + "The name of the label. Could be ``nothing`` if no label is presented in this dataset.\n\n" + f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) + f_desc *= ":return: the constructed :class:`MXDataProvider`." + return (iter_name, f_desc) + end + defun = quote function $iter_name(; kwargs...) 
arg_keys = AbstractString[string(k) for (k,v) in kwargs] @@ -466,7 +492,6 @@ function _define_data_iter_creator(hdr :: MX_handle) end end eval(defun) - # TODO: add docstring # add an alias XXXProvider => XXXIter if endswith(string(iter_name), "Iter") @@ -475,7 +500,7 @@ function _define_data_iter_creator(hdr :: MX_handle) end end -function _import_io_iterators() +function _import_io_iterators(;gen_docs::Bool=false) n_ref = Ref{MX_uint}(0) h_ref = Ref{Ptr{MX_handle}}(0) @mxcall(:MXListDataIters, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) @@ -483,8 +508,19 @@ function _import_io_iterators() n_creators = n_ref[] h_creators = pointer_to_array(h_ref[], n_creators) + if gen_docs + docs = Dict{Base.Symbol, AbstractString}() + end + for i = 1:n_creators creator_hdr = h_creators[i] - _define_data_iter_creator(creator_hdr) + ret = _define_data_iter_creator(creator_hdr; gen_docs=gen_docs) + if gen_docs + docs[ret[1]] = ret[2] + end + end + + if gen_docs + return docs end end diff --git a/src/symbol.jl b/src/symbol.jl index ed7e2d77c411..13338602f259 100644 --- a/src/symbol.jl +++ b/src/symbol.jl @@ -308,8 +308,8 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) f_desc *= "This function support variable length positional :class:`Symbol` inputs.\n\n" end f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional.\n\n" - f_desc *= ":return: The constructed :class:`Symbol`.\n\n" + f_desc *= ":param Base.Symbol name: The name of the symbol. (e.g. 
`:my_symbol`), optional.\n\n" + f_desc *= ":return: the constructed :class:`Symbol`.\n\n" return (func_name, f_desc) end From 76fee6ba4748da7bd59c34c0bb37398eb30eeb53 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 13:28:53 -0400 Subject: [PATCH 155/630] refine mxdataiter api --- docs/api/io.rst | 35 ++++++++++++++++-- src/io.jl | 94 ++++++++++++++++++++++++++++++++++++------------- src/model.jl | 14 ++++---- 3 files changed, 109 insertions(+), 34 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index 6d4ed63f8553..1e23217ace3b 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -134,8 +134,7 @@ and split it into mini-batches so that the model can consume the data in a unifo :return: a vector of labels in this batch. Similar to :func:`get_data`. - The following function will be automatically defined. They are primarily useful for debugging - and testing. + The following utility functions will be automatically defined. .. function:: get(provider, batch, name) -> NDArray @@ -146,6 +145,38 @@ and split it into mini-batches so that the model can consume the data in a unifo or :func:`provide_label() `. :return: the corresponding data array corresponding to that name. + .. function:: load_data!(provider, batch, targets) + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param targets: the targets to load data into. + :type targets: Vector{Vector{SlicedNDArray}} + + The targets is a list of the same length as number of data provided by this provider. + Each element in the list is a ``Vector{SlicedNDArray}``. This vector described a + spliting of this data batch into different slices, each slice is specified by + a slice-ndarray pair, where *slice* specify the range of samples in the mini-batch + that should be loaded into the corresponding *ndarray*. 
+ + This utility function is used in data parallelization, where a mini-batch is splited + and computed on several different devices. + + .. function:: load_label!(provider, batch, targets) + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param targets: the targets to load label into. + :type targets: Vector{Vector{SlicedNDArray}} + + The same as :func:`load_data!`, except that this is for loading labels. + + + + +.. class:: SlicedNDArray + + A alias type of ``Pair{UnitRange{Int},NDArray}``. + diff --git a/src/io.jl b/src/io.jl index 52a0a8680a1f..2c694ef316f6 100644 --- a/src/io.jl +++ b/src/io.jl @@ -133,8 +133,7 @@ abstract AbstractDataProviderState :return: a vector of labels in this batch. Similar to :func:`get_data`. - The following function will be automatically defined. They are primarily useful for debugging - and testing. + The following utility functions will be automatically defined. .. function:: get(provider, batch, name) -> NDArray @@ -144,14 +143,59 @@ abstract AbstractDataProviderState provided in either :func:`provide_data() ` or :func:`provide_label() `. :return: the corresponding data array corresponding to that name. + + .. function:: load_data!(provider, batch, targets) + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param targets: the targets to load data into. + :type targets: Vector{Vector{SlicedNDArray}} + + The targets is a list of the same length as number of data provided by this provider. + Each element in the list is a list of :class:`SlicedNDArray`. This list described a + spliting scheme of this data batch into different slices, each slice is specified by + a slice-ndarray pair, where *slice* specify the range of samples in the mini-batch + that should be loaded into the corresponding *ndarray*. 
+ + This utility function is used in data parallelization, where a mini-batch is splited + and computed on several different devices. + + .. function:: load_label!(provider, batch, targets) + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param targets: the targets to load label into. + :type targets: Vector{Vector{SlicedNDArray}} + + The same as :func:`load_data!`, except that this is for loading labels. =# abstract AbstractDataBatch -"""A tuple of (slice, NDArray). Usually each NDArray resides on a different device, and each - slice describe which part of a larger piece of data should goto that device. -""" +#=doc +.. class:: SlicedNDArray + + A alias type of ``Tuple{UnitRange{Int},NDArray}``. +=# typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} +function _load_general!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, + targets :: Vector{Vector{SlicedNDArray}}, loader::Function) + data = loader(provider, batch) + for (d_src, d_targets) in zip(data, targets) + for (slice_idx, d_dst) in d_targets + copy!(d_dst, slice(d_src, slice_idx)) + end + end +end +function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, + targets :: Vector{Vector{SlicedNDArray}}) + _load_general!(provider, batch, targets, get_data) +end +function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, + targets :: Vector{Vector{SlicedNDArray}}) + _load_general!(provider, batch, targets, get_label) +end + """Root type for data batch A data batch must implement the following interface function to actually provide the data and label. @@ -185,25 +229,25 @@ The Batch type should have a field named `provider` pointing to the underlying p `get_data` and `get_label` (mainly for debug purpose) will be able to use this. 
""" -function _get_data_or_label(batch::AbstractDataBatch, provide_func::Function, loader::Function) - data_shapes = provide_func(batch.provider) - data_arrays = [mx.empty(x[2]) for x in data_shapes] - batch_size = get_batch_size(batch.provider) - data_arrays_fake_slice = [SlicedNDArray[(1:batch_size, x)] for x in data_arrays] - loader(batch, data_arrays_fake_slice) - - if length(data_arrays) == 1 - return data_arrays[1] - else - return data_arrays - end -end -function get_data(batch :: AbstractDataBatch) - _get_data_or_label(batch, provide_data, load_data!) -end -function get_label(batch :: AbstractDataBatch) - _get_data_or_label(batch, provide_label, load_label!) -end +#function _get_data_or_label(batch::AbstractDataBatch, provide_func::Function, loader::Function) +# data_shapes = provide_func(batch.provider) +# data_arrays = [mx.empty(x[2]) for x in data_shapes] +# batch_size = get_batch_size(batch.provider) +# data_arrays_fake_slice = [SlicedNDArray[(1:batch_size, x)] for x in data_arrays] +# loader(batch, data_arrays_fake_slice) +# +# if length(data_arrays) == 1 +# return data_arrays[1] +# else +# return data_arrays +# end +#end +#function get_data(batch :: AbstractDataBatch) +# _get_data_or_label(batch, provide_data, load_data!) +#end +#function get_label(batch :: AbstractDataBatch) +# _get_data_or_label(batch, provide_label, load_label!) 
+#end ################################################################################ # ArrayDataProvider @@ -429,7 +473,7 @@ function Base.done(provider :: MXDataProvider, state :: MXDataProviderState) return !state.has_next end function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) - return (MXDataBatch(provider), state) + return (MXDataBatch(), state) end function get_data(provider :: MXDataProvider, batch :: MXDataBatch) diff --git a/src/model.jl b/src/model.jl index 5b42278f8db2..d49aca6c040a 100644 --- a/src/model.jl +++ b/src/model.jl @@ -186,12 +186,12 @@ function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::B data_arrays = [SlicedNDArray[(1:batch_size, self.pred_exec.arg_dict[name])] for name in data_names] output_list = [Array{MX_float}[] for i=1:length(self.pred_exec.outputs)] for batch in data - load_data!(batch, data_arrays) + load_data!(data, batch, data_arrays) forward(self.pred_exec, is_train=false) if isa(callback, Void) # no callback, accumulate the data and return at the end for (o_list, o_nd) in zip(output_list, self.pred_exec.outputs) - push!(o_list, copy(slice(o_nd, 1:batch_size-get_pad(batch)))) + push!(o_list, copy(slice(o_nd, 1:count_samples(data, batch)))) end else outputs = self.pred_exec.outputs @@ -403,8 +403,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) for batch in data - load_data!(batch, data_arrays) - load_label!(batch, label_arrays) + load_data!(data, batch, data_arrays) + load_label!(data, batch, label_arrays) # forward and backward for (texec, islice) in zip(train_execs, slices) @@ -453,7 +453,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) # update evaluation metric on training set - load_label!(batch, cpu_label_arrays_full_slice) + load_label!(data, batch, 
cpu_label_arrays_full_slice) update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) end # end of one epoch @@ -474,7 +474,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra reset!(opts.eval_metric) for batch in opts.eval_data - load_data!(batch, data_arrays) + load_data!(opts.eval_data, batch, data_arrays) # forward and backward for (texec, islice) in zip(train_execs, slices) @@ -485,7 +485,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra copy!(slice(cpu_out, islice), dev_out) end end - load_label!(batch, cpu_label_arrays_full_slice) + load_label!(opts.eval_data, batch, cpu_label_arrays_full_slice) update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) end From 5e03d2783a298186ea47a4c70d16137dde6d2678 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 18:37:44 -0400 Subject: [PATCH 156/630] fix unittest for new data IO api --- docs/api/io.rst | 29 +++++++- src/io.jl | 176 +++++++++++++++++++++++++++++++------------- src/ndarray.jl | 10 +++ test/unittest/io.jl | 19 +++-- 4 files changed, 170 insertions(+), 64 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index 1e23217ace3b..2e8a62dd7a08 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -95,6 +95,22 @@ and split it into mini-batches so that the model can consume the data in a unifo With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation of the built-in :class:`MXDataProvider` for example. + .. caution:: + + Please do not use the one data provider simultaneously in two different places, either in parallel, + or in a nested loop. For example, the behavior for the following code is undefined + + .. code-block:: julia + + for batch in data + # updating the parameters + + # now let's test the performance on the training set + for b2 in data + # ... 
+ end + end + @@ -153,8 +169,8 @@ and split it into mini-batches so that the model can consume the data in a unifo :type targets: Vector{Vector{SlicedNDArray}} The targets is a list of the same length as number of data provided by this provider. - Each element in the list is a ``Vector{SlicedNDArray}``. This vector described a - spliting of this data batch into different slices, each slice is specified by + Each element in the list is a list of :class:`SlicedNDArray`. This list describes a + splitting scheme of this data batch into different slices, each slice is specified by a slice-ndarray pair, where *slice* specify the range of samples in the mini-batch that should be loaded into the corresponding *ndarray*. @@ -175,7 +191,14 @@ and split it into mini-batches so that the model can consume the data in a unifo .. class:: SlicedNDArray - A alias type of ``Pair{UnitRange{Int},NDArray}``. + An alias type of ``Tuple{UnitRange{Int},NDArray}``. + + + + +.. class:: ArrayDataProvider + + A convenient tool to iterate :class:`NDArray` or Julia ``Array``. diff --git a/src/io.jl b/src/io.jl index 2c694ef316f6..8fae4bcbb15b 100644 --- a/src/io.jl +++ b/src/io.jl @@ -93,6 +93,22 @@ and split it into mini-batches so that the model can consume the data in a unifo With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation of the built-in :class:`MXDataProvider` for example. + + .. caution:: + + Please do not use the same data provider simultaneously in two different places, either in parallel, + or in a nested loop. For example, the behavior for the following code is undefined + + .. code-block:: julia + + for batch in data + # updating the parameters + + # now let's test the performance on the training set + for b2 in data + # ... 
+ end + end =# abstract AbstractDataProvider @@ -196,6 +212,21 @@ function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatc _load_general!(provider, batch, targets, get_label) end +import Base.get +function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name :: Base.Symbol) + for (idx, (k, s)) in enumerate(provide_data(provider)) + if name == k + return get_data(provider, batch)[idx] + end + end + for (idx, (k, s)) in enumerate(provide_label(provider)) + if name == k + return get_label(provider, batch)[idx] + end + end + error("$name is not provided by this data provider") +end + """Root type for data batch A data batch must implement the following interface function to actually provide the data and label. @@ -250,9 +281,11 @@ The Batch type should have a field named `provider` pointing to the underlying p #end ################################################################################ -# ArrayDataProvider -################################################################################ -"A convenient tool to iterate `NDArray` or Julia `Array`" +#=doc +.. class:: ArrayDataProvider + + A convenient tool to iterate :class:`NDArray` or Julia ``Array``. +=# type ArrayDataProvider <: AbstractDataProvider data_arrays :: Vector{Array{MX_float}} data_names :: Vector{Base.Symbol} @@ -263,8 +296,10 @@ type ArrayDataProvider <: AbstractDataProvider shuffle :: Bool data_padding :: MX_float label_padding :: MX_float -end + data_batch :: Vector{NDArray} + label_batch :: Vector{NDArray} +end # Julia's type system is sometimes very frustrating. You cannot specify a function # with argument Vector{Pair} to expect to be matched when calling with the parameter @@ -272,40 +307,43 @@ end # results, about the parametric type in the Pair{T1,T2} type, thus does not match the # generic Pair type. In general, Int <: Number but Vector{Int} <: Vector{Number} is not # true. So let us just use Any here... 
-function ArrayDataProvider(data::Any; batch_size::Int=1, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) +function ArrayDataProvider(data::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle, data_padding=data_padding, label_padding=label_padding) end -function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) +function ArrayDataProvider(data::Any, label::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) + asarr{T}(arr :: Array{T}) = convert(Array{MX_float}, arr) + asarr(arr :: NDArray) = copy(arr) + if isa(data, Union{NDArray, Array}) && eltype(data) <: Real data_names = [:data] - data_arrays = Array{MX_float}[data] + data_arrays = Array{MX_float}[asarr(data)] elseif isa(data, Pair) @assert isa(data.first, Base.Symbol) && isa(data.second, Union{NDArray, Array}) data_names = [data.first] - data_arrays = Array{MX_float}[data.second] + data_arrays = Array{MX_float}[asarr(data.second)] elseif isa(data, Vector) || isa(data, Tuple) map(data) do d @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) end data_names = Base.Symbol[d.first for d in data] - data_arrays = Array{MX_float}[d.second for d in data] + data_arrays = Array{MX_float}[asarr(d.second) for d in data] else error("Invalid data argument type") end if isa(label, Union{NDArray, Array}) && eltype(label) <: Real label_names = [:softmax_label] - label_arrays = Array{MX_float}[label] + label_arrays = Array{MX_float}[asarr(label)] elseif isa(label, Pair) @assert isa(label.first, Base.Symbol) && isa(label.second, Union{NDArray, Array}) label_names = [label.first] - label_arrays = Array{MX_float}[label.second] + label_arrays = Array{MX_float}[asarr(label.second)] elseif isa(label, Vector) || isa(label, Tuple) map(label) do d @assert isa(d, 
Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) end label_names = Base.Symbol[d.first for d in label] - label_arrays = Array{MX_float}[d.second for d in label] + label_arrays = Array{MX_float}[asarr(d.second) for d in label] else error("Invalid label argument type") end @@ -321,8 +359,31 @@ function ArrayDataProvider(data::Any, label::Any; batch_size::Int=1, shuffle::Bo "Number of samples in $(label_names[i]) is mismatch with $(data_names[1])") end + if batch_size == 0 + batch_size = sample_count + end + @assert 0 < batch_size <= sample_count + + function gen_batch_nds(arrs :: Vector{Array{MX_float}}, bsize :: Int) + map(arrs) do arr + shape = size(arr) + empty(shape[1:end-1]..., bsize) + end + end + + data_batch = gen_batch_nds(data_arrays, batch_size) + label_batch = gen_batch_nds(label_arrays, batch_size) + + # reshape data and labels into 2D tensors, so that it is easier to work with them + data_arrays = map(data_arrays) do arr + reshape(arr, prod(size(arr)[1:end-1]), size(arr)[end]) + end + label_arrays = map(label_arrays) do arr + reshape(arr, prod(size(arr)[1:end-1]), size(arr)[end]) + end + ArrayDataProvider(data_arrays, data_names, label_arrays, label_names, batch_size, - sample_count, shuffle, data_padding, label_padding) + sample_count, shuffle, data_padding, label_padding, data_batch, label_batch) end function provide_data(provider::ArrayDataProvider) @@ -341,17 +402,12 @@ function Base.eltype(provider :: ArrayDataProvider) ArrayDataProviderState end -function _shuffle_array(arr::Array, idx::Vector{Int}) - shape = size(arr) - colons = [Colon() for c = 1:length(shape)-1] - getindex(arr, colons..., idx) -end function Base.start(provider :: ArrayDataProvider) if provider.shuffle # re-shuffle all data idx_perm = randperm(provider.sample_count) - provider.data_arrays = map(x->_shuffle_array(x,idx_perm), provider.data_arrays) - provider.label_arrays = map(x->_shuffle_array(x,idx_perm), provider.label_arrays) + provider.data_arrays = 
map(x->x[:,idx_perm], provider.data_arrays) + provider.label_arrays = map(x->x[:,idx_perm], provider.label_arrays) end return ArrayDataProviderState(1) @@ -362,43 +418,61 @@ function Base.done(provider::ArrayDataProvider, state :: ArrayDataProviderState) end immutable ArrayDataBatch <: AbstractDataBatch - provider :: ArrayDataProvider - idx :: UnitRange{Int} + idx :: UnitRange{Int} end function Base.next(provider :: ArrayDataProvider, state :: ArrayDataProviderState) idx = state.curr_idx:min(state.curr_idx+provider.batch_size-1, provider.sample_count) - return (ArrayDataBatch(provider, idx), ArrayDataProviderState(idx.stop+1)) -end - -function get_pad(batch :: ArrayDataBatch) - return batch.provider.batch_size - length(batch.idx) -end - -function _load_general!(batch :: ArrayDataBatch, sources :: Vector{Array{MX_float}}, - targets :: Vector{Vector{SlicedNDArray}}, pad_val::Real) - @assert length(sources) == length(targets) - for (src, tgt) in zip(sources, targets) - src_colons = [Colon() for i = 1:ndims(src)-1] - for (slice_idx, dst) in tgt - if slice_idx.start > length(batch.idx) - dst[:] = pad_val - else - slice_idx0 = slice_idx.start:min(slice_idx.stop, length(batch.idx)) - copy!(dst[1:length(slice_idx0)], getindex(src, src_colons..., batch.idx[slice_idx0])) - if length(slice_idx0) < length(slice_idx) - # need padding - dst[length(slice_idx0)+1:length(slice_idx)] = pad_val - end - end - end - end + return (ArrayDataBatch(idx), ArrayDataProviderState(idx.stop+1)) end -function load_data!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - _load_general!(batch, batch.provider.data_arrays, targets, batch.provider.data_padding) + +function count_samples(provider :: ArrayDataProvider, batch :: ArrayDataBatch) + return length(batch.idx) end -function load_label!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) - _load_general!(batch, batch.provider.label_arrays, targets, batch.provider.label_padding) + +function get_data(provider :: 
ArrayDataProvider, batch :: ArrayDataBatch) + for (src, dst) in zip(provider.data_arrays, provider.data_batch) + copy_ignore_shape!(dst[1:length(batch.idx)], src[:, batch.idx]) + if length(batch.idx) < provider.batch_size + dst[length(batch.idx)+1:provider.batch_size] = provider.data_padding + end + end + return provider.data_batch end +function get_label(provider :: ArrayDataProvider, batch :: ArrayDataBatch) + for (src, dst) in zip(provider.label_arrays, provider.label_batch) + copy_ignore_shape!(dst[1:length(batch.idx)], src[:, batch.idx]) + if length(batch.idx) < provider.batch_size + dst[length(batch.idx)+1:provider.batch_size] = provider.label_padding + end + end + return provider.label_batch +end + +#function _load_general!(batch :: ArrayDataBatch, sources :: Vector{Array{MX_float}}, +# targets :: Vector{Vector{SlicedNDArray}}, pad_val::Real) +# @assert length(sources) == length(targets) +# for (src, tgt) in zip(sources, targets) +# src_colons = [Colon() for i = 1:ndims(src)-1] +# for (slice_idx, dst) in tgt +# if slice_idx.start > length(batch.idx) +# dst[:] = pad_val +# else +# slice_idx0 = slice_idx.start:min(slice_idx.stop, length(batch.idx)) +# copy!(dst[1:length(slice_idx0)], getindex(src, src_colons..., batch.idx[slice_idx0])) +# if length(slice_idx0) < length(slice_idx) +# # need padding +# dst[length(slice_idx0)+1:length(slice_idx)] = pad_val +# end +# end +# end +# end +#end +#function load_data!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) +# _load_general!(batch, batch.provider.data_arrays, targets, batch.provider.data_padding) +#end +#function load_label!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) +# _load_general!(batch, batch.provider.label_arrays, targets, batch.provider.label_padding) +#end diff --git a/src/ndarray.jl b/src/ndarray.jl index 347346e6751a..82293d2fdbe9 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -328,6 +328,16 @@ function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) 
return dst end +function copy_ignore_shape!{T<:Real}(dst :: NDArray, src :: Array{T}) + @assert dst.writable + @assert length(dst) == length(src) + src = convert(Array{MX_float}, src) # this might involve copying + @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t), + dst.handle, pointer(src), length(src)) + return dst +end + + #=doc .. function:: copy(arr :: NDArray) diff --git a/test/unittest/io.jl b/test/unittest/io.jl index cffb00417a57..d34fb674b689 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -27,8 +27,8 @@ function test_mnist() data_targets = [[(1:batch_size, data_array)] for i = 1:1] label_targets = [[(1:batch_size, label_array)] for i = 1:1] - mx.load_data!(batch, data_targets) - mx.load_label!(batch, label_targets) + mx.load_data!(mnist_provider, batch, data_targets) + mx.load_label!(mnist_provider, batch, label_targets) true_labels = [5,0,4,1,9,2,1,3,1,4] # the first 10 labels in MNIST train got_labels = Int[copy(label_array)...] @@ -53,11 +53,11 @@ function test_arrays_impl(data::Vector, label::Vector, provider::mx.ArrayDataPro for (idx, batch) in zip(idx_all, provider) data_batch = [x[[Colon() for i=1:ndims(x)-1]..., idx:min(idx+batch_size-1,sample_count)] for x in data] data_get = [mx.empty(size(x)[1:end-1]..., batch_size) for x in data] - mx.load_data!(batch, [[(1:batch_size, x)] for x in data_get]) + mx.load_data!(provider, batch, [[(1:batch_size, x)] for x in data_get]) for (d_real, d_get) in zip(data_batch, data_get) @test reldiff(d_real, copy(d_get)[[1:n for n in size(d_real)]...]) < 1e-6 - @test mx.get_pad(batch) == batch_size - size(d_real)[end] + @test mx.count_samples(provider, batch) == size(d_real)[end] end end end @@ -97,12 +97,11 @@ function test_arrays_shuffle() data_got = similar(data) label_got = similar(label) for (idx, batch) in zip(idx_all, provider) - data_batch = [(1:batch_size, mx.empty(1,batch_size))] - label_batch = [(1:batch_size, mx.empty(batch_size))] - mx.load_data!(batch, 
typeof(data_batch)[data_batch]) - mx.load_label!(batch, typeof(label_batch)[label_batch]) - data_got[idx:min(idx+batch_size-1,sample_count)] = copy(data_batch[1][2])[1:batch_size-mx.get_pad(batch)] - label_got[idx:min(idx+batch_size-1,sample_count)] = copy(label_batch[1][2])[1:batch_size-mx.get_pad(batch)] + data_batch = mx.get(provider, batch, :data) + label_batch = mx.get(provider, batch, :index) + ns_batch = mx.count_samples(provider, batch) + data_got[idx:idx+ns_batch-1] = copy(data_batch)[1:ns_batch] + label_got[idx:idx+ns_batch-1] = copy(label_batch)[1:ns_batch] end @test label_got != label From ceaa3eb292dbc534e710698e5f0f1c3a6a98ecca Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 18:50:43 -0400 Subject: [PATCH 157/630] fix mlp example to use the updated data io API --- docs/api/io.rst | 27 ++++++++++- examples/mnist/mlp.jl | 2 +- src/io.jl | 106 ++++++++++-------------------------------- 3 files changed, 52 insertions(+), 83 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index 2e8a62dd7a08..076aa47159cf 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -203,9 +203,34 @@ and split it into mini-batches so that the model can consume the data in a unifo +.. function:: ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) + + Construct a data provider from :class:`NDArray` or Julia Arrays. + + :param data: the data, could be + + - a :class:`NDArray`, or a Julia Array. This is equivalent to ``:data => data``. + - a name-data pair, like ``:mydata => array``, where ``:mydata`` is the name of the data + and ``array`` is an :class:`NDArray` or a Julia Array. + - a list of name-data pairs. + + :param label: the same as the ``data`` parameter. When this argument is omitted, the constructed + provider will provide no labels. + :param Int batch_size: the batch size, default is 0, which means treating the whole array as a + single mini-batch. 
+ :param Bool shuffle: turn on if the data should be shuffled at every epoch. + :param Real data_padding: when the mini-batch goes beyond the dataset boundary, there might + be less samples to include than a mini-batch. This value specify a scalar to pad the + contents of all the missing data points. + :param Real label_padding: the same as ``data_padding``, except for the labels. + + + + .. class:: MXDataProvider - A data provider that wrap built-in data iterators from libmxnet. + A data provider that wrap built-in data iterators from libmxnet. See below for + a list of built-in data iterators. diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 03be2f7d336b..857b25f50049 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -43,7 +43,7 @@ probs = mx.predict(model, eval_provider) # collect all labels from eval data labels = Array[] for batch in eval_provider - push!(labels, copy(mx.get_label(batch))) + push!(labels, copy(mx.get(eval_provider, batch, :softmax_label))) end labels = cat(1, labels...) diff --git a/src/io.jl b/src/io.jl index 8fae4bcbb15b..b3ca7e000d40 100644 --- a/src/io.jl +++ b/src/io.jl @@ -227,58 +227,6 @@ function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name error("$name is not provided by this data provider") end -"""Root type for data batch - -A data batch must implement the following interface function to actually provide the data and label. - -```julia -load_data!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) -load_label!(batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) -``` - -Load data and label into targets. The targets is a list of target that the data/label should be -copied into. The order in the list is guaranteed to be the same as returned by `provide_data` and -`provide_label`. Each entry in the list is again a list of `SlicedNDArray`, corresponding the -memory buffer for each device. 
- -The `SlicedNDArray` is used in data parallelization to run different sub-batch on different devices. - -The following function should also be implemented to handle the case when the mini-batch size does not -divide the size of the whole dataset. So in the last mini-batch, the actual data copied might be fewer -than the mini-batch size. This is usually not an issue during the training as the remaining space may -contain the data and label copied during the previous mini-batch are still valid data. However, during -testing, especially when doing feature extraction, we need to be precise about the number of samples -processed. - -```julia -get_pad(batch :: AbstractDataBatch) -``` - -Return the number of *dummy samples* in this mini-batch. - -The Batch type should have a field named `provider` pointing to the underlying provider. Helper functions -`get_data` and `get_label` (mainly for debug purpose) will be able to use this. -""" - -#function _get_data_or_label(batch::AbstractDataBatch, provide_func::Function, loader::Function) -# data_shapes = provide_func(batch.provider) -# data_arrays = [mx.empty(x[2]) for x in data_shapes] -# batch_size = get_batch_size(batch.provider) -# data_arrays_fake_slice = [SlicedNDArray[(1:batch_size, x)] for x in data_arrays] -# loader(batch, data_arrays_fake_slice) -# -# if length(data_arrays) == 1 -# return data_arrays[1] -# else -# return data_arrays -# end -#end -#function get_data(batch :: AbstractDataBatch) -# _get_data_or_label(batch, provide_data, load_data!) -#end -#function get_label(batch :: AbstractDataBatch) -# _get_data_or_label(batch, provide_label, load_label!) -#end ################################################################################ #=doc @@ -301,6 +249,28 @@ type ArrayDataProvider <: AbstractDataProvider label_batch :: Vector{NDArray} end +#=doc +.. 
function:: ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) + + Construct a data provider from :class:`NDArray` or Julia Arrays. + + :param data: the data, could be + + - a :class:`NDArray`, or a Julia Array. This is equivalent to ``:data => data``. + - a name-data pair, like ``:mydata => array``, where ``:mydata`` is the name of the data + and ``array`` is an :class:`NDArray` or a Julia Array. + - a list of name-data pairs. + + :param label: the same as the ``data`` parameter. When this argument is omitted, the constructed + provider will provide no labels. + :param Int batch_size: the batch size, default is 0, which means treating the whole array as a + single mini-batch. + :param Bool shuffle: turn on if the data should be shuffled at every epoch. + :param Real data_padding: when the mini-batch goes beyond the dataset boundary, there might + be less samples to include than a mini-batch. This value specify a scalar to pad the + contents of all the missing data points. + :param Real label_padding: the same as ``data_padding``, except for the labels. +=# # Julia's type system is sometimes very frustrating. 
You cannot specify a function # with argument Vector{Pair} to expect to be matched when calling with the parameter # [:foo => zeros(2,3), :bar => zeros(3)] because the type inference gives very specific @@ -448,39 +418,13 @@ function get_label(provider :: ArrayDataProvider, batch :: ArrayDataBatch) return provider.label_batch end -#function _load_general!(batch :: ArrayDataBatch, sources :: Vector{Array{MX_float}}, -# targets :: Vector{Vector{SlicedNDArray}}, pad_val::Real) -# @assert length(sources) == length(targets) -# for (src, tgt) in zip(sources, targets) -# src_colons = [Colon() for i = 1:ndims(src)-1] -# for (slice_idx, dst) in tgt -# if slice_idx.start > length(batch.idx) -# dst[:] = pad_val -# else -# slice_idx0 = slice_idx.start:min(slice_idx.stop, length(batch.idx)) -# copy!(dst[1:length(slice_idx0)], getindex(src, src_colons..., batch.idx[slice_idx0])) -# if length(slice_idx0) < length(slice_idx) -# # need padding -# dst[length(slice_idx0)+1:length(slice_idx)] = pad_val -# end -# end -# end -# end -#end -#function load_data!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) -# _load_general!(batch, batch.provider.data_arrays, targets, batch.provider.data_padding) -#end -#function load_label!(batch :: ArrayDataBatch, targets :: Vector{Vector{SlicedNDArray}}) -# _load_general!(batch, batch.provider.label_arrays, targets, batch.provider.label_padding) -#end - - ################################################################################ #=doc .. class:: MXDataProvider - A data provider that wrap built-in data iterators from libmxnet. + A data provider that wrap built-in data iterators from libmxnet. See below for + a list of built-in data iterators. 
=# type MXDataProvider <: AbstractDataProvider handle :: MX_DataIterHandle @@ -558,7 +502,7 @@ function get_label(provider :: MXDataProvider, batch :: MXDataBatch) end function count_samples(provider :: MXDataProvider, batch :: MXDataBatch) ref_pad = Ref{Cint}(0) - @mxcall(:MXDataIterGetPadNum, (MX_handle, Ref{Cint}), batch.provider.handle, ref_pad) + @mxcall(:MXDataIterGetPadNum, (MX_handle, Ref{Cint}), provider.handle, ref_pad) return provider.batch_size - Int(ref_pad[]) end From 993be59c8b1a1066daf21a3dbc3c92f8a57ab5cc Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 18:55:39 -0400 Subject: [PATCH 158/630] simplify model a bit with data IO api --- src/io.jl | 11 +++++++++++ src/model.jl | 7 +++---- 2 files changed, 14 insertions(+), 4 deletions(-) diff --git a/src/io.jl b/src/io.jl index b3ca7e000d40..ed63a2dbedfe 100644 --- a/src/io.jl +++ b/src/io.jl @@ -212,6 +212,17 @@ function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatc _load_general!(provider, batch, targets, get_label) end +function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{NDArray}) + for (src, dst) in zip(get_data(provider, batch), targets) + copy!(dst, src) + end +end +function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{NDArray}) + for (src, dst) in zip(get_label(provider, batch), targets) + copy!(dst, src) + end +end + import Base.get function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name :: Base.Symbol) for (idx, (k, s)) in enumerate(provide_data(provider)) diff --git a/src/model.jl b/src/model.jl index d49aca6c040a..55ba733b5d13 100644 --- a/src/model.jl +++ b/src/model.jl @@ -183,7 +183,7 @@ function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::B _setup_predictor(self, overwrite; data_shapes...) 
batch_size = get_batch_size(data) - data_arrays = [SlicedNDArray[(1:batch_size, self.pred_exec.arg_dict[name])] for name in data_names] + data_arrays = [self.pred_exec.arg_dict[name] for name in data_names] output_list = [Array{MX_float}[] for i=1:length(self.pred_exec.outputs)] for batch in data load_data!(data, batch, data_arrays) @@ -386,7 +386,6 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra cpu_dev = Context(CPU) cpu_output_arrays = [empty(shape, cpu_dev) for shape in output_shapes] cpu_label_arrays = [empty(shape, cpu_dev) for (name,shape) in provide_label(data)] - cpu_label_arrays_full_slice = [SlicedNDArray[(1:batch_size, x)] for x in cpu_label_arrays] # invoke callbacks on epoch 0 _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) @@ -453,7 +452,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) # update evaluation metric on training set - load_label!(data, batch, cpu_label_arrays_full_slice) + load_label!(data, batch, cpu_label_arrays) update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) end # end of one epoch @@ -485,7 +484,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra copy!(slice(cpu_out, islice), dev_out) end end - load_label!(opts.eval_data, batch, cpu_label_arrays_full_slice) + load_label!(opts.eval_data, batch, cpu_label_arrays) update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) end From f30aedc7f174a9aa4d3b4ff13e9c527b4a26f33f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 29 Oct 2015 19:43:59 -0400 Subject: [PATCH 159/630] part of the executor API doc --- docs/api/context.rst | 32 ++++++++++++++++++++++++++++ docs/api/executor.rst | 32 ++++++++++++++++++++++++++++ docs/api/initializer.rst | 46 ++++++++++++++++++++++++++++++++++++++-- docs/api/io.rst | 17 ++++++++++++--- docs/api/model.rst | 4 ++-- 
docs/build-api.jl | 4 ++++ docs/index.rst | 2 ++ src/context.jl | 25 ++++++++++++++++++++++ src/executor.jl | 27 +++++++++++++++++++++++ src/initializer.jl | 38 +++++++++++++++++++++++++++++++-- src/io.jl | 14 +++++++++--- src/model.jl | 4 ++-- 12 files changed, 231 insertions(+), 14 deletions(-) create mode 100644 docs/api/context.rst create mode 100644 docs/api/executor.rst diff --git a/docs/api/context.rst b/docs/api/context.rst new file mode 100644 index 000000000000..5230b892c8e5 --- /dev/null +++ b/docs/api/context.rst @@ -0,0 +1,32 @@ + +Context +======= + + + + +.. class:: Context + + A context describes the device type and id on which computation should be carried on. + + + + +.. function:: cpu(dev_id=0) + + :param Int dev_id: the CPU id. + + Get a CPU context with a specific id. ``cpu()`` is usually the default context for many + operations when no context is specified. + + + + +.. function:: gpu(dev_id=0) + + :param Int dev_id: the GPU device id. + + Get a GPU context with a specific id. The K GPUs on a node is typically numbered as 0,...,K-1. + + + diff --git a/docs/api/executor.rst b/docs/api/executor.rst new file mode 100644 index 000000000000..8887d4ce1d24 --- /dev/null +++ b/docs/api/executor.rst @@ -0,0 +1,32 @@ + +Executor +======== + + + + +.. class:: Executor + + An executor is a realization of a symbolic architecture defined by a :class:`Symbol`. + The actual forward and backward computation specified by the network architecture can + be carried out with an executor. + + + + +.. function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) + + Create an :class:`Executor` by binding a :class:`Symbol` to concrete :class:`NDArray`. + + :param Symbol sym: the network architecture describing the computation graph. + :param Context ctx: the context on which the computation should run. + :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. 
Concrete + arrays for all the inputs in the network architecture. The inputs typically include + network parameters (weights, bias, filters, etc.), data and labels. See :func:`list_arguments` + and :func:`infer_shape`. + :param args_grad: TODO + :param aux_states: + :param grad_req: + + + diff --git a/docs/api/initializer.rst b/docs/api/initializer.rst index 63e1a231b187..3f4126721542 100644 --- a/docs/api/initializer.rst +++ b/docs/api/initializer.rst @@ -1,6 +1,8 @@ -Built-in Initializers -===================== +Initializers +============ +Interface +--------- @@ -9,6 +11,24 @@ Built-in Initializers The abstract base class for all initializers. +To define a new initializer, it is +enough to derive a new type, and implement one or more of the following methods: + +.. function:: _init_weight(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + +Or, if full behavior customization is needed, override the following function + +.. function:: call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + + + + +Built-in initializers +--------------------- + @@ -19,9 +39,31 @@ Built-in Initializers +.. function:: UniformInitializer(scale=0.07) + + Construct a :class:`UniformInitializer` with the specified scale. + + + + .. class:: NormalInitializer Initialize weights according to a univariate Gaussian distribution. + +.. function:: NormalInitializer(; mu=0, sigma=0.01) + + Construct a :class:`NormalInitializer` with mean ``mu`` and variance ``sigma``. + + + + +.. class:: XaiverInitializer + + The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding + the difficulty of training deep feedforward neural networks*. 
+ + + diff --git a/docs/api/io.rst b/docs/api/io.rst index 076aa47159cf..b601db39c7ec 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -1,6 +1,8 @@ Data Providers ============== +Interface +--------- Data providers are wrappers that load external data, be it images, text, or general tensors, and split it into mini-batches so that the model can consume the data in a uniformed way. @@ -196,6 +198,12 @@ and split it into mini-batches so that the model can consume the data in a unifo +Built-in data providers +----------------------- + + + + .. class:: ArrayDataProvider A convenient tool to iterate :class:`NDArray` or Julia ``Array``. @@ -227,6 +235,12 @@ and split it into mini-batches so that the model can consume the data in a unifo +libmxnet data providers +----------------------- + + + + .. class:: MXDataProvider A data provider that wrap built-in data iterators from libmxnet. See below for @@ -235,9 +249,6 @@ and split it into mini-batches so that the model can consume the data in a unifo -Built-in data providers in libmxnet ------------------------------------ - .. function:: ImageRecordIter(...) Can also be called with the alias ``ImageRecordProvider``. diff --git a/docs/api/model.rst b/docs/api/model.rst index 7593e6e68f55..ab330db9bcfa 100644 --- a/docs/api/model.rst +++ b/docs/api/model.rst @@ -1,6 +1,6 @@ -Built-in Models and Interface -============================= +Models +====== The model API provides convenient high-level interface to do training and predicting on a network described using the symbolic API. 
diff --git a/docs/build-api.jl b/docs/build-api.jl index 0aed51a9a022..b70c480c9d79 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -74,12 +74,16 @@ end ################################################################################# # Build Documents ################################################################################# +extract_doc("context.rst", "context.jl") + extract_doc("ndarray.rst", "ndarray.jl") embed_mxnet_api("ndarray.rst", "ndarray", mx._import_ndarray_functions) extract_doc("symbol.rst", "symbol.jl") embed_mxnet_api("symbol.rst", "symbol", mx._import_atomic_symbol_creators) +extract_doc("executor.rst", "executor.jl") + extract_doc("initializer.rst", "initializer.jl") extract_doc("callback.rst", "callback.jl") extract_doc("model.rst", "model.jl") diff --git a/docs/index.rst b/docs/index.rst index eda80ac1c18d..7520047db11a 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -31,6 +31,7 @@ For more details, see documentation below. Please also checkout the `examples :maxdepth: 1 :caption: API Documentation + api/context api/model api/initializer api/optimizer @@ -38,6 +39,7 @@ For more details, see documentation below. Please also checkout the `examples api/io api/ndarray api/symbol + api/executor Indices and tables ================== diff --git a/src/context.jl b/src/context.jl index 5146d4afcb64..1e96c305fb04 100644 --- a/src/context.jl +++ b/src/context.jl @@ -1,5 +1,14 @@ +#=doc +Context +======= +=# @enum CONTEXT_TYPE CPU=1 GPU=2 CPU_PINNED=3 +#=doc +.. class:: Context + + A context describes the device type and id on which computation should be carried on. +=# immutable Context device_type :: CONTEXT_TYPE device_id :: Int @@ -11,9 +20,25 @@ function Base.show(io :: IO, ctx :: Context) print(io, "$(ctx.device_type)$(ctx.device_id)") end +#=doc +.. function:: cpu(dev_id=0) + + :param Int dev_id: the CPU id. + + Get a CPU context with a specific id. 
``cpu()`` is usually the default context for many + operations when no context is specified. +=# function cpu(dev_id::Int=0) return Context(CPU, dev_id) end + +#=doc +.. function:: gpu(dev_id=0) + + :param Int dev_id: the GPU device id. + + Get a GPU context with a specific id. The K GPUs on a node are typically numbered as 0,...,K-1. +=# function gpu(dev_id::Int=0) return Context(GPU, dev_id) end diff --git a/src/executor.jl b/src/executor.jl index 4d57c1da7b7c..4485bc6dce9a 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -1,3 +1,15 @@ +#=doc +Executor +======== +=# + +#=doc +.. class:: Executor + + An executor is a realization of a symbolic architecture defined by a :class:`Symbol`. + The actual forward and backward computation specified by the network architecture can + be carried out with an executor. +=# type Executor handle :: MX_ExecutorHandle symbol :: Symbol @@ -58,6 +70,21 @@ function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDA return (args_hdr, args_vec) end +#=doc +.. function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) + + Create an :class:`Executor` by binding a :class:`Symbol` to concrete :class:`NDArray`. + + :param Symbol sym: the network architecture describing the computation graph. + :param Context ctx: the context on which the computation should run. + :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete + arrays for all the inputs in the network architecture. The inputs typically include + network parameters (weights, bias, filters, etc.), data and labels. See :func:`list_arguments` + and :func:`infer_shape`.
+ :param args_grad: TODO + :param aux_states: + :param grad_req: +=# @enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), diff --git a/src/initializer.jl b/src/initializer.jl index 3f830860f586..8f78bfba9367 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -1,12 +1,26 @@ #=doc -Built-in Initializers -===================== +Initializers +============ +Interface +--------- =# #=doc .. class:: AbstractInitializer The abstract base class for all initializers. + +To define a new initializer, it is +enough to derive a new type, and implement one or more of the following methods: + +.. function:: _init_weight(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + +Or, if full behavior customization is needed, override the following function + +.. function:: call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) =# abstract AbstractInitializer @@ -42,6 +56,10 @@ function _init_zero(self :: AbstractInitializer, name :: Base.Symbol, array :: N array[:] = 0 end +#=doc +Built-in initializers +--------------------- +=# #=doc .. class:: UniformInitializer @@ -50,6 +68,11 @@ end immutable UniformInitializer <: AbstractInitializer scale :: AbstractFloat end +#=doc +.. function:: UniformInitializer(scale=0.07) + + Construct a :class:`UniformInitializer` with the specified scale.
+=# UniformInitializer() = UniformInitializer(0.07) function _init_weight(self :: UniformInitializer, name :: Base.Symbol, array :: NDArray) @@ -65,12 +88,23 @@ immutable NormalInitializer <: AbstractInitializer μ :: AbstractFloat σ :: AbstractFloat end +#=doc +.. function:: NormalInitializer(; mu=0, sigma=0.01) + + Construct a :class:`NormalInitializer` with mean ``mu`` and variance ``sigma``. +=# NormalInitializer(; mu=0, sigma=0.01) = NormalInitializer(mu, sigma) function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) randn!(self.μ, self.σ, array) end +#=doc +.. class:: XaiverInitializer + + The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding + the difficulty of training deep feedforward neural networks*. +=# immutable XaiverInitializer <: AbstractInitializer end diff --git a/src/io.jl b/src/io.jl index ed63a2dbedfe..6bbb9a5cf6d5 100644 --- a/src/io.jl +++ b/src/io.jl @@ -1,6 +1,8 @@ #=doc Data Providers ============== +Interface +--------- Data providers are wrappers that load external data, be it images, text, or general tensors, and split it into mini-batches so that the model can consume the data in a uniformed way. @@ -238,6 +240,10 @@ function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name error("$name is not provided by this data provider") end +#=doc +Built-in data providers +----------------------- +=# ################################################################################ #=doc @@ -430,6 +436,11 @@ function get_label(provider :: ArrayDataProvider, batch :: ArrayDataBatch) end +#=doc +libmxnet data providers +----------------------- +=# + ################################################################################ #=doc ..
class:: MXDataProvider @@ -518,9 +529,6 @@ function count_samples(provider :: MXDataProvider, batch :: MXDataBatch) end #=doc -Built-in data providers in libmxnet ------------------------------------ - **autogen:EMBED:io:EMBED:autogen** =# function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) diff --git a/src/model.jl b/src/model.jl index 55ba733b5d13..b978ec0c6f49 100644 --- a/src/model.jl +++ b/src/model.jl @@ -1,6 +1,6 @@ #=doc -Built-in Models and Interface -============================= +Models +====== The model API provides convenient high-level interface to do training and predicting on a network described using the symbolic API. From 388e91dc6381a3bdd549372c2779405c6372b7c0 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 30 Oct 2015 05:08:10 -0400 Subject: [PATCH 160/630] fix mnist doc links --- docs/tutorial/mnist.rst | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/docs/tutorial/mnist.rst b/docs/tutorial/mnist.rst index 2e5d087a5242..5fe21cde181e 100644 --- a/docs/tutorial/mnist.rst +++ b/docs/tutorial/mnist.rst @@ -71,7 +71,8 @@ the code to construct the data provider into ``mnist-data.jl`` so that it could include("mnist-data.jl") train_provider, eval_provider = get_mnist_providers(batch_size) -If you need to write your own data providers for customized data format, please refer to **TODO**: pointer to data provider API. +If you need to write your own data providers for customized data format, please +refer to :class:`AbstractDataProvider`. Given the architecture and data, we can instantiate an *model* to do the actual training. ``mx.FeedForward`` is the built-in model that is suitable for most feed-forward architectures. When constructing the model, we also specify the *context* on which the computation should be carried out. Because this is a really tiny MLP, we will just run on a single CPU device. 
@@ -249,4 +250,4 @@ Alternatively, when the dataset is huge, one can provide a callback to ``mx.predict``, then the callback function will be invoked with the outputs of each mini-batch. The callback could, for example, write the data to disk for future inspection. In this case, no value is returned from ``mx.predict``. See -also **TODO** provide link to prediction API. +also :func:`predict`. From 319c5f351ecdd6fe3583fb4d4237c24cdbcd25bb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 2 Nov 2015 09:49:29 -0500 Subject: [PATCH 161/630] rename Softmax -> SoftmaxOutput (mxnet/mxnet#434) --- examples/cifar10/cifar10.jl | 2 +- examples/mnist/lenet.jl | 2 +- examples/mnist/mlp.jl | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index c46e2b3bf15c..37cfacd2cec0 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -51,7 +51,7 @@ in5b = simple_factory(in5a, 176, 160) pool = mx.Pooling(data=in5b, pool_type=:avg, kernel=(7,7), name=:global_pool) flatten = mx.Flatten(data=pool, name=:flatten1) fc = mx.FullyConnected(data=flatten, num_hidden=10, name=:fc1) -softmax = mx.Softmax(data=fc, name=:loss) +softmax = mx.SoftmaxOutput(data=fc, name=:loss) #-------------------------------------------------------------------------------- diff --git a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl index 804fc1ea5312..ca48e6693213 100644 --- a/examples/mnist/lenet.jl +++ b/examples/mnist/lenet.jl @@ -25,7 +25,7 @@ fc1 = @mx.chain mx.Flatten(data=conv2) => fc2 = mx.FullyConnected(data=fc1, num_hidden=10) # softmax loss -lenet = mx.Softmax(data=fc2, name=:softmax) +lenet = mx.SoftmaxOutput(data=fc2, name=:softmax) #-------------------------------------------------------------------------------- diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 857b25f50049..b0703c56e5d1 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -20,7 +20,7 @@ mlp = @mx.chain 
mx.Variable(:data) => mx.FullyConnected(name=:fc2, num_hidden=64) => mx.Activation(name=:relu2, act_type=:relu) => mx.FullyConnected(name=:fc3, num_hidden=10) => - mx.Softmax(name=:softmax) + mx.SoftmaxOutput(name=:softmax) # data provider batch_size = 100 From 63890942a8af45ef9772060dbdf246a9740dd6ac Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 2 Nov 2015 09:54:12 -0500 Subject: [PATCH 162/630] update doc Softmax -> SoftmaxOutput (dmlc/mxnet#434) --- README.md | 2 +- docs/api/ndarray.rst | 39 +++++++++++- docs/api/symbol.rst | 129 +++++++++++++++++++++++++++++++++++++++- docs/tutorial/mnist.rst | 6 +- examples/mnist/mlp.jl | 2 +- 5 files changed, 167 insertions(+), 11 deletions(-) diff --git a/README.md b/README.md index 2c28bc58f15e..ea7b8577de3e 100644 --- a/README.md +++ b/README.md @@ -20,7 +20,7 @@ mlp = @mx.chain mx.Variable(:data) => mx.FullyConnected(name=:fc2, num_hidden=64) => mx.Activation(name=:relu2, act_type=:relu) => mx.FullyConnected(name=:fc3, num_hidden=10) => - mx.Softmax(name=:softmax) + mx.SoftmaxOutput(name=:softmax) # data provider batch_size = 100 diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index 8ac5e9bda8f0..05a3dccba7dc 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -364,9 +364,9 @@ object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the out Public APIs ^^^^^^^^^^^ -.. function:: choose_element(...) +.. function:: choose_element_0index(...) - Choose one element from each line(row for python, column for R/Julia) in lhs according to index indicated by rhs + Choose one element from each line(row for python, column for R/Julia) in lhs according to index indicated by rhs. This function assume rhs uses 0-based index. :param lhs: Left operand to the function. :type lhs: NDArray @@ -413,9 +413,42 @@ Public APIs +.. function:: exp(...) + + Take exp of the src + + :param src: Source input to the function + :type src: NDArray + + + + + +.. function:: log(...) 
+ + Take log of the src + + :param src: Source input to the function + :type src: NDArray + + + + + +.. function:: norm(...) + + Take L2 norm of the src.The result will be ndarray of shape (1,) on the same device. + + :param src: Source input to the function + :type src: NDArray + + + + + .. function:: sqrt(...) - Take square root of the src + Take sqrt of the src :param src: Source input to the function :type src: NDArray diff --git a/docs/api/symbol.rst b/docs/api/symbol.rst index 2c7df712c2f8..e01ecb35980d 100644 --- a/docs/api/symbol.rst +++ b/docs/api/symbol.rst @@ -143,7 +143,7 @@ Public APIs :type num_filter: int (non-negative), required - :param num_group: number of groups partition + :param num_group: Number of groups partition. This option is not supported by CuDNN, you can use SliceChannel to num_group,apply convolution and concat instead to achieve the same need. :type num_group: int (non-negative), optional, default=1 @@ -162,6 +162,57 @@ Public APIs +.. function:: Deconvolution(...) + + Apply deconvolution to input then add a bias. + + :param data: Input data to the DeconvolutionOp. + :type data: Symbol + + + :param weight: Weight matrix. + :type weight: Symbol + + + :param bias: Bias parameter. + :type bias: Symbol + + + :param kernel: deconvolution kernel size: (y, x) + :type kernel: Shape(tuple), required + + + :param stride: deconvolution stride: (y, x) + :type stride: Shape(tuple), optional, default=(1, 1) + + + :param pad: pad for deconvolution: (y, x) + :type pad: Shape(tuple), optional, default=(0, 0) + + + :param num_filter: deconvolution filter(channel) number + :type num_filter: int (non-negative), required + + + :param num_group: number of groups partition + :type num_group: int (non-negative), optional, default=1 + + + :param workspace: Tmp workspace for deconvolution (MB) + :type workspace: long (non-negative), optional, default=512 + + + :param no_bias: Whether to disable bias parameter. 
+ :type no_bias: boolean, optional, default=True + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`Symbol`. + + + + + .. function:: Dropout(...) Apply dropout to input @@ -412,7 +463,7 @@ Public APIs .. function:: Softmax(...) - Perform a softmax transformation on input. + DEPRECATED: Perform a softmax transformation on input. Please use SoftmaxOutput :param data: Input data to softmax. :type data: Symbol @@ -433,9 +484,62 @@ Public APIs +.. function:: SoftmaxOutput(...) + + Perform a softmax transformation on input, backprop with logloss. + + :param data: Input data to softmax. + :type data: Symbol + + + :param grad_scale: Scale the gradient by a float factor + :type grad_scale: float, optional, default=1 + + + :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes + :type multi_output: boolean, optional, default=False + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`Symbol`. + + + + + +.. function:: exp(...) + + Take exp of the src + + :param src: Source symbolic input to the function + :type src: Symbol + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`Symbol`. + + + + + +.. function:: log(...) + + Take log of the src + + :param src: Source symbolic input to the function + :type src: Symbol + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`Symbol`. + + + + + .. function:: sqrt(...) - Take square root of the src + Take sqrt of the src :param src: Source symbolic input to the function :type src: Symbol @@ -505,6 +609,25 @@ Internal APIs +.. function:: _Native(...) + + Stub for implementing an operator implemented in native frontend language. 
+ + :param info: + :type info: , required + + + :param need_top_grad: Whether this layer needs out grad for backward. Should be false for loss layers. + :type need_top_grad: boolean, optional, default=True + + :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`Symbol`. + + + + + .. function:: _Plus(...) Perform an elementwise plus. diff --git a/docs/tutorial/mnist.rst b/docs/tutorial/mnist.rst index 5fe21cde181e..fc2e548dd1c2 100644 --- a/docs/tutorial/mnist.rst +++ b/docs/tutorial/mnist.rst @@ -41,11 +41,11 @@ Note each composition we take the previous symbol as the `data` argument, formin Input --> 128 units (ReLU) --> 64 units (ReLU) --> 10 units where the last 10 units correspond to the 10 output classes (digits 0,...,9). We -then add a final ``Softmax`` operation to turn the 10-dimensional prediction to proper probability values for the 10 classes: +then add a final :class:`SoftmaxOutput` operation to turn the 10-dimensional prediction to proper probability values for the 10 classes: .. code-block:: julia - mlp = mx.Softmax(data = fc3, name=:softmax) + mlp = mx.SoftmaxOutput(data = fc3, name=:softmax) As we can see, the MLP is just a chain of layers. For this case, we can also use the ``mx.chain`` macro. The same architecture above can be defined as @@ -58,7 +58,7 @@ the ``mx.chain`` macro. The same architecture above can be defined as mx.FullyConnected(name=:fc2, num_hidden=64) => mx.Activation(name=:relu2, act_type=:relu) => mx.FullyConnected(name=:fc3, num_hidden=10) => - mx.Softmax(name=:softmax) + mx.SoftmaxOutput(name=:softmax) After defining the architecture, we are ready to load the MNIST data. 
MXNet.jl provide built-in data providers for the MNIST dataset, which could automatically diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index b0703c56e5d1..05d008d5255c 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -11,7 +11,7 @@ using MXNet # fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) # act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) # fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) -# mlp = mx.Softmax(data = fc3, name=:softmax) +# mlp = mx.SoftmaxOutput(data = fc3, name=:softmax) #-- Option 2: using the mx.chain macro mlp = @mx.chain mx.Variable(:data) => From 922fc8516f503da74591c6b97f8bee81ff5fdcc0 Mon Sep 17 00:00:00 2001 From: iamed2 Date: Mon, 2 Nov 2015 10:21:09 -0600 Subject: [PATCH 163/630] Reenable 0.4 testing. --- .travis.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.travis.yml b/.travis.yml index cae2bfbb7a22..90fd90c7de74 100644 --- a/.travis.yml +++ b/.travis.yml @@ -5,7 +5,7 @@ os: - linux - osx julia: - #- release + - 0.4 - nightly # dependent apt packages From 4acbce9f2f95452829566dd35e90abe5aff7a33f Mon Sep 17 00:00:00 2001 From: Eric Davies Date: Mon, 2 Nov 2015 10:41:37 -0600 Subject: [PATCH 164/630] Add coverage. 
--- .travis.yml | 3 +++ README.md | 1 + test/travis/run_coverage.sh | 1 + 3 files changed, 5 insertions(+) create mode 100644 test/travis/run_coverage.sh diff --git a/.travis.yml b/.travis.yml index 90fd90c7de74..ed0d03d4906c 100644 --- a/.travis.yml +++ b/.travis.yml @@ -34,3 +34,6 @@ notifications: script: - source $TRAVIS/run_test.sh + +after_success: + - source $TRAVIS/run_coverage.sh diff --git a/README.md b/README.md index ea7b8577de3e..10862ff8a6a6 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,7 @@ # MXNet [![Build Status](https://travis-ci.org/dmlc/MXNet.jl.svg?branch=master)](https://travis-ci.org/dmlc/MXNet.jl) +[![codecov.io](https://codecov.io/github/dmlc/MXNet.jl/coverage.svg?branch=master)](https://codecov.io/github/dmlc/MXNet.jl?branch=master) [![Documentation Status](https://readthedocs.org/projects/mxnetjl/badge/?version=latest)](http://mxnetjl.readthedocs.org/en/latest/?badge=latest) [![License](http://dmlc.github.io/img/apache2.svg)](LICENSE.md) diff --git a/test/travis/run_coverage.sh b/test/travis/run_coverage.sh new file mode 100644 index 000000000000..73816fac7b98 --- /dev/null +++ b/test/travis/run_coverage.sh @@ -0,0 +1 @@ +julia -e 'cd(Pkg.dir("MXNet")); Pkg.add("Coverage"); using Coverage; Codecov.submit(process_folder())' \ No newline at end of file From c1d663df4b339838558400a1eabfea81ec6b5d3e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 2 Nov 2015 22:27:40 -0500 Subject: [PATCH 165/630] run mlp.jl on travis CI --- test/runtests.jl | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/test/runtests.jl b/test/runtests.jl index 1d5f49b4d1f1..71d7f8a79fc4 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -14,3 +14,7 @@ end include("common.jl") test_dir("unittest") +# run the basic MNIST mlp example +if haskey(ENV, "TRAVIS") && ENV["TRAVIS"] == "true" + include(joinpath(Pkg.dir("MXNet"), "examples", "mnist", "mlp.jl")) +end From b1e882b46fd43b45c0353d0ae6825da017c05beb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: 
Mon, 2 Nov 2015 22:29:06 -0500 Subject: [PATCH 166/630] fix env variable for detecting Travis CI --- test/runtests.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/test/runtests.jl b/test/runtests.jl index 71d7f8a79fc4..af60ab9f9185 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -15,6 +15,6 @@ include("common.jl") test_dir("unittest") # run the basic MNIST mlp example -if haskey(ENV, "TRAVIS") && ENV["TRAVIS"] == "true" +if haskey(ENV, "CONTINUOUS_INTEGRATION") include(joinpath(Pkg.dir("MXNet"), "examples", "mnist", "mlp.jl")) end From f82351028ccd7164f23f264c08e3128f93074077 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 2 Nov 2015 22:35:45 -0500 Subject: [PATCH 167/630] only run 1 epoch for MNIST on travis CI --- examples/mnist/mlp.jl | 3 ++- test/runtests.jl | 1 + 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 05d008d5255c..fd1bbf99e38b 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -34,7 +34,8 @@ model = mx.FeedForward(mlp, context=mx.cpu()) optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +mx.fit(model, optimizer, train_provider, eval_data=eval_provider, + n_epoch = isdefined(:n_epoch) ? 
n_epoch : 20) #-------------------------------------------------------------------------------- # Optional, demonstration of the predict API diff --git a/test/runtests.jl b/test/runtests.jl index af60ab9f9185..3d796bd7a5e2 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -16,5 +16,6 @@ test_dir("unittest") # run the basic MNIST mlp example if haskey(ENV, "CONTINUOUS_INTEGRATION") + n_epoch = 1 include(joinpath(Pkg.dir("MXNet"), "examples", "mnist", "mlp.jl")) end From 23378f1d23f80e9b9950707b37c445a43927f2da Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 2 Nov 2015 22:41:39 -0500 Subject: [PATCH 168/630] fix error due to API changes of subarray in Julia nightly --- src/metric.jl | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 59acb529a9a7..c88239ab8cc8 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -14,9 +14,8 @@ function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDA n_sample = size(pred)[end] metric.n_sample += n_sample for i = 1:n_sample - klass = indmax(sub(pred,:,i)) + klass = indmax(pred[:,i]) metric.acc_sum += (klass-1) == label[i] - #println("$(sub(pred,:,i)) $(klass-1) <=> $(label[i])") end end From d26c36b8b0b1d254cddfadf4c4c1e11606d23360 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 2 Nov 2015 23:10:27 -0500 Subject: [PATCH 169/630] a specific mlp script for Travis CI regression test. --- examples/mnist/mlp-test.jl | 75 ++++++++++++++++++++++++++++++++++++++ examples/mnist/mlp.jl | 3 +- test/runtests.jl | 3 +- 3 files changed, 77 insertions(+), 4 deletions(-) create mode 100644 examples/mnist/mlp-test.jl diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl new file mode 100644 index 000000000000..ad7446a98324 --- /dev/null +++ b/examples/mnist/mlp-test.jl @@ -0,0 +1,75 @@ +# This file is primarily to be included from runtest.jl. We tried to cover various +# features of MXNet.jl in this example in order to detect regression errors. 
+ +using MXNet + + +function get_mnist_mlp() + mlp = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=128) => + mx.Activation(name=:relu1, act_type=:relu) => + mx.FullyConnected(name=:fc2, num_hidden=64) => + mx.Activation(name=:relu2, act_type=:relu) => + mx.FullyConnected(name=:fc3, num_hidden=10) => + mx.SoftmaxOutput(name=:softmax) + return mlp +end + +function get_mnist_data(batch_size=100) + include("mnist-data.jl") + return get_mnist_providers(batch_size) +end + +function mnist_fit_and_predict(optimizer, initializer, n_epoch) + mlp = get_mnist_mlp() + train_provider, eval_provider = get_mnist_data() + + # setup model + model = mx.FeedForward(mlp, context=mx.cpu()) + + # fit parameters + cp_prefix = "mnist-test-cp" + mx.fit(model, optimizer, train_provider, eval_data=eval_provider, n_epoch=n_epoch, + initializer=initializer, callbacks=[mx.speedometer(), mx.do_checkpoint(cp_prefix, save_epoch_0=true)]) + + # make sure the checkpoints are saved + @test isfile("$cp_prefix-symbol.json") + for i_epoch = 0:n_epoch + @test isfile(mx.format("{1}-{2:04d}.params", cp_prefix, i_epoch)) + end + mlp_load = mx.load("$cp_prefix-symbol.json", mx.Symbol) + @test mx.to_json(mlp_load) == mx.to_json(mlp) + mlp_load = mx.from_json(readall("$cp_prefix-symbol.json"), mx.Symbol) + @test mx.to_json(mlp_load) == mx.to_json(mlp) + + #-------------------------------------------------------------------------------- + # the predict API + probs = mx.predict(model, eval_provider) + + # collect all labels from eval data + labels = Array[] + for batch in eval_provider + push!(labels, copy(mx.get(eval_provider, batch, :softmax_label))) + end + labels = cat(1, labels...) 
+ + # Now we use compute the accuracy + correct = 0 + for i = 1:length(labels) + # labels are 0...9 + if indmax(probs[:,i]) == labels[i]+1 + correct += 1 + end + end + accuracy = 100correct/length(labels) + println(mx.format("Accuracy on eval set: {1:.2f}%", accuracy)) + + return accuracy +end + +function test_mnist_mlp() + @test mnist_fit_and_predict(mx.SGD(lr=0.1, momentum=0.9), mx.UniformInitializer(0.01), 2) > 90 + @test mnist_fit_and_predict(mx.ADAM(), mx.NormalInitializer(), 2) > 90 +end + +test_mnist_mlp() diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index fd1bbf99e38b..f6fbbd5c0870 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -34,8 +34,7 @@ model = mx.FeedForward(mlp, context=mx.cpu()) optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) # fit parameters -mx.fit(model, optimizer, train_provider, eval_data=eval_provider, - n_epoch = isdefined(:n_epoch) ? n_epoch : 20) +mx.fit(model, optimizer, train_provider, eval_data=eval_provider, n_epoch=20) #-------------------------------------------------------------------------------- # Optional, demonstration of the predict API diff --git a/test/runtests.jl b/test/runtests.jl index 3d796bd7a5e2..53c8cbc3bb74 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -16,6 +16,5 @@ test_dir("unittest") # run the basic MNIST mlp example if haskey(ENV, "CONTINUOUS_INTEGRATION") - n_epoch = 1 - include(joinpath(Pkg.dir("MXNet"), "examples", "mnist", "mlp.jl")) + include(joinpath(Pkg.dir("MXNet"), "examples", "mnist", "mlp-test.jl")) end From 1786bdb742f7243fe44c8487c361cdd73b56776f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 2 Nov 2015 23:12:56 -0500 Subject: [PATCH 170/630] wrap mnist test into a module --- examples/mnist/mlp-test.jl | 5 ++++- test/unittest/kvstore.jl | 10 ++++++++++ 2 files changed, 14 insertions(+), 1 deletion(-) diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index ad7446a98324..71ed5d7747c9 100644 --- 
a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -1,8 +1,9 @@ # This file is primarily to be included from runtest.jl. We tried to cover various # features of MXNet.jl in this example in order to detect regression errors. -using MXNet +module MNISTTest +using MXNet function get_mnist_mlp() mlp = @mx.chain mx.Variable(:data) => @@ -73,3 +74,5 @@ function test_mnist_mlp() end test_mnist_mlp() + +end # module MNISTTest diff --git a/test/unittest/kvstore.jl b/test/unittest/kvstore.jl index bca77a556922..2770edf7a259 100644 --- a/test/unittest/kvstore.jl +++ b/test/unittest/kvstore.jl @@ -16,6 +16,15 @@ function init_kv() return kv end +function test_kv_basic() + info("KVStore::basic") + + kv = init_kv() + @test mx.get_type(kv) == :local + @test mx.get_rank(kv) == 0 + @test mx.get_num_workers(kv) == 1 +end + function test_single_kv_pair() info("KVStore::single") @@ -53,6 +62,7 @@ function test_aggregator() end end +test_kv_basic() test_single_kv_pair() test_aggregator() From 3bf43649c8ede0d7f6329a37e8ec6f66dcbfeee7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 2 Nov 2015 23:33:04 -0500 Subject: [PATCH 171/630] fix travis test error --- examples/mnist/mlp-test.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index 71ed5d7747c9..04d917c6543d 100644 --- a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -2,8 +2,8 @@ # features of MXNet.jl in this example in order to detect regression errors. 
module MNISTTest - using MXNet +using Base.Test function get_mnist_mlp() mlp = @mx.chain mx.Variable(:data) => From d0dadad888e16f65953abd60451923b437741a54 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 3 Nov 2015 07:41:15 -0500 Subject: [PATCH 172/630] pull-back only when update_on_kvstore --- src/model.jl | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/src/model.jl b/src/model.jl index b978ec0c6f49..ef34ad1d7669 100644 --- a/src/model.jl +++ b/src/model.jl @@ -372,12 +372,13 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # init kv with gradients for idx = 1:length(param_arrays) param_on_devs = param_arrays[idx] - grad_on_devs = grad_arrays[idx] init!(kvstore, idx, self.arg_params[param_names[idx]]) - # pull weights back - pull!(kvstore, idx, param_on_devs, priority=-idx) + if update_on_kvstore + # pull weights back + pull!(kvstore, idx, param_on_devs, priority=-idx) + end end end From 75b3e68fa9cd57f946a5f206ee36606193952838 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 3 Nov 2015 13:43:56 -0500 Subject: [PATCH 173/630] SVMLight Data Provider --- plugins/io/svmlight.jl | 64 ++++++++++++++++++++++++++++++++++++++++++ src/io.jl | 24 ++++++++++++++-- 2 files changed, 86 insertions(+), 2 deletions(-) create mode 100644 plugins/io/svmlight.jl diff --git a/plugins/io/svmlight.jl b/plugins/io/svmlight.jl new file mode 100644 index 000000000000..ddc207854d4e --- /dev/null +++ b/plugins/io/svmlight.jl @@ -0,0 +1,64 @@ +using MXNet +using SVMLightLoader + +type SVMLightProvider <: mx.AbstractDataProvider + filename :: AbstractString + batch_size :: Int + fea_dim :: Int + data_name :: Symbol + label_name :: Symbol +end + +function SVMLightProvider(filename::AbstractString, batch_size::Int; fea_dim::Int=-1, + data_name::Symbol=:data, label_name::Symbol=:label) + if fea_dim == -1 + info("SVMLightProvider: going over file to get feature dimension of $filename") + f = SVMLightFile(filename) + for 
(data, label) in f + fea_dim = max(fea_dim, length(data)) + end + end + + return SVMLightProvider(filename, batch_size, fea_dim, data_name, label_name) +end + +mx.get_batch_size(provider :: SVMLightProvider) = provider.batch_size +function mx.provide_data(provider :: SVMLightProvider) + [(provider.data_name, (provider.fea_dim, provider.batch_size))] +end +function mx.provide_label(provider :: SVMLightProvider) + [(provider.label_name, (provider.batch_size,))] +end + +function mx.eachbatch(provider :: SVMLightProvider) + data_jl = zeros(mx.MX_float, (provider.fea_dim, provider.batch_size)) + data_nd = mx.empty(size(data_jl)) + label_jl = zeros(mx.MX_float, (provider.batch_size,)) + label_nd = mx.empty(size(label_jl)) + + batch = mx.DataBatch([data_nd], [label_nd], provider.batch_size) + function _svmlight_iter() + f = SVMLightFile(provider.filename) + while true + raw = collect(take(f, provider.batch_size)) + cnt = length(raw) + if cnt == 0 + # end of file, no more data to see + return + end + + data_jl[:] = 0 + for i = 1:provider.batch_size + vec, gnd = raw[min(i,cnt)] + data_jl[1:length(vec),i] = vec + label_jl[i] = gnd + end + mx.copy!(data_nd, data_jl) + mx.copy!(label_nd, label_jl) + batch.count = cnt + produce(batch) + end + end + + return Task(_svmlight_iter) +end diff --git a/src/io.jl b/src/io.jl index 6bbb9a5cf6d5..385de35a2936 100644 --- a/src/io.jl +++ b/src/io.jl @@ -42,7 +42,7 @@ and split it into mini-batches so that the model can consume the data in a unifo .. code-block:: julia - for batch in provider + for batch in eachbatch(provider) data = get_data(provider, batch) end @@ -50,12 +50,15 @@ and split it into mini-batches so that the model can consume the data in a unifo .. 
code-block:: julia - state = Base.start(provider) + state = Base.start(eachbatch(provider)) while !Base.done(provider, state) (batch, state) = Base.next(provider, state) data = get_data(provider, batch) end + By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface + is implemented on the provider type itself. But the extra layer of abstraction allows us to + implement a data provider easily via a Julia ``Task`` coroutine. The detailed interface function is listed below: .. function:: Base.eltype(provider) -> AbstractDataBatch @@ -189,6 +192,21 @@ abstract AbstractDataProviderState =# abstract AbstractDataBatch +#=doc +.. class:: DataBatch + + A basic subclass of :class:`AbstractDataBatch`, that implement the interface by + accessing member fields. +=# +type DataBatch <: AbstractDataBatch + data :: Vector{NDArray} + label :: Vector{NDArray} + count :: Int +end +count_samples(batch :: DataBatch) = batch.count +get_data(batch :: DataBatch) = batch.data +get_label(batch :: DataBatch) = batch.label + #=doc .. class:: SlicedNDArray @@ -240,6 +258,8 @@ function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name error("$name is not provided by this data provider") end +eachbatch(provider :: AbstractDataProvider) = provider + #=doc Built-in data providers ----------------------- From f6cbba1ca080089cabeb297ea44f1b7e0463c208 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 3 Nov 2015 13:47:09 -0500 Subject: [PATCH 174/630] add description of SVMLight Provider --- plugins/io/svmlight.jl | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/plugins/io/svmlight.jl b/plugins/io/svmlight.jl index ddc207854d4e..94563357ee6e 100644 --- a/plugins/io/svmlight.jl +++ b/plugins/io/svmlight.jl @@ -1,3 +1,7 @@ +#=doc +SVMLight / LibSVM is a popular data format for sparse features. 
Some preprocessed +datasets in this format could be found at http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/ +=# using MXNet using SVMLightLoader From 0f22cfa3897668cb044db41059c51d06a600d608 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 3 Nov 2015 13:53:26 -0500 Subject: [PATCH 175/630] add readme for plugins --- plugins/README.md | 14 ++++++++++++++ 1 file changed, 14 insertions(+) create mode 100644 plugins/README.md diff --git a/plugins/README.md b/plugins/README.md new file mode 100644 index 000000000000..38882889f494 --- /dev/null +++ b/plugins/README.md @@ -0,0 +1,14 @@ +# Plugins of MXNet.jl + +This directory contains *plugins* of MXNet.jl. A plugin is typically a component that could be part of MXNet.jl, but excluded from the `mx` namespace. The plugins are included here primarily for two reasons: + +* To minimize the dependency of MXNet.jl on other optional packages. +* To serve as examples on how to extend some components of MXNet.jl. + +The most straightforward way to use a plugin is to `include` the code. 
For example + +```julia +include(joinpath(Pkg.dir("MXNet"), "plugins", "io", "svmlight.jl")) + +provider = SVMLightProvider("/path/to/dataset", 100) +``` From 7ed591d7d83b10cd07f5ece128f8114e8bdbe9f8 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 5 Nov 2015 15:14:11 +0900 Subject: [PATCH 176/630] add libatlas-base for cblas --- .travis.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.travis.yml b/.travis.yml index ed0d03d4906c..8771dfa989b6 100644 --- a/.travis.yml +++ b/.travis.yml @@ -19,6 +19,7 @@ addons: - git - libcurl4-openssl-dev - unzip + - libatlas-base-dev - libatlas-dev - libopencv-dev - gcc-4.8 From ee855ecd36ff3bde759be569e4e0dcd3b49ef1d9 Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 5 Nov 2015 09:00:46 -0500 Subject: [PATCH 177/630] fix cifar10 example --- examples/cifar10/cifar10.jl | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index 37cfacd2cec0..e5ff751eca7d 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -77,9 +77,7 @@ gpus = [mx.Context(mx.GPU, i) for i = 0:num_gpus-1] model = mx.FeedForward(softmax, context=gpus) # optimizer -optimizer = mx.SGD(lr_scheduler=mx.FixedLearningRateScheduler(0.05), - mom_scheduler=mx.FixedMomentumScheduler(0.9), - weight_decay=0.0001) +optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.0001) # fit parameters mx.fit(model, optimizer, train_provider, n_epoch=num_epoch, eval_data=test_provider, From 726badd23dd6960ae800a01f048bab94eb91b3f2 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 7 Nov 2015 18:59:26 -0500 Subject: [PATCH 178/630] update doc for updated data iter API --- docs/api/io.rst | 15 +++++++++++++-- src/model.jl | 6 +++--- 2 files changed, 16 insertions(+), 5 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index b601db39c7ec..a7568a7b6f71 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -43,7 +43,7 @@ and split it into mini-batches so that the 
model can consume the data in a unifo .. code-block:: julia - for batch in provider + for batch in eachbatch(provider) data = get_data(provider, batch) end @@ -51,12 +51,15 @@ and split it into mini-batches so that the model can consume the data in a unifo .. code-block:: julia - state = Base.start(provider) + state = Base.start(eachbatch(provider)) while !Base.done(provider, state) (batch, state) = Base.next(provider, state) data = get_data(provider, batch) end + By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface + is implemented on the provider type itself. But the extra layer of abstraction allows us to + implement a data provider easily via a Julia ``Task`` coroutine. The detailed interface function is listed below: .. function:: Base.eltype(provider) -> AbstractDataBatch @@ -191,6 +194,14 @@ and split it into mini-batches so that the model can consume the data in a unifo +.. class:: DataBatch + + A basic subclass of :class:`AbstractDataBatch`, that implement the interface by + accessing member fields. + + + + .. class:: SlicedNDArray A alias type of ``Tuple{UnitRange{Int},NDArray}``. 
diff --git a/src/model.jl b/src/model.jl index ef34ad1d7669..c291243093c6 100644 --- a/src/model.jl +++ b/src/model.jl @@ -185,7 +185,7 @@ function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::B batch_size = get_batch_size(data) data_arrays = [self.pred_exec.arg_dict[name] for name in data_names] output_list = [Array{MX_float}[] for i=1:length(self.pred_exec.outputs)] - for batch in data + for batch in eachbatch(data) load_data!(data, batch, data_arrays) forward(self.pred_exec, is_train=false) if isa(callback, Void) @@ -402,7 +402,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # invoke callbacks on iteration 0 _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) - for batch in data + for batch in eachbatch(data) load_data!(data, batch, data_arrays) load_label!(data, batch, label_arrays) @@ -473,7 +473,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra @assert(get_batch_size(opts.eval_data) == batch_size) reset!(opts.eval_metric) - for batch in opts.eval_data + for batch in eachbatch(opts.eval_data) load_data!(opts.eval_data, batch, data_arrays) # forward and backward From 637bf0cfbb28a93060e9f44281d28c3e7caf517c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 7 Nov 2015 19:09:35 -0500 Subject: [PATCH 179/630] avoid calling mxdataiter reset --- src/io.jl | 22 ++++++++++++++++++---- test/runtests.jl | 4 ++-- 2 files changed, 20 insertions(+), 6 deletions(-) diff --git a/src/io.jl b/src/io.jl index 385de35a2936..d618a4eef1be 100644 --- a/src/io.jl +++ b/src/io.jl @@ -473,6 +473,11 @@ type MXDataProvider <: AbstractDataProvider data_shape :: Vector{Tuple{Base.Symbol, Tuple}} label_shape:: Vector{Tuple{Base.Symbol, Tuple}} batch_size :: Int + + # those two a auxiliary variables to help avoid calling reset + # but still pre-fetch first batch to get shape information + first_epoch:: Bool + first_batch:: Bool end function _reset_data_iter(handle :: 
MX_DataIterHandle) @@ -499,7 +504,6 @@ function MXDataProvider(handle :: MX_DataIterHandle; label_name :: Union{Base.Symbol,Void}=:softmax_label, kwargs...) # for convenience, we ignore the rest keyword arguments # init iterator, load the first batch and get shapes - _reset_data_iter(handle) @assert(_iter_next(handle), "Failed to load the first batch in MXDataProvider") data_shape = Tuple{Base.Symbol, Tuple}[(data_name, size(_get_data(handle)))] if !isa(label_name, Void) @@ -508,7 +512,7 @@ function MXDataProvider(handle :: MX_DataIterHandle; label_shape = Tuple{Base.Symbol, Tuple}[] end - MXDataProvider(handle, data_shape, label_shape, data_shape[1][2][end]) + MXDataProvider(handle, data_shape, label_shape, data_shape[1][2][end], true, true) end provide_data(provider::MXDataProvider) = provider.data_shape @@ -525,11 +529,21 @@ function Base.eltype(provider :: MXDataProvider) MXDataBatch end function Base.start(provider :: MXDataProvider) - _reset_data_iter(provider.handle) + if !provider.first_epoch + _reset_data_iter(provider.handle) + else + provider.first_epoch = false + end + return MXDataProviderState(true) end function Base.done(provider :: MXDataProvider, state :: MXDataProviderState) - state.has_next = _iter_next(provider.handle) + if provider.first_batch + state.has_next = true + provider.first_batch = false + else + state.has_next = _iter_next(provider.handle) + end return !state.has_next end function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) diff --git a/test/runtests.jl b/test/runtests.jl index 53c8cbc3bb74..cd9087b7202b 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -11,8 +11,8 @@ function test_dir(dir) end end -include("common.jl") -test_dir("unittest") +include(joinpath(dirname(@__FILE__), "common.jl")) +test_dir(joinpath(dirname(@__FILE__), "unittest")) # run the basic MNIST mlp example if haskey(ENV, "CONTINUOUS_INTEGRATION") From ee0583f82d093654b0d66379a118822fca26da1c Mon Sep 17 00:00:00 2001 From: Chiyuan 
Zhang Date: Sun, 8 Nov 2015 10:43:57 -0500 Subject: [PATCH 180/630] remove unused variable --- src/kvstore.jl | 1 - 1 file changed, 1 deletion(-) diff --git a/src/kvstore.jl b/src/kvstore.jl index 562edc3d4850..d52433f567b2 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -107,7 +107,6 @@ end # extra handle parameter of the API to pass the updater object around. Fix this when someday # full closure cfunction is supported in Julia. function _kvstore_update_wrapper(index::Cint, nd_recv::MX_handle, nd_local::MX_handle, updater::Ptr{Void}) - x = unsafe_pointer_to_objref(updater) updater_func = unsafe_pointer_to_objref(updater) :: Function updater_func(Int(index), NDArray(MX_NDArrayHandle(nd_recv)), NDArray(MX_NDArrayHandle(nd_local))) return nothing From 315c1a4aff9355e2be6baa1d9993de26145e078b Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 00:29:06 -0500 Subject: [PATCH 181/630] simplify a bit io test --- test/unittest/io.jl | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/test/unittest/io.jl b/test/unittest/io.jl index d34fb674b689..33be1eac3da1 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -52,8 +52,7 @@ function test_arrays_impl(data::Vector, label::Vector, provider::mx.ArrayDataPro info("IO::Array::#data=$(length(data)),#label=$(length(label)),batch_size=$batch_size") for (idx, batch) in zip(idx_all, provider) data_batch = [x[[Colon() for i=1:ndims(x)-1]..., idx:min(idx+batch_size-1,sample_count)] for x in data] - data_get = [mx.empty(size(x)[1:end-1]..., batch_size) for x in data] - mx.load_data!(provider, batch, [[(1:batch_size, x)] for x in data_get]) + data_get = mx.get_data(provider, batch) for (d_real, d_get) in zip(data_batch, data_get) @test reldiff(d_real, copy(d_get)[[1:n for n in size(d_real)]...]) < 1e-6 From 722eb369998133e0820f27611229fc60d15c6afa Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 00:50:51 -0500 Subject: [PATCH 182/630] fix array data iter provide size not 
properly reported (see #14) --- src/io.jl | 4 ++-- test/unittest/io.jl | 7 +++++++ 2 files changed, 9 insertions(+), 2 deletions(-) diff --git a/src/io.jl b/src/io.jl index d618a4eef1be..c7e5616c6565 100644 --- a/src/io.jl +++ b/src/io.jl @@ -394,10 +394,10 @@ function ArrayDataProvider(data::Any, label::Any; batch_size::Int=0, shuffle::Bo end function provide_data(provider::ArrayDataProvider) - return collect(zip(provider.data_names, map(size, provider.data_arrays))) + return collect(zip(provider.data_names, map(size, provider.data_batch))) end function provide_label(provider::ArrayDataProvider) - return collect(zip(provider.label_names, map(size, provider.label_arrays))) + return collect(zip(provider.label_names, map(size, provider.label_batch))) end get_batch_size(provider::ArrayDataProvider) = provider.batch_size diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 33be1eac3da1..8ef3b57d948c 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -49,6 +49,13 @@ function test_arrays_impl(data::Vector, label::Vector, provider::mx.ArrayDataPro batch_size = mx.get_batch_size(provider) idx_all = 1:batch_size:sample_count + for (d1, (_, d2)) in zip(data, mx.provide_data(provider)) + @test size(d1)[1:end-1] == d2[1:end-1] + end + for (d1, (_, d2)) in zip(label, mx.provide_label(provider)) + @test size(d1)[1:end-1] == d2[1:end-1] + end + info("IO::Array::#data=$(length(data)),#label=$(length(label)),batch_size=$batch_size") for (idx, batch) in zip(idx_all, provider) data_batch = [x[[Colon() for i=1:ndims(x)-1]..., idx:min(idx+batch_size-1,sample_count)] for x in data] From 189e755b0ba537d4f81e10d30579931ea727992a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 09:37:03 -0500 Subject: [PATCH 183/630] prepare for v0.0.4 --- NEWS.md | 9 ++++++++- docs/conf.py | 4 ++-- 2 files changed, 10 insertions(+), 3 deletions(-) diff --git a/NEWS.md b/NEWS.md index 84858e3aca13..f970f7d64703 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,4 +1,11 @@ -# 
v.0.03 (2015.10.27) +# v0.0.4 (2015.11.09) + +* ADAM optimizer (@cbecker) +* Improved data provider API. +* More documentation. +* Fix a bug in array data iterator (@vchuravy) + +# v0.0.3 (2015.10.27) * Model prediction API. * Model checkpoint loading and saving. diff --git a/docs/conf.py b/docs/conf.py index ca57eed31146..b009877694a0 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -56,9 +56,9 @@ # built documents. # # The short X.Y version. -version = '0.0.3' +version = '0.0.4' # The full version, including alpha/beta/rc tags. -release = '0.0.3' +release = '0.0.4' # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. From 76261c736743d3256a0a9502429b1d95f2796026 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 15:19:58 -0500 Subject: [PATCH 184/630] refactoring: Symbol -> Node --- src/MXNet.jl | 2 +- src/executor.jl | 16 ++-- src/io.jl | 2 +- src/model.jl | 12 +-- src/{symbol.jl => node.jl} | 122 +++++++++++++-------------- test/unittest/{symbol.jl => node.jl} | 16 ++-- 6 files changed, 85 insertions(+), 85 deletions(-) rename src/{symbol.jl => node.jl} (77%) rename test/unittest/{symbol.jl => node.jl} (91%) diff --git a/src/MXNet.jl b/src/MXNet.jl index 53553d417941..68875b62da90 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -15,7 +15,7 @@ include("ndarray.jl") include("random.jl") include("name.jl") -include("symbol.jl") +include("node.jl") include("executor.jl") include("metric.jl") diff --git a/src/executor.jl b/src/executor.jl index 4485bc6dce9a..6dea17763101 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -6,13 +6,13 @@ Executor #=doc .. class:: Executor - An executor is a realization of a symbolic architecture defined by a :class:`Symbol`. + An executor is a realization of a symbolic architecture defined by a :class:`Node`. The actual forward and backward computation specified by the network architecture can be carried out with an executor. 
=# type Executor handle :: MX_ExecutorHandle - symbol :: Symbol + symbol :: Node arg_arrays :: Vector{NDArray} grad_arrays :: Vector{Union{Void,NDArray}} aux_arrays :: Vector{NDArray} @@ -20,7 +20,7 @@ type Executor arg_dict :: Dict{Base.Symbol, NDArray} aux_dict :: Dict{Base.Symbol, NDArray} end -function Executor(hdr :: MX_ExecutorHandle, symbol :: Symbol, +function Executor(hdr :: MX_ExecutorHandle, symbol :: Node, arg_arrays :: Vector{NDArray}, grad_arrays :: Vector{Union{Void,NDArray}}, aux_arrays :: Vector{NDArray}) # get output arrays @@ -73,9 +73,9 @@ end #=doc .. function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) - Create an :class:`Executor` by binding a :class:`Symbol` to concrete :class:`NDArray`. + Create an :class:`Executor` by binding a :class:`Node` to concrete :class:`NDArray`. - :param Symbol sym: the network architecture describing the computation graph. + :param Node sym: the network architecture describing the computation graph. :param Context ctx: the context on which the computation should run. :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete arrays for all the inputs in the network architecture. 
The inputs typically include @@ -86,7 +86,7 @@ end :param grad_req: =# @enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 -function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; +function bind(self :: Node, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), aux_states :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), grad_req :: Union{GRAD_REQ,Vector{GRAD_REQ},Dict{Base.Symbol,GRAD_REQ}} = GRAD_WRITE) @@ -116,7 +116,7 @@ function bind(self :: Symbol, ctx :: Context, args :: Union{Vector{NDArray},Dict executor = Executor(MX_ExecutorHandle(ref_hdr[]), self, args, args_grad, aux_states) end -function bind(self :: Symbol; kwargs...) +function bind(self :: Node; kwargs...) kwargs = Dict(kwargs) @assert(haskey(kwargs, :args), "Must specify args") args = pop!(kwargs, :args) @@ -128,7 +128,7 @@ function bind(self :: Symbol; kwargs...) bind(self, context, args; kwargs...) end -function simple_bind(self :: Symbol, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) +function simple_bind(self :: Node, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) arg_shapes, out_shapes, aux_shapes = infer_shape(self; kwargs...) @assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") diff --git a/src/io.jl b/src/io.jl index c7e5616c6565..5c59e96bb611 100644 --- a/src/io.jl +++ b/src/io.jl @@ -35,7 +35,7 @@ and split it into mini-batches so that the model can consume the data in a unifo training stage, both *data* and *label* will be feeded into the model, while during prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and of any shapes. The provided data and label names here should match the input names in a target - :class:`Symbol`. + :class:`Node`. 
A data provider should also implement the Julia iteration interface, in order to allow iterating through the data set. The provider will be called in the following way: diff --git a/src/model.jl b/src/model.jl index c291243093c6..93189124d9b0 100644 --- a/src/model.jl +++ b/src/model.jl @@ -23,7 +23,7 @@ abstract AbstractModel that handles sequential data explicitly, please use **TODO**... =# type FeedForward <: AbstractModel - arch :: Symbol + arch :: Node ctx :: Vector{Context} arg_params :: Dict{Base.Symbol, NDArray} @@ -32,7 +32,7 @@ type FeedForward <: AbstractModel pred_exec :: Union{Executor, Void} # leave the rest fields undefined - FeedForward(arch :: Symbol, ctx :: Vector{Context}) = new(arch, ctx) + FeedForward(arch :: Node, ctx :: Vector{Context}) = new(arch, ctx) end """Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector @@ -52,14 +52,14 @@ function _split_inputs(batch_size :: Int, n_split :: Int) end #=doc -.. function:: FeedForward(arch :: Symbol, ctx) +.. function:: FeedForward(arch :: Node, ctx) :param arch: the architecture of the network constructed using the symbolic API. :param ctx: the devices on which this model should do computation. It could be a single :class:`Context` or a list of :class:`Context` objects. In the latter case, data parallelization will be used for training. If no context is provided, the default context ``cpu()`` will be used. 
=# -function FeedForward(arch :: Symbol; context :: Union{Context, Vector{Context}, Void} = nothing) +function FeedForward(arch :: Node; context :: Union{Context, Vector{Context}, Void} = nothing) if isa(context, Void) context = [Context(CPU)] elseif isa(context, Context) @@ -514,7 +514,7 @@ end function save_checkpoint(self :: FeedForward, prefix :: AbstractString, state :: OptimizationState) save_checkpoint(self.arch, self.arg_params, self.aux_params, prefix, state.curr_epoch) end -function save_checkpoint(sym :: Symbol, arg_params :: Dict{Base.Symbol, NDArray}, +function save_checkpoint(sym :: Node, arg_params :: Dict{Base.Symbol, NDArray}, aux_params :: Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) save("$prefix-symbol.json", sym) save_dict = merge(Dict([symbol("arg:$k") => v for (k,v) in arg_params]), @@ -525,7 +525,7 @@ function save_checkpoint(sym :: Symbol, arg_params :: Dict{Base.Symbol, NDArray} end function load_checkpoint(prefix :: AbstractString, epoch :: Int) - arch = load("$prefix-symbol.json", Symbol) + arch = load("$prefix-symbol.json", Node) saved_dict = load(format("{1}-{2:04d}.params", prefix, epoch), NDArray) arg_params = Dict{Base.Symbol, NDArray}() aux_params = Dict{Base.Symbol, NDArray}() diff --git a/src/symbol.jl b/src/node.jl similarity index 77% rename from src/symbol.jl rename to src/node.jl index 13338602f259..337d50864684 100644 --- a/src/symbol.jl +++ b/src/node.jl @@ -4,50 +4,50 @@ Symbolic API =# #=doc -.. class:: Symbol +.. class:: Node - Symbol is the basic building block of the symbolic graph in MXNet.jl. + Node is the basic building block of the symbolic graph in MXNet.jl. .. note:: - Throughout this documentation, ``Symbol`` always refer to this :class:`Symbol` type. - When we refer to the Julia's build-in symbol type (e.g. ``typeof(:foo)``), we always + Throughout this documentation, ``Node`` always refer to this :class:`Node` type. + When we refer to the Julia's build-in Node type (e.g. 
``typeof(:foo)``), we always say ``Base.Symbol``. =# -type Symbol +type Node handle :: MX_SymbolHandle end -function Base.unsafe_convert(::Type{MX_handle}, obj::Symbol) +function Base.unsafe_convert(::Type{MX_handle}, obj::Node) Base.unsafe_convert(MX_handle, obj.handle) end -Base.convert(t::Type{MX_handle}, obj::Symbol) = Base.unsafe_convert(t, obj) -Base.cconvert(t::Type{MX_handle}, obj::Symbol) = Base.unsafe_convert(t, obj) +Base.convert(t::Type{MX_handle}, obj::Node) = Base.unsafe_convert(t, obj) +Base.cconvert(t::Type{MX_handle}, obj::Node) = Base.unsafe_convert(t, obj) #=doc -.. function:: deepcopy(self :: Symbol) +.. function:: deepcopy(self :: Node) - Make a deep copy of a symbol. + Make a deep copy of a Node. =# -function Base.deepcopy(self :: Symbol) +function Base.deepcopy(self :: Node) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCopy, (MX_handle, Ref{MX_handle}), self, ref_hdr) - return Symbol(MX_SymbolHandle(ref_hdr[])) + return Node(MX_SymbolHandle(ref_hdr[])) end #=doc -.. function:: copy(self :: Symbol) +.. function:: copy(self :: Node) - Make a copy of a symbol. The same as making a deep copy. + Make a copy of a Node. The same as making a deep copy. =# -function Base.copy(self :: Symbol) +function Base.copy(self :: Node) Base.deepcopy(self) end -function Base.call(self :: Symbol, args :: Symbol...) +function Base.call(self :: Node, args :: Node...) s = deepcopy(self) _compose!(s, args...) end -function Base.call(self :: Symbol; kwargs...) +function Base.call(self :: Node; kwargs...) s = deepcopy(self) _compose!(s; kwargs...) end @@ -64,10 +64,10 @@ macro _list_symbol_info(self, func_name) return names end end -function list_arguments(self :: Symbol) +function list_arguments(self :: Node) @_list_symbol_info(self, :MXSymbolListArguments) end -function list_outputs(self :: Symbol) +function list_outputs(self :: Node) @_list_symbol_info(self, :MXSymbolListOutputs) end """List all auxiliary states in the symbool. 
@@ -77,31 +77,31 @@ and do not have gradient. But still be useful for the specific operations. A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. Most operators do not have Auxiliary states. """ -function list_auxiliary_states(self :: Symbol) +function list_auxiliary_states(self :: Node) @_list_symbol_info(self, :MXSymbolListAuxiliaryStates) end -"Get a new grouped symbol whose output contains all the internal outputs of this symbol." -function get_internals(self :: Symbol) +"Get a new grouped Node whose output contains all the internal outputs of this Node." +function get_internals(self :: Node) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolGetInternals, (MX_handle, Ref{MX_handle}), self, ref_hdr) - return Symbol(MX_SymbolHandle(ref_hdr[])) + return Node(MX_SymbolHandle(ref_hdr[])) end "Create a symbolic variable with the given name" function Variable(name :: Union{Base.Symbol, AbstractString}) hdr_ref = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) - Symbol(MX_SymbolHandle(hdr_ref[])) + Node(MX_SymbolHandle(hdr_ref[])) end -"Create a symbol that groups symbols together" -function Group(symbols :: Symbol...) +"Create a Node that groups symbols together" +function Group(symbols :: Node...) handles = MX_handle[symbols...] ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateGroup, (MX_uint, Ptr{MX_handle}, Ref{MX_handle}), length(handles), handles, ref_hdr) - Symbol(MX_SymbolHandle(ref_hdr[])) + Node(MX_SymbolHandle(ref_hdr[])) end macro _infer_shape(self, keys, indptr, sdata) @@ -147,7 +147,7 @@ macro _infer_shape(self, keys, indptr, sdata) end end end -function infer_shape(self :: Symbol; kwargs...) +function infer_shape(self :: Node; kwargs...) sdata = MX_uint[] indptr = MX_uint[0] for (k,v) in kwargs @@ -157,7 +157,7 @@ function infer_shape(self :: Symbol; kwargs...) 
keys = AbstractString[string(x[1]) for x in kwargs] @_infer_shape(self, keys, indptr, sdata) end -function infer_shape(self :: Symbol, args :: Union{Tuple, Void}...) +function infer_shape(self :: Node, args :: Union{Tuple, Void}...) sdata = MX_uint[] indptr = MX_uint[0] for arg in args @@ -169,42 +169,42 @@ function infer_shape(self :: Symbol, args :: Union{Tuple, Void}...) @_infer_shape(self, keys, indptr, sdata) end -function Base.getindex(self :: Symbol, idx :: Union{Base.Symbol, AbstractString}) +function Base.getindex(self :: Node, idx :: Union{Base.Symbol, AbstractString}) idx = symbol(idx) i_idx = find(idx .== list_outputs(self)) @assert(length(i_idx) > 0, "Cannot find output with name '$idx'") @assert(length(i_idx) < 2, "Found duplicated output with name '$idx'") Base.getindex(self, i_idx[1]) end -function Base.getindex(self :: Symbol, idx :: Int) +function Base.getindex(self :: Node, idx :: Int) ref_hdr = Ref{MX_handle}(0) # note Julia is 1-based, while MXNet is 0-based @mxcall(:MXSymbolGetOutput, (MX_handle, MX_uint, Ref{MX_handle}), self, idx-1, ref_hdr) - return Symbol(MX_SymbolHandle(ref_hdr[])) + return Node(MX_SymbolHandle(ref_hdr[])) end import Base: +, .+ -function +(self :: Symbol, args :: Symbol...) +function +(self :: Node, args :: Node...) ret = self for arg in args ret = _Plus(ret, arg) end ret end -function .+(self :: Symbol, args :: Symbol...) +function .+(self :: Node, args :: Node...) +(self, args...) end import Base: -, .- -function -(self :: Symbol, arg :: Symbol) +function -(self :: Node, arg :: Node) _Minus(self, arg) end -function .-(self :: Symbol, arg :: Symbol) +function .-(self :: Node, arg :: Node) -(self, arg) end import Base: .* -function .*(self :: Symbol, args :: Symbol...) +function .*(self :: Node, args :: Node...) ret = self for arg in args ret = _Mul(ret, arg) @@ -213,11 +213,11 @@ function .*(self :: Symbol, args :: Symbol...) 
end import Base: ./ -function ./(self :: Symbol, arg :: Symbol) +function ./(self :: Node, arg :: Node) _Div(self, arg) end -function _compose!(sym :: Symbol; kwargs...) +function _compose!(sym :: Node; kwargs...) name = char_p(0) arg_keys = AbstractString[] arg_vals = MX_handle[] @@ -226,7 +226,7 @@ function _compose!(sym :: Symbol; kwargs...) if k == :name name = string(v) else - @assert(isa(v, Symbol), "Compose expect `Symbol` as arguments") + @assert(isa(v, Node), "Compose expect `Node` as arguments") push!(arg_keys, string(k)) push!(arg_vals, v) end @@ -237,10 +237,10 @@ function _compose!(sym :: Symbol; kwargs...) sym, name, length(arg_keys), arg_keys, arg_vals) return sym end -function _compose!(sym :: Symbol, args::Symbol...) +function _compose!(sym :: Node, args::Node...) _compose!(sym, char_p(0), args...) end -function _compose!(sym :: Symbol, name :: Union{Base.Symbol, char_p}, args::Symbol...) +function _compose!(sym :: Node, name :: Union{Base.Symbol, char_p}, args::Node...) if isa(name, Base.Symbol); name = string(name); end arg_keys = Ptr{char_p}(0) arg_vals = MX_handle[args...] 
@@ -251,27 +251,27 @@ function _compose!(sym :: Symbol, name :: Union{Base.Symbol, char_p}, args::Symb return sym end -"""Save Symbol into a JSON string""" -function to_json(self :: Symbol) +"""Save Node into a JSON string""" +function to_json(self :: Node) ref_json = Ref{char_p}(0) @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json) return bytestring(ref_json[]) end -"""Load Symbol from a JSON string representation.""" -function from_json(repr :: AbstractString, ::Type{Symbol}) +"""Load Node from a JSON string representation.""" +function from_json(repr :: AbstractString, ::Type{Node}) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateFromJSON, (char_p, Ref{MX_handle}), repr, ref_hdr) - return Symbol(MX_SymbolHandle(ref_hdr[])) + return Node(MX_SymbolHandle(ref_hdr[])) end -"""Load Symbol from a JSON file.""" -function load(filename :: AbstractString, ::Type{Symbol}) +"""Load Node from a JSON file.""" +function load(filename :: AbstractString, ::Type{Node}) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateFromFile, (char_p, Ref{MX_handle}), filename, ref_hdr) - return Symbol(MX_SymbolHandle(ref_hdr[])) + return Node(MX_SymbolHandle(ref_hdr[])) end -function save(filename :: AbstractString, sym :: Symbol) +function save(filename :: AbstractString, sym :: Node) @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), sym, filename) end @@ -279,10 +279,10 @@ end libmxnet APIs ------------- -**autogen:EMBED:symbol:EMBED:autogen** +**autogen:EMBED:Node:EMBED:autogen** =# ################################################################################ -# Atomic Symbol functions dynamically imported from libmxnet +# Atomic Node functions dynamically imported from libmxnet ################################################################################ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) ref_name = Ref{char_p}(0) @@ -305,11 +305,11 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) if gen_docs 
f_desc = bytestring(ref_desc[]) * "\n\n" if !isempty(kv_nargs_s) - f_desc *= "This function support variable length positional :class:`Symbol` inputs.\n\n" + f_desc *= "This function support variable length positional :class:`Node` inputs.\n\n" end f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional.\n\n" - f_desc *= ":return: the constructed :class:`Symbol`.\n\n" + f_desc *= ":param Base.Symbol name: The name of the Node. (e.g. `:my_symbol`), optional.\n\n" + f_desc *= ":return: the constructed :class:`Node`.\n\n" return (func_name, f_desc) end @@ -325,7 +325,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) param_keys = AbstractString[] param_vals = AbstractString[] - symbol_kws = Dict{Base.Symbol, Symbol}() + symbol_kws = Dict{Base.Symbol, Node}() $(if kv_nargs != symbol("") quote @@ -338,7 +338,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) for (k,v) in kwargs if k == :name; continue; end - if isa(v, Symbol) + if isa(v, Node) symbol_kws[k] = v else push!(param_keys, string(k)) @@ -352,20 +352,20 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) $(if kv_nargs != symbol("") quote if length(symbol_kws) > 0 - @assert(false, "$func_name takes variable number of Symbol arguments, please pass input Symbols " * + @assert(false, "$func_name takes variable number of Node arguments, please pass input Symbols " * "via positional arguments, instead of keyword arguments.") end end end) - # create the symbol + # create the Node ref_sym_hdr = Ref{MX_handle}() @mxcall(:MXSymbolCreateAtomicSymbol, (MX_handle, MX_uint, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}), $hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr) sym_hdr = ref_sym_hdr[] - sym = Symbol(MX_SymbolHandle(sym_hdr)) + sym = Node(MX_SymbolHandle(sym_hdr)) hint = lowercase(string($func_name)) name = 
get!(DEFAULT_NAME_MANAGER, name, hint) diff --git a/test/unittest/symbol.jl b/test/unittest/node.jl similarity index 91% rename from test/unittest/symbol.jl rename to test/unittest/node.jl index 3397b7eaf70d..f7e9b51e60f0 100644 --- a/test/unittest/symbol.jl +++ b/test/unittest/node.jl @@ -1,4 +1,4 @@ -module TestSymbol +module TestNode using MXNet using Base.Test @@ -8,7 +8,7 @@ using ..Main: mlp2 # Test Implementations ################################################################################ function test_basic() - info("Symbol::basic") + info("Node::basic") model = mlp2() @test mx.list_arguments(model) == [:data,:fc1_weight,:fc1_bias,:fc2_weight,:fc2_bias] @@ -17,7 +17,7 @@ function test_basic() end function test_internal() - info("Symbol::internal") + info("Node::internal") data = mx.Variable(:data) oldfc = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) @@ -31,7 +31,7 @@ function test_internal() end function test_compose() - info("Symbol::compose") + info("Node::compose") data = mx.Variable(:data) net1 = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) @@ -47,7 +47,7 @@ function test_compose() end function test_infer_shape() - info("Symbol::infer_shape::mlp2") + info("Node::infer_shape::mlp2") model = mlp2() data_shape = (100, 100) @@ -61,7 +61,7 @@ function test_infer_shape() end function test_infer_shape_error() - info("Symbol::infer_shape::throws") + info("Node::infer_shape::throws") model = mlp2() weight_shape = (100, 1) @@ -70,12 +70,12 @@ function test_infer_shape_error() end function test_saveload() - info("Symbol::saveload::mlp2") + info("Node::saveload::mlp2") model = mlp2() fname = tempname() mx.save(fname, model) - model2 = mx.load(fname, mx.Symbol) + model2 = mx.load(fname, mx.Node) @test mx.to_json(model) == mx.to_json(model2) rm(fname) From 955b6d2d1f028950e7540a9f5d468f3c91ba657e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 15:22:25 -0500 Subject: [PATCH 185/630] refactor: Node -> SymbolicNode --- 
src/MXNet.jl | 2 +- src/MXNet.jl-e | 35 + src/base.jl-e | 212 ++++++ src/callback.jl-e | 142 ++++ src/context.jl-e | 44 ++ src/executor.jl | 16 +- src/executor.jl-e | 197 +++++ src/initializer.jl-e | 117 +++ src/io.jl | 2 +- src/io.jl-e | 641 ++++++++++++++++ src/kvstore.jl | 2 +- src/kvstore.jl-e | 132 ++++ src/metric.jl-e | 37 + src/model.jl | 12 +- src/model.jl-e | 566 ++++++++++++++ src/name.jl-e | 44 ++ src/ndarray.jl-e | 800 ++++++++++++++++++++ src/optimizer.jl-e | 226 ++++++ src/random.jl-e | 25 + src/symbolic-node.jl | 437 +++++++++++ src/{node.jl => symbolic-node.jl-e} | 0 src/util.jl-e | 70 ++ test/unittest/{node.jl => symbolic-node.jl} | 16 +- 23 files changed, 3750 insertions(+), 25 deletions(-) create mode 100644 src/MXNet.jl-e create mode 100644 src/base.jl-e create mode 100644 src/callback.jl-e create mode 100644 src/context.jl-e create mode 100644 src/executor.jl-e create mode 100644 src/initializer.jl-e create mode 100644 src/io.jl-e create mode 100644 src/kvstore.jl-e create mode 100644 src/metric.jl-e create mode 100644 src/model.jl-e create mode 100644 src/name.jl-e create mode 100644 src/ndarray.jl-e create mode 100644 src/optimizer.jl-e create mode 100644 src/random.jl-e create mode 100644 src/symbolic-node.jl rename src/{node.jl => symbolic-node.jl-e} (100%) create mode 100644 src/util.jl-e rename test/unittest/{node.jl => symbolic-node.jl} (90%) diff --git a/src/MXNet.jl b/src/MXNet.jl index 68875b62da90..f9f9e8664c4f 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -15,7 +15,7 @@ include("ndarray.jl") include("random.jl") include("name.jl") -include("node.jl") +include("symbolic-node.jl") include("executor.jl") include("metric.jl") diff --git a/src/MXNet.jl-e b/src/MXNet.jl-e new file mode 100644 index 000000000000..f9f9e8664c4f --- /dev/null +++ b/src/MXNet.jl-e @@ -0,0 +1,35 @@ +__precompile__() + +module MXNet + +# we put everything in the namespace mx, because there are a lot of +# functions with the same names as built-in utilities 
like "zeros", etc. +export mx +module mx +using Formatting + +include("base.jl") +include("context.jl") + +include("ndarray.jl") +include("random.jl") + +include("name.jl") +include("symbolic-node.jl") +include("executor.jl") + +include("metric.jl") +include("optimizer.jl") +include("initializer.jl") + +include("io.jl") +include("kvstore.jl") + +include("callback.jl") +include("model.jl") + +include("util.jl") + +end # mx + +end # module MXNet diff --git a/src/base.jl-e b/src/base.jl-e new file mode 100644 index 000000000000..0988400b9d31 --- /dev/null +++ b/src/base.jl-e @@ -0,0 +1,212 @@ +"Exception thrown when an error occurred calling MXNet API." +immutable MXError <: Exception + msg :: AbstractString +end + +################################################################################ +# Common types used in MXNet API +################################################################################ +typealias MX_uint Cuint +typealias MX_float Cfloat +typealias MX_handle Ptr{Void} + +typealias char_p Ptr{UInt8} +typealias char_pp Ptr{char_p} + +################################################################################ +# Initialization and library API entrance +################################################################################ +const MXNET_LIB = Libdl.find_library(["libmxnet.so","libmxnet.dll"], + [joinpath("$(get(ENV,"MXNET_HOME",""))","lib"), + joinpath(Pkg.dir("MXNet"),"deps/usr/lib")]) +if isempty(MXNET_LIB) + # touch this file, so that after the user properly build libmxnet, the precompiled + # MXNet.ji will be re-compiled to get MXNET_LIB properly. + touch(@__FILE__) + error("Cannot find or load libmxnet.so. 
Please see the document on how to build it.") +end + +function __init__() + _import_ndarray_functions() + _import_atomic_symbol_creators() + _import_io_iterators() + + atexit() do + # notify libmxnet we are shutting down + ccall( ("MXNotifyShutdown", MXNET_LIB), Cint, () ) + end +end + +function mx_get_last_error() + msg = ccall( ("MXGetLastError", MXNET_LIB), char_p, () ) + if msg == C_NULL + throw(MXError("Failed to get last error message")) + end + return bytestring(msg) +end + +"Utility macro to call MXNet API functions" +macro mxcall(fv, argtypes, args...) + f = eval(fv) + args = map(esc, args) + quote + _mxret = ccall( ($(Meta.quot(f)), $MXNET_LIB), + Cint, $argtypes, $(args...) ) + if _mxret != 0 + err_msg = mx_get_last_error() + throw(MXError(err_msg)) + end + end +end + +################################################################################ +# Handle types +################################################################################ +macro mx_define_handle_t(name, destructor) + name = esc(name) + quote + type $name + value :: MX_handle + + function $name(value = C_NULL) + hdr = new(value) + + $(if destructor != :nop + :(finalizer(hdr, delete!)) + end) + + return hdr + end + end + + $(if finalizer != :nop + quote + function delete!(h :: $name) + if h.value != C_NULL + @mxcall($(Meta.quot(destructor)), (MX_handle,), h.value) + h.value = C_NULL + end + end + end + end) + + function Base.unsafe_convert(::Type{MX_handle}, obj::$name) + obj.value + end + Base.convert(t::Type{MX_handle}, obj::$name) = Base.unsafe_convert(t, obj) + Base.cconvert(t::Type{MX_handle}, obj::$name) = Base.unsafe_convert(t, obj) + + function Base.isnull(obj::$name) obj.value == C_NULL end + end +end + +@mx_define_handle_t(MX_NDArrayHandle, MXNDArrayFree) +@mx_define_handle_t(MX_FunctionHandle, nop) +@mx_define_handle_t(MX_SymbolHandle, MXSymbolFree) +@mx_define_handle_t(MX_ExecutorHandle, MXExecutorFree) +@mx_define_handle_t(MX_DataIterHandle, MXDataIterFree) 
+@mx_define_handle_t(MX_KVStoreHandle, MXKVStoreFree) + +################################################################################ +# MXNet Params +# +# MXNet API use string to pass some common parameters like the configurations +# when defining layers. Typically, it is enough to use string(obj) to get a +# recognizable representation for libmxnet. However, there is currently a +# caveat: +# +# Because Julia use column-major ordering for tensors. In order to properly +# interact with Julia Arrays, the shape will look "reversed" from the Julia +# side. For example, a typical MNIST mini-batch tensor is of shape (28,28,1,100) +# from Julia side, while the shape information for the same piece of memory +# should be interpreted as (100,1,28,28) from C/C++/Python side. +# +# Therefore, when passing parameters to libmxnet, we should reverse the shape +# parameter. For example, when the user specify a non-square kernel size for +# a convolution or pooling layer. Unfortunately, those operators are automatically +# imported, and information about the type of each parameter is somehow limited. +# One hacky way is to match the type description for the string "Shape(tuple)" +# when importing operators. But currently we simply decided to reverse **all** +# NTuple{N, Int} passed to libmxnet. +# +# TODO: find a better solution in case this cause issues in the future. +################################################################################ +function dump_mx_param(val :: Any) + string(val) +end +function dump_mx_param{N,T<:Integer}(shape :: NTuple{N, T}) + string(tuple(flipdim([shape...],1)...)) +end + +"""A convenient macro copied from Mocha.jl that could be used to define structs +with default values and type checks. 
For example +```julia +@defstruct MyStruct Any ( + field1 :: Int = 0, + (field2 :: AbstractString = "", !isempty(field2)) +) +``` +where each field could be either +```julia +field_name :: field_type = default_value +``` +or put within a tuple, with the second element +specifying a validation check on the field value. +In the example above, the default value for +field2 does not satisfy the assertion, this +could be used to force user to provide a +valid value when no meaningful default value +is available. + +The macro will define a constructor that could accept +the keyword arguments. +""" +macro defstruct(name, super_name, fields) + @assert fields.head == :tuple + fields = fields.args + @assert length(fields) > 0 + name = esc(name) + super_name = esc(super_name) + + field_defs = Array(Expr, length(fields)) # :(field2 :: Int) + field_names = Array(Expr, length(fields)) # :field2 + field_defaults = Array(Expr, length(fields)) # :(field2 = 0) + field_types = Array(Expr, length(fields)) # Int + field_asserts = Array(Expr, length(fields)) # :(field2 >= 0) + + for i = 1:length(fields) + field = fields[i] + if field.head == :tuple + field_asserts[i] = esc(field.args[2]) + field = field.args[1] + end + field_defs[i] = esc(field.args[1]) + field_names[i] = esc(field.args[1].args[1]) + field_types[i] = esc(field.args[1].args[2]) + field_defaults[i] = Expr(:kw, field.args[1].args[1], esc(field.args[2])) + end + + # body of layer type, defining fields + type_body = Expr(:block, field_defs...) + + # constructor + converts = map(zip(field_names, field_types)) do param + f_name, f_type = param + :($f_name = convert($f_type, $f_name)) + end + asserts = map(filter(i -> isdefined(field_asserts,i), 1:length(fields))) do i + :(@assert($(field_asserts[i]))) + end + construct = Expr(:call, name, field_names...) 
+ ctor_body = Expr(:block, converts..., asserts..., construct) + ctor_def = Expr(:call, name, Expr(:parameters, field_defaults...)) + ctor = Expr(:(=), ctor_def, ctor_body) + + quote + type $(name) <: $super_name + $type_body + end + + $ctor + end +end diff --git a/src/callback.jl-e b/src/callback.jl-e new file mode 100644 index 000000000000..9f3d85b576ff --- /dev/null +++ b/src/callback.jl-e @@ -0,0 +1,142 @@ +#=doc +Callbacks in training +===================== +=# + +#=doc +.. class:: AbstractCallback + + Abstract type of callback functions used in training. +=# +abstract AbstractCallback + +#=doc +.. class:: AbstractBatchCallback + + Abstract type of callbacks to be called every mini-batch. +=# +abstract AbstractBatchCallback <: AbstractCallback + +#=doc +.. class:: AbstractEpochCallback + + Abstract type of callbacks to be called every epoch. +=# +abstract AbstractEpochCallback <: AbstractCallback + +type BatchCallback <: AbstractBatchCallback + frequency :: Int + call_on_0 :: Bool + callback :: Function +end + +#=doc +.. function:: every_n_batch(callback :: Function, n :: Int; call_on_0 = false) + + A convenient function to construct a callback that runs every ``n`` mini-batches. + + :param Int call_on_0: keyword argument, default false. Unless set, the callback + will **not** be run on batch 0. + + For example, the :func:`speedometer` callback is defined as + + .. code-block:: julia + + every_n_iter(frequency, call_on_0=true) do state :: OptimizationState + if state.curr_batch == 0 + # reset timer + else + # compute and print speed + end + end + + :seealso: :func:`every_n_epoch`, :func:`speedometer`. +=# +function every_n_batch(callback :: Function, n :: Int; call_on_0 :: Bool = false) + BatchCallback(n, call_on_0, callback) +end +function Base.call(cb :: BatchCallback, state :: OptimizationState) + if state.curr_batch == 0 + if cb.call_on_0 + cb.callback(state) + end + elseif state.curr_batch % cb.frequency == 0 + cb.callback(state) + end +end + +#=doc +.. 
function:: speedometer(; frequency=50) + + Create an :class:`AbstractBatchCallback` that measure the training speed + (number of samples processed per second) every k mini-batches. + + :param Int frequency: keyword argument, default 50. The frequency (number of + min-batches) to measure and report the speed. +=# +function speedometer(;frequency::Int=50) + cl_tic = 0 + every_n_batch(frequency, call_on_0=true) do state :: OptimizationState + if state.curr_batch == 0 + # reset timer + cl_tic = time() + else + speed = frequency * state.batch_size / (time() - cl_tic) + info(format("Speed: {1:>6.2f} samples/sec", speed)) + cl_tic = time() + end + end +end + + +type EpochCallback <: AbstractEpochCallback + frequency :: Int + call_on_0 :: Bool + callback :: Function +end + +#=doc +.. function:: every_n_epoch(callback :: Function, n :: Int; call_on_0 = false) + + A convenient function to construct a callback that runs every ``n`` full data-passes. + + :param Int call_on_0: keyword argument, default false. Unless set, the callback + will **not** be run on epoch 0. Epoch 0 means no training has been performed + yet. This is useful if you want to inspect the randomly initialized model + that has not seen any data yet. + + :seealso: :func:`every_n_iter`. +=# +function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) + EpochCallback(n, call_on_0, callback) +end +function Base.call(cb :: EpochCallback, model :: Any, state :: OptimizationState) + if state.curr_epoch == 0 + if cb.call_on_0 + cb.callback(model, state) + end + elseif state.curr_epoch % cb.frequency == 0 + cb.callback(model, state) + end +end + +#=doc +.. function:: do_checkpoint(prefix; frequency=1, save_epoch_0=false) + + Create an :class:`AbstractEpochCallback` that save checkpoints of the model to disk. + The checkpoints can be loaded back later on. + + :param AbstractString prefix: the prefix of the filenames to save the model. 
The model + architecture will be saved to prefix-symbol.json, while the weights will be saved + to prefix-0012.params, for example, for the 12-th epoch. + :param Int frequency: keyword argument, default 1. The frequency (measured in epochs) to + save checkpoints. + :param Bool save_epoch_0: keyword argument, default false. Whether we should save a + checkpoint for epoch 0 (model initialized but not seen any data yet). +=# +function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) + mkpath(dirname(prefix)) + every_n_epoch(frequency, call_on_0=save_epoch_0) do model, state + save_checkpoint(model, prefix, state) + end +end diff --git a/src/context.jl-e b/src/context.jl-e new file mode 100644 index 000000000000..1e96c305fb04 --- /dev/null +++ b/src/context.jl-e @@ -0,0 +1,44 @@ +#=doc +Context +======= +=# +@enum CONTEXT_TYPE CPU=1 GPU=2 CPU_PINNED=3 + +#=doc +.. class:: Context + + A context describes the device type and id on which computation should be carried on. +=# +immutable Context + device_type :: CONTEXT_TYPE + device_id :: Int +end +Context(dev_type :: Union{CONTEXT_TYPE, Int}, dev_id :: Int = 0) = + Context(convert(CONTEXT_TYPE, dev_type), dev_id) + +function Base.show(io :: IO, ctx :: Context) + print(io, "$(ctx.device_type)$(ctx.device_id)") +end + +#=doc +.. function:: cpu(dev_id=0) + + :param Int dev_id: the CPU id. + + Get a CPU context with a specific id. ``cpu()`` is usually the default context for many + operations when no context is specified. +=# +function cpu(dev_id::Int=0) + return Context(CPU, dev_id) +end + +#=doc +.. function:: gpu(dev_id=0) + + :param Int dev_id: the GPU device id. + + Get a GPU context with a specific id. The K GPUs on a node is typically numbered as 0,...,K-1. +=# +function gpu(dev_id::Int=0) + return Context(GPU, dev_id) +end diff --git a/src/executor.jl b/src/executor.jl index 6dea17763101..5844a62e446c 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -6,13 +6,13 @@ Executor #=doc .. 
class:: Executor - An executor is a realization of a symbolic architecture defined by a :class:`Node`. + An executor is a realization of a symbolic architecture defined by a :class:`SymbolicNode`. The actual forward and backward computation specified by the network architecture can be carried out with an executor. =# type Executor handle :: MX_ExecutorHandle - symbol :: Node + symbol :: SymbolicNode arg_arrays :: Vector{NDArray} grad_arrays :: Vector{Union{Void,NDArray}} aux_arrays :: Vector{NDArray} @@ -20,7 +20,7 @@ type Executor arg_dict :: Dict{Base.Symbol, NDArray} aux_dict :: Dict{Base.Symbol, NDArray} end -function Executor(hdr :: MX_ExecutorHandle, symbol :: Node, +function Executor(hdr :: MX_ExecutorHandle, symbol :: SymbolicNode, arg_arrays :: Vector{NDArray}, grad_arrays :: Vector{Union{Void,NDArray}}, aux_arrays :: Vector{NDArray}) # get output arrays @@ -73,9 +73,9 @@ end #=doc .. function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) - Create an :class:`Executor` by binding a :class:`Node` to concrete :class:`NDArray`. + Create an :class:`Executor` by binding a :class:`SymbolicNode` to concrete :class:`NDArray`. - :param Node sym: the network architecture describing the computation graph. + :param SymbolicNode sym: the network architecture describing the computation graph. :param Context ctx: the context on which the computation should run. :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete arrays for all the inputs in the network architecture. 
The inputs typically include @@ -86,7 +86,7 @@ end :param grad_req: =# @enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 -function bind(self :: Node, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; +function bind(self :: SymbolicNode, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), aux_states :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), grad_req :: Union{GRAD_REQ,Vector{GRAD_REQ},Dict{Base.Symbol,GRAD_REQ}} = GRAD_WRITE) @@ -116,7 +116,7 @@ function bind(self :: Node, ctx :: Context, args :: Union{Vector{NDArray},Dict{B executor = Executor(MX_ExecutorHandle(ref_hdr[]), self, args, args_grad, aux_states) end -function bind(self :: Node; kwargs...) +function bind(self :: SymbolicNode; kwargs...) kwargs = Dict(kwargs) @assert(haskey(kwargs, :args), "Must specify args") args = pop!(kwargs, :args) @@ -128,7 +128,7 @@ function bind(self :: Node; kwargs...) bind(self, context, args; kwargs...) end -function simple_bind(self :: Node, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) +function simple_bind(self :: SymbolicNode, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) arg_shapes, out_shapes, aux_shapes = infer_shape(self; kwargs...) @assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") diff --git a/src/executor.jl-e b/src/executor.jl-e new file mode 100644 index 000000000000..6dea17763101 --- /dev/null +++ b/src/executor.jl-e @@ -0,0 +1,197 @@ +#=doc +Executor +======== +=# + +#=doc +.. class:: Executor + + An executor is a realization of a symbolic architecture defined by a :class:`Node`. + The actual forward and backward computation specified by the network architecture can + be carried out with an executor. 
+=# +type Executor + handle :: MX_ExecutorHandle + symbol :: Node + arg_arrays :: Vector{NDArray} + grad_arrays :: Vector{Union{Void,NDArray}} + aux_arrays :: Vector{NDArray} + outputs :: Vector{NDArray} + arg_dict :: Dict{Base.Symbol, NDArray} + aux_dict :: Dict{Base.Symbol, NDArray} +end +function Executor(hdr :: MX_ExecutorHandle, symbol :: Node, + arg_arrays :: Vector{NDArray}, grad_arrays :: Vector{Union{Void,NDArray}}, + aux_arrays :: Vector{NDArray}) + # get output arrays + ref_size = Ref{MX_uint}(0) + ref_hdrs = Ref{Ptr{MX_handle}}(0) + @mxcall(:MXExecutorOutputs, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_handle}}), + hdr, ref_size, ref_hdrs) + out_hdrs = pointer_to_array(ref_hdrs[], ref_size[]) + out_arrays = [NDArray(MX_NDArrayHandle(x)) for x in out_hdrs] + + arg_names = list_arguments(symbol) + @assert(length(arg_names) == length(unique(arg_names)), "Duplicated names in arguments: $arg_names") + arg_dict = Dict{Base.Symbol,NDArray}(zip(arg_names, arg_arrays)) + + aux_names = list_auxiliary_states(symbol) + @assert(length(aux_names) == length(unique(aux_names)), "Duplicated names in auxiliary states: $aux_names") + aux_dict = Dict{Base.Symbol,NDArray}(zip(aux_names, aux_arrays)) + + Executor(hdr, symbol, arg_arrays, grad_arrays, aux_arrays, out_arrays, arg_dict, aux_dict) +end + +function Base.unsafe_convert(::Type{MX_handle}, obj::Executor) + Base.unsafe_convert(MX_handle, obj.handle) +end +Base.convert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) +Base.cconvert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) + +function _get_ndarray_inputs(arg_key::AbstractString, args::Vector{NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) + @assert(length(args) == length(arg_names), "Length of $arg_key does not match number of arguments") + return (MX_handle[args...], args) +end +function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) + 
args_vec = map(arg_names) do name + arr = get(args, name, nothing) + if !allow_missing + @assert(!isa(arr, Void), "Must specify all arguments in $arg_key ($name is missing)") + end + arr + end + # help the type inference + if allow_missing + args_vec = Union{NDArray,Void}[args_vec...] + else + args_vec = NDArray[args_vec...] + end + args_hdr = MX_handle[(isa(x,Void) ? MX_handle(0) : x) for x in args_vec] + return (args_hdr, args_vec) +end + +#=doc +.. function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) + + Create an :class:`Executor` by binding a :class:`Node` to concrete :class:`NDArray`. + + :param Node sym: the network architecture describing the computation graph. + :param Context ctx: the context on which the computation should run. + :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete + arrays for all the inputs in the network architecture. The inputs typically include + network parameters (weights, bias, filters, etc.), data and labels. See :func:`list_arguments` + and :func:`infer_shape`. 
+ :param args_grad: TODO + :param aux_states: + :param grad_req: +=# +@enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 +function bind(self :: Node, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; + args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), + aux_states :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), + grad_req :: Union{GRAD_REQ,Vector{GRAD_REQ},Dict{Base.Symbol,GRAD_REQ}} = GRAD_WRITE) + + arg_names = list_arguments(self) + + args_hdr, args = _get_ndarray_inputs("args", args, arg_names, false) + args_grad_hdr, args_grad = _get_ndarray_inputs("args_grad", args_grad, arg_names, true) + aux_args_hdr, aux_states = _get_ndarray_inputs("aux_states", aux_states, list_auxiliary_states(self), false) + + if isa(grad_req, GRAD_REQ) + reqs = MX_uint[grad_req for i=1:length(args)] + elseif isa(grad_req, Vector{GRAD_REQ}) + @assert(length(grad_req) == length(args)) + reqs = MX_uint[grad_req...] + elseif isa(grad_req, Dict{Base.Symbol, GRAD_REQ}) + reqs = MX_uint[get(grad_req, name, GRAD_NOP) for name in arg_names] + end + + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXExecutorBind, + (MX_handle, Cint, Cint, MX_uint, Ptr{MX_handle}, Ptr{MX_handle}, Ptr{MX_uint}, + MX_uint, Ptr{MX_handle}, Ref{MX_handle}), + self, ctx.device_type, ctx.device_id, length(args), args_hdr, + args_grad_hdr, reqs, length(aux_states), aux_args_hdr, ref_hdr) + args_grad = convert(Vector{Union{Void,NDArray}}, args_grad) + executor = Executor(MX_ExecutorHandle(ref_hdr[]), self, + args, args_grad, aux_states) +end +function bind(self :: Node; kwargs...) + kwargs = Dict(kwargs) + @assert(haskey(kwargs, :args), "Must specify args") + args = pop!(kwargs, :args) + if haskey(kwargs, :context) + context = pop!(kwargs, :context) + else + context = cpu() + end + bind(self, context, args; kwargs...) +end + +function simple_bind(self :: Node, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) 
+ arg_shapes, out_shapes, aux_shapes = infer_shape(self; kwargs...) + @assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") + + arg_arrays = NDArray[zeros(shape, ctx) for shape in arg_shapes] + arg_names = list_arguments(self) + if grad_req == GRAD_NOP + grad_arrays = Dict{Base.Symbol,NDArray}() + else + provided_data_names = [x[1] for x in kwargs] + grad_arrays = Dict{Base.Symbol,NDArray}() + for (name, shape) in zip(arg_names, arg_shapes) + # if not in provided data, should be parameters + if !in(name, provided_data_names) + grad_arrays[name] = zeros(shape, ctx) + end + end + end + + aux_arrays = [zeros(shape, ctx) for shape in aux_shapes] + return bind(self, ctx, arg_arrays, args_grad=grad_arrays, grad_req=grad_req, aux_states=aux_arrays) +end + + +function forward(self :: Executor; is_train::Bool=false, kwargs...) + for (k,v) in kwargs + @assert(k ∈ self.arg_dict, "Unknown argument $k") + @assert(isa(v, NDArray), "Keyword argument $k must be an NDArray") + copy!(self.arg_dict[k], v) + end + + @mxcall(:MXExecutorForward, (MX_handle, Cint), self, is_train) +end + +function backward(self :: Executor) + backward(self, NDArray[]) +end +function backward(self :: Executor, out_grad :: NDArray) + backward(self, [out_grad]) +end +function backward(self :: Executor, out_grads :: Vector{NDArray}) + out_grads = MX_handle[out_grads...] 
+ @mxcall(:MXExecutorBackward, (MX_handle, MX_uint, Ptr{MX_handle}), self, length(out_grads), out_grads) +end + + +function copy_params_from(self::Executor, arg_params::Dict{Base.Symbol,NDArray}, + aux_params::Union{Void,Dict{Base.Symbol,NDArray}}=nothing; + allow_extra_params::Bool=false) + for (name, array) in arg_params + if haskey(self.arg_dict, name) + copy!(self.arg_dict[name], array) + else + @assert(allow_extra_params, "Extra params $name not in the arguments") + end + end + + if !isa(aux_params, Void) + for (name, array) in aux_params + if haskey(self.aux_dict, name) + copy!(self.aux_dict[name], array) + else + @assert(allow_extra_params, "Extra auxiliary state $name not recognized") + end + end + end +end diff --git a/src/initializer.jl-e b/src/initializer.jl-e new file mode 100644 index 000000000000..8f78bfba9367 --- /dev/null +++ b/src/initializer.jl-e @@ -0,0 +1,117 @@ +#=doc +Initializers +============ +Interface +--------- +=# + +#=doc +.. class:: AbstractInitializer + + The abstract base class for all initializers. + +To define a new initializer, it is +enough to derive a new type, and implement one or more of the following methods: + +.. function:: _init_weight(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. function:: _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + +Or, if full behavior customization is needed, override the following function + +.. 
function:: call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +=# +abstract AbstractInitializer + +function call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + strname = string(name) + if endswith(strname, "bias") + _init_bias(self, name, array) + elseif endswith(strname, "gamma") + _init_gamma(self, name, array) + elseif endswith(strname, "beta") + _init_beta(self, name, array) + elseif endswith(strname, "weight") + _init_weight(self, name, array) + elseif endswith(strname, "moving_mean") + _init_zero(self, name, array) + elseif endswith(strname, "moving_var") + _init_zero(self, name, array) + else + _init_default(self, name, array) + end +end + +function _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + array[:] = 0 +end +function _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + array[:] = 1 +end +function _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + array[:] = 0 +end +function _init_zero(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + array[:] = 0 +end + +#=doc +Built-in initializers +--------------------- +=# +#=doc +.. class:: UniformInitializer + + Initialize weights according to a uniform distribution within the provided scale. +=# +immutable UniformInitializer <: AbstractInitializer + scale :: AbstractFloat +end +#=doc +.. function UniformInitializer(scale=0.07) + + Construct a :class:`UniformInitializer` with the specified scale. +=# +UniformInitializer() = UniformInitializer(0.07) + +function _init_weight(self :: UniformInitializer, name :: Base.Symbol, array :: NDArray) + rand!(-self.scale, self.scale, array) +end + +#=doc +.. class:: NormalInitializer + + Initialize weights according to a univariate Gaussian distribution. +=# +immutable NormalInitializer <: AbstractInitializer + μ :: AbstractFloat + σ :: AbstractFloat +end +#=doc +.. 
function:: NormalInitializer(; mu=0, sigma=0.01) + + Construct a :class:`NormalInitializer` with mean ``mu`` and variance ``sigma``. +=# +NormalInitializer(; mu=0, sigma=0.01) = NormalInitializer(mu, sigma) + +function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) + randn!(self.μ, self.σ, array) +end + +#=doc +.. class:: XaiverInitializer + + The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding + the difficulty of training deep feedforward neural networks*. +=# +immutable XaiverInitializer <: AbstractInitializer +end + +function _init_weight(self :: XaiverInitializer, name :: Base.Symbol, array :: NDArray) # must dispatch on XaiverInitializer, otherwise it replaces the NormalInitializer method above + dims = size(array) + fan_in = prod(dims[2:end]) + fan_out = dims[1] + scale = sqrt(3 / (fan_in + fan_out)) + rand!(-scale, scale, array) +end diff --git a/src/io.jl b/src/io.jl index 5c59e96bb611..71bbc38a7f50 100644 --- a/src/io.jl +++ b/src/io.jl @@ -35,7 +35,7 @@ and split it into mini-batches so that the model can consume the data in a unifo training stage, both *data* and *label* will be feeded into the model, while during prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and of any shapes. The provided data and label names here should match the input names in a target - :class:`Node`. + :class:`SymbolicNode`. A data provider should also implement the Julia iteration interface, in order to allow iterating through the data set. The provider will be called in the following way: diff --git a/src/io.jl-e b/src/io.jl-e new file mode 100644 index 000000000000..5c59e96bb611 --- /dev/null +++ b/src/io.jl-e @@ -0,0 +1,641 @@ +#=doc +Data Providers +============== +Interface +--------- + +Data providers are wrappers that load external data, be it images, text, or general tensors, +and split it into mini-batches so that the model can consume the data in a uniformed way. +=# + +#=doc +.. class:: AbstractDataProvider + + The root type for all data provider. 
A data provider should implement the following interfaces: + + .. function:: get_batch_size(provider) -> Int + + :param AbstractDataProvider provider: the data provider. + :return: the mini-batch size of the provided data. All the provided data should have the + same mini-batch size (i.e. the last dimension). + + .. function:: provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} + + :param AbstractDataProvider provider: the data provider. + :return: a vector of (name, shape) pairs describing the names of the data it provides, and + the corresponding shapes. + + .. function:: provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} + + :param AbstractDataProvider provider: the data provider. + :return: a vector of (name, shape) pairs describing the names of the labels it provides, and + the corresponding shapes. + + The difference between *data* and *label* is that during + training stage, both *data* and *label* will be feeded into the model, while during + prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and + of any shapes. The provided data and label names here should match the input names in a target + :class:`Node`. + + A data provider should also implement the Julia iteration interface, in order to allow iterating + through the data set. The provider will be called in the following way: + + .. code-block:: julia + + for batch in eachbatch(provider) + data = get_data(provider, batch) + end + + which will be translated by Julia compiler into + + .. code-block:: julia + + state = Base.start(eachbatch(provider)) + while !Base.done(provider, state) + (batch, state) = Base.next(provider, state) + data = get_data(provider, batch) + end + + By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface + is implemented on the provider type itself. But the extra layer of abstraction allows us to + implement a data provider easily via a Julia ``Task`` coroutine. 
+ The detailed interface functions are listed below: + + .. function:: Base.eltype(provider) -> AbstractDataBatch + + :param AbstractDataProvider provider: the data provider. + :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. + + .. function:: Base.start(provider) -> AbstractDataProviderState + + :param AbstractDataProvider provider: the data provider. + + This function is always called before iterating into the dataset. It should initialize + the iterator, reset the index, and do data shuffling if needed. + + .. function:: Base.done(provider, state) -> Bool + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataProviderState state: the state returned by :func:`Base.start` or :func:`Base.next`. + :return: true if there is no more data to iterate in this dataset. + + .. function:: Base.next(provider, state) -> (AbstractDataBatch, AbstractDataProviderState) + + :param AbstractDataProvider provider: the data provider. + :return: the current data batch, and the state for the next iteration. + + Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that + is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this + case, you can safely assume that + + * :func:`Base.start` will always be called, and called only once before the iteration starts. + * :func:`Base.done` will always be called at the beginning of every iteration and always be called once. + * If :func:`Base.done` returns true, the iteration will stop, until the next round, again, starting with + a call to :func:`Base.start`. + * :func:`Base.next` will always be called only once in each iteration. It will always be called after + one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will + not be called. + + With those assumptions, it will be relatively easy to adapt any existing iterator. 
See the implementation + of the built-in :class:`MXDataProvider` for example. + + .. caution:: + + Please do not use the one data provider simultaneously in two different places, either in parallel, + or in a nested loop. For example, the behavior for the following code is undefined + + .. code-block:: julia + + for batch in data + # updating the parameters + + # now let's test the performance on the training set + for b2 in data + # ... + end + end +=# +abstract AbstractDataProvider + +#=doc +.. class:: AbstractDataProviderState + + Base type for data provider states. +=# +abstract AbstractDataProviderState + +#=doc +.. class:: AbstractDataBatch + + Base type for a data mini-batch. It should implement the following interfaces: + + .. function:: count_samples(provider, batch) -> Int + + :param AbstractDataBatch batch: the data batch object. + :return: the number of samples in this batch. This number should be greater than 0, but + less than or equal to the batch size. This is used to indicate at the end of + the data set, there might not be enough samples for a whole mini-batch. + + .. function:: get_data(provider, batch) -> Vector{NDArray} + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :return: a vector of data in this batch, should be in the same order as declared in + :func:`provide_data() `. + + The last dimension of each :class:`NDArray` should always match the batch_size, even when + :func:`count_samples` returns a value less than the batch size. In this case, + the data provider is free to pad the remaining contents with any value. + + .. function:: get_label(provider, batch) -> Vector{NDArray} + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :return: a vector of labels in this batch. Similar to :func:`get_data`. + + + The following utility functions will be automatically defined. + + .. 
function:: get(provider, batch, name) -> NDArray + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param Base.Symbol name: the name of the data to get, should be one of the names + provided in either :func:`provide_data() ` + or :func:`provide_label() `. + :return: the corresponding data array corresponding to that name. + + .. function:: load_data!(provider, batch, targets) + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param targets: the targets to load data into. + :type targets: Vector{Vector{SlicedNDArray}} + + The targets is a list of the same length as number of data provided by this provider. + Each element in the list is a list of :class:`SlicedNDArray`. This list described a + spliting scheme of this data batch into different slices, each slice is specified by + a slice-ndarray pair, where *slice* specify the range of samples in the mini-batch + that should be loaded into the corresponding *ndarray*. + + This utility function is used in data parallelization, where a mini-batch is splited + and computed on several different devices. + + .. function:: load_label!(provider, batch, targets) + + :param AbstractDataProvider provider: the data provider. + :param AbstractDataBatch batch: the data batch object. + :param targets: the targets to load label into. + :type targets: Vector{Vector{SlicedNDArray}} + + The same as :func:`load_data!`, except that this is for loading labels. +=# +abstract AbstractDataBatch + +#=doc +.. class:: DataBatch + + A basic subclass of :class:`AbstractDataBatch`, that implement the interface by + accessing member fields. +=# +type DataBatch <: AbstractDataBatch + data :: Vector{NDArray} + label :: Vector{NDArray} + count :: Int +end +count_samples(batch :: DataBatch) = batch.count +get_data(batch :: DataBatch) = batch.data +get_label(batch :: DataBatch) = batch.label + +#=doc +.. 
class:: SlicedNDArray + + A alias type of ``Tuple{UnitRange{Int},NDArray}``. +=# +typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} + +function _load_general!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, + targets :: Vector{Vector{SlicedNDArray}}, loader::Function) + data = loader(provider, batch) + for (d_src, d_targets) in zip(data, targets) + for (slice_idx, d_dst) in d_targets + copy!(d_dst, slice(d_src, slice_idx)) + end + end +end +function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, + targets :: Vector{Vector{SlicedNDArray}}) + _load_general!(provider, batch, targets, get_data) +end +function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, + targets :: Vector{Vector{SlicedNDArray}}) + _load_general!(provider, batch, targets, get_label) +end + +function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{NDArray}) + for (src, dst) in zip(get_data(provider, batch), targets) + copy!(dst, src) + end +end +function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{NDArray}) + for (src, dst) in zip(get_label(provider, batch), targets) + copy!(dst, src) + end +end + +import Base.get +function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name :: Base.Symbol) + for (idx, (k, s)) in enumerate(provide_data(provider)) + if name == k + return get_data(provider, batch)[idx] + end + end + for (idx, (k, s)) in enumerate(provide_label(provider)) + if name == k + return get_label(provider, batch)[idx] + end + end + error("$name is not provided by this data provider") +end + +eachbatch(provider :: AbstractDataProvider) = provider + +#=doc +Built-in data providers +----------------------- +=# + +################################################################################ +#=doc +.. class:: ArrayDataProvider + + A convenient tool to iterate :class:`NDArray` or Julia ``Array``. 
+=# +type ArrayDataProvider <: AbstractDataProvider + data_arrays :: Vector{Array{MX_float}} + data_names :: Vector{Base.Symbol} + label_arrays :: Vector{Array{MX_float}} + label_names :: Vector{Base.Symbol} + batch_size :: Int + sample_count :: Int + shuffle :: Bool + data_padding :: MX_float + label_padding :: MX_float + + data_batch :: Vector{NDArray} + label_batch :: Vector{NDArray} +end + +#=doc +.. function:: ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) + + Construct a data provider from :class:`NDArray` or Julia Arrays. + + :param data: the data, could be + + - a :class:`NDArray`, or a Julia Array. This is equivalent to ``:data => data``. + - a name-data pair, like ``:mydata => array``, where ``:mydata`` is the name of the data + and ``array`` is an :class:`NDArray` or a Julia Array. + - a list of name-data pairs. + + :param label: the same as the ``data`` parameter. When this argument is omitted, the constructed + provider will provide no labels. + :param Int batch_size: the batch size, default is 0, which means treating the whole array as a + single mini-batch. + :param Bool shuffle: turn on if the data should be shuffled at every epoch. + :param Real data_padding: when the mini-batch goes beyond the dataset boundary, there might + be less samples to include than a mini-batch. This value specify a scalar to pad the + contents of all the missing data points. + :param Real label_padding: the same as ``data_padding``, except for the labels. +=# +# Julia's type system is sometimes very frustrating. You cannot specify a function +# with argument Vector{Pair} to expect to be matched when calling with the parameter +# [:foo => zeros(2,3), :bar => zeros(3)] because the type inference gives very specific +# results, about the parametric type in the Pair{T1,T2} type, thus does not match the +# generic Pair type. In general, Int <: Number but Vector{Int} <: Vector{Number} is not +# true. So let us just use Any here... 
+function ArrayDataProvider(data::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) + ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle, data_padding=data_padding, label_padding=label_padding) +end +function ArrayDataProvider(data::Any, label::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) + asarr{T}(arr :: Array{T}) = convert(Array{MX_float}, arr) + asarr(arr :: NDArray) = copy(arr) + + if isa(data, Union{NDArray, Array}) && eltype(data) <: Real + data_names = [:data] + data_arrays = Array{MX_float}[asarr(data)] + elseif isa(data, Pair) + @assert isa(data.first, Base.Symbol) && isa(data.second, Union{NDArray, Array}) + data_names = [data.first] + data_arrays = Array{MX_float}[asarr(data.second)] + elseif isa(data, Vector) || isa(data, Tuple) + map(data) do d + @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) + end + data_names = Base.Symbol[d.first for d in data] + data_arrays = Array{MX_float}[asarr(d.second) for d in data] + else + error("Invalid data argument type") + end + + if isa(label, Union{NDArray, Array}) && eltype(label) <: Real + label_names = [:softmax_label] + label_arrays = Array{MX_float}[asarr(label)] + elseif isa(label, Pair) + @assert isa(label.first, Base.Symbol) && isa(label.second, Union{NDArray, Array}) + label_names = [label.first] + label_arrays = Array{MX_float}[asarr(label.second)] + elseif isa(label, Vector) || isa(label, Tuple) + map(label) do d + @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) + end + label_names = Base.Symbol[d.first for d in label] + label_arrays = Array{MX_float}[asarr(d.second) for d in label] + else + error("Invalid label argument type") + end + + @assert length(data_arrays) > 0 + sample_count = size(data_arrays[1])[end] + for i = 1:length(data_names) + @assert(size(data_arrays[i])[end] == sample_count, + "Number of samples in 
$(data_names[i]) is mismatch with $(data_names[1])") + end + for i = 1:length(label_names) + @assert(size(label_arrays[i])[end] == sample_count, + "Number of samples in $(label_names[i]) is mismatch with $(data_names[1])") + end + + if batch_size == 0 + batch_size = sample_count + end + @assert 0 < batch_size <= sample_count + + function gen_batch_nds(arrs :: Vector{Array{MX_float}}, bsize :: Int) + map(arrs) do arr + shape = size(arr) + empty(shape[1:end-1]..., bsize) + end + end + + data_batch = gen_batch_nds(data_arrays, batch_size) + label_batch = gen_batch_nds(label_arrays, batch_size) + + # reshape data and labels into 2D tensors, so that it is easier to work with them + data_arrays = map(data_arrays) do arr + reshape(arr, prod(size(arr)[1:end-1]), size(arr)[end]) + end + label_arrays = map(label_arrays) do arr + reshape(arr, prod(size(arr)[1:end-1]), size(arr)[end]) + end + + ArrayDataProvider(data_arrays, data_names, label_arrays, label_names, batch_size, + sample_count, shuffle, data_padding, label_padding, data_batch, label_batch) +end + +function provide_data(provider::ArrayDataProvider) + return collect(zip(provider.data_names, map(size, provider.data_batch))) +end +function provide_label(provider::ArrayDataProvider) + return collect(zip(provider.label_names, map(size, provider.label_batch))) +end +get_batch_size(provider::ArrayDataProvider) = provider.batch_size + +immutable ArrayDataProviderState <: AbstractDataProviderState + curr_idx :: Int +end + +function Base.eltype(provider :: ArrayDataProvider) + ArrayDataBatch # iteration yields batches (see Base.next), not iterator states +end + +function Base.start(provider :: ArrayDataProvider) + if provider.shuffle + # re-shuffle all data + idx_perm = randperm(provider.sample_count) + provider.data_arrays = map(x->x[:,idx_perm], provider.data_arrays) + provider.label_arrays = map(x->x[:,idx_perm], provider.label_arrays) + end + + return ArrayDataProviderState(1) +end + +function Base.done(provider::ArrayDataProvider, state :: ArrayDataProviderState) + return 
state.curr_idx > provider.sample_count +end + +immutable ArrayDataBatch <: AbstractDataBatch + idx :: UnitRange{Int} +end +function Base.next(provider :: ArrayDataProvider, state :: ArrayDataProviderState) + idx = state.curr_idx:min(state.curr_idx+provider.batch_size-1, provider.sample_count) + return (ArrayDataBatch(idx), ArrayDataProviderState(idx.stop+1)) +end + +function count_samples(provider :: ArrayDataProvider, batch :: ArrayDataBatch) + return length(batch.idx) +end + +function get_data(provider :: ArrayDataProvider, batch :: ArrayDataBatch) + for (src, dst) in zip(provider.data_arrays, provider.data_batch) + copy_ignore_shape!(dst[1:length(batch.idx)], src[:, batch.idx]) + if length(batch.idx) < provider.batch_size + dst[length(batch.idx)+1:provider.batch_size] = provider.data_padding + end + end + return provider.data_batch +end +function get_label(provider :: ArrayDataProvider, batch :: ArrayDataBatch) + for (src, dst) in zip(provider.label_arrays, provider.label_batch) + copy_ignore_shape!(dst[1:length(batch.idx)], src[:, batch.idx]) + if length(batch.idx) < provider.batch_size + dst[length(batch.idx)+1:provider.batch_size] = provider.label_padding + end + end + return provider.label_batch +end + + +#=doc +libmxnet data providers +----------------------- +=# + +################################################################################ +#=doc +.. class:: MXDataProvider + + A data provider that wrap built-in data iterators from libmxnet. See below for + a list of built-in data iterators. 
+=# +type MXDataProvider <: AbstractDataProvider + handle :: MX_DataIterHandle + data_shape :: Vector{Tuple{Base.Symbol, Tuple}} + label_shape:: Vector{Tuple{Base.Symbol, Tuple}} + batch_size :: Int + + # those two a auxiliary variables to help avoid calling reset + # but still pre-fetch first batch to get shape information + first_epoch:: Bool + first_batch:: Bool +end + +function _reset_data_iter(handle :: MX_DataIterHandle) + @mxcall(:MXDataIterBeforeFirst, (MX_handle,), handle) +end +function _iter_next(handle :: MX_DataIterHandle) + ref_ret = Ref{Cint}(0) + @mxcall(:MXDataIterNext, (MX_handle, Ref{Cint}), handle, ref_ret) + return Bool(ref_ret[]) +end +function _get_data(handle :: MX_DataIterHandle) + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXDataIterGetData, (MX_handle, Ref{MX_handle}), handle, ref_hdr) + return NDArray(MX_NDArrayHandle(ref_hdr[]), false) +end +function _get_label(handle :: MX_DataIterHandle) + ref_hdr = Ref{MX_handle}(0) + @mxcall(:MXDataIterGetLabel, (MX_handle, Ref{MX_handle}), handle, ref_hdr) + return NDArray(MX_NDArrayHandle(ref_hdr[]), false) +end + +function MXDataProvider(handle :: MX_DataIterHandle; + data_name :: Base.Symbol=:data, + label_name :: Union{Base.Symbol,Void}=:softmax_label, + kwargs...) 
# for convenience, we ignore the rest keyword arguments + # init iterator, load the first batch and get shapes + @assert(_iter_next(handle), "Failed to load the first batch in MXDataProvider") + data_shape = Tuple{Base.Symbol, Tuple}[(data_name, size(_get_data(handle)))] + if !isa(label_name, Void) + label_shape = Tuple{Base.Symbol, Tuple}[(label_name::Base.Symbol, size(_get_label(handle)))] + else + label_shape = Tuple{Base.Symbol, Tuple}[] + end + + MXDataProvider(handle, data_shape, label_shape, data_shape[1][2][end], true, true) +end + +provide_data(provider::MXDataProvider) = provider.data_shape +provide_label(provider::MXDataProvider) = provider.label_shape +get_batch_size(provider::MXDataProvider) = provider.batch_size + +type MXDataProviderState <: AbstractDataProviderState + has_next :: Bool +end +immutable MXDataBatch <: AbstractDataBatch +end + +function Base.eltype(provider :: MXDataProvider) + MXDataBatch +end +function Base.start(provider :: MXDataProvider) + if !provider.first_epoch + _reset_data_iter(provider.handle) + else + provider.first_epoch = false + end + + return MXDataProviderState(true) +end +function Base.done(provider :: MXDataProvider, state :: MXDataProviderState) + if provider.first_batch + state.has_next = true + provider.first_batch = false + else + state.has_next = _iter_next(provider.handle) + end + return !state.has_next +end +function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) + return (MXDataBatch(), state) +end + +function get_data(provider :: MXDataProvider, batch :: MXDataBatch) + return NDArray[_get_data(provider.handle)] +end +function get_label(provider :: MXDataProvider, batch :: MXDataBatch) + return NDArray[_get_label(provider.handle)] +end +function count_samples(provider :: MXDataProvider, batch :: MXDataBatch) + ref_pad = Ref{Cint}(0) + @mxcall(:MXDataIterGetPadNum, (MX_handle, Ref{Cint}), provider.handle, ref_pad) + return provider.batch_size - Int(ref_pad[]) +end + +#=doc 
+**autogen:EMBED:io:EMBED:autogen** +=# +function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) + ref_name = Ref{char_p}(0) + ref_desc = Ref{char_p}(0) + ref_narg = Ref{MX_uint}(0) + ref_arg_names = Ref{char_pp}(0) + ref_arg_types = Ref{char_pp}(0) + ref_arg_descs = Ref{char_pp}(0) + + @mxcall(:MXDataIterGetIterInfo, + (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), + hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) + + iter_name = symbol(bytestring(ref_name[])) + + if gen_docs + if endswith(string(iter_name), "Iter") + f_desc = "Can also be called with the alias ``$(string(iter_name)[1:end-4] * "Provider")``.\n" + else + f_desc = "" + end + f_desc *= bytestring(ref_desc[]) * "\n\n" + f_desc *= ":param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data.\n" + f_desc *= ":param Base.Symbol label_name: keyword argument, default ``:softmax_label``. " * + "The name of the label. Could be ``nothing`` if no label is presented in this dataset.\n\n" + f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) + f_desc *= ":return: the constructed :class:`MXDataProvider`." + return (iter_name, f_desc) + end + + defun = quote + function $iter_name(; kwargs...) + arg_keys = AbstractString[string(k) for (k,v) in kwargs] + arg_vals = AbstractString[dump_mx_param(v) for (k,v) in kwargs] + ref_hdr = Ref{MX_handle}(0) + + @mxcall(:MXDataIterCreateIter, (MX_handle, MX_uint, char_pp, char_pp, Ref{MX_handle}), + $hdr, length(arg_keys), arg_keys, arg_vals, ref_hdr) + + return MXDataProvider(MX_DataIterHandle(ref_hdr[]); kwargs...) 
+ end + end + eval(defun) + + # add an alias XXXProvider => XXXIter + if endswith(string(iter_name), "Iter") + alias_name = symbol(string(iter_name)[1:end-4] * "Provider") + eval(:($alias_name = $iter_name)) + end +end + +function _import_io_iterators(;gen_docs::Bool=false) + n_ref = Ref{MX_uint}(0) + h_ref = Ref{Ptr{MX_handle}}(0) + @mxcall(:MXListDataIters, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) + + n_creators = n_ref[] + h_creators = pointer_to_array(h_ref[], n_creators) + + if gen_docs + docs = Dict{Base.Symbol, AbstractString}() + end + + for i = 1:n_creators + creator_hdr = h_creators[i] + ret = _define_data_iter_creator(creator_hdr; gen_docs=gen_docs) + if gen_docs + docs[ret[1]] = ret[2] + end + end + + if gen_docs + return docs + end +end diff --git a/src/kvstore.jl b/src/kvstore.jl index d52433f567b2..1d8c98935768 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -121,7 +121,7 @@ end function set_optimizer(self :: KVStore, optimizer :: AbstractOptimizer) ref_is_worker = Ref{Cint}(0) - @mxcall(:MXKVStoreIsWorkerNode, (Ref{Cint},), ref_is_worker) + @mxcall(:MXKVStoreIsWorkerSymbolicNode, (Ref{Cint},), ref_is_worker) is_worker = ref_is_worker[] if ismatch(r"dist", string(get_type(self))) && is_worker diff --git a/src/kvstore.jl-e b/src/kvstore.jl-e new file mode 100644 index 000000000000..d52433f567b2 --- /dev/null +++ b/src/kvstore.jl-e @@ -0,0 +1,132 @@ +type KVStore + handle :: MX_KVStoreHandle + updater_c :: Ptr{Void} + updater :: Function + + KVStore(hdr :: MX_KVStoreHandle) = new(hdr, Ptr{Void}(0)) +end + +function KVStore(kv_type::Base.Symbol = :local) + #@assert(kv_type ∈ [:local]) # TODO: update with allowed types + + ref_hdr = Ref{MX_handle}(0) + kv_type = string(kv_type) + @mxcall(:MXKVStoreCreate, (char_p, Ref{MX_handle}), kv_type, ref_hdr) + return KVStore(MX_KVStoreHandle(ref_hdr[])) +end +function Base.unsafe_convert(::Type{MX_handle}, obj::KVStore) + Base.unsafe_convert(MX_handle, obj.handle) +end 
+Base.convert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) +Base.cconvert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) + +function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) + @assert length(keys) == length(vals) + keys_flt = Int[] + vals_flt = NDArray[] + for (k,v) in zip(keys, vals) + append!(keys_flt, Base.ones(Int, length(v))*k) + append!(vals_flt, v) + end + return (keys_flt, vals_flt) +end + +function init!(self :: KVStore, key :: Int, val :: NDArray) + init!(self, [key], [val]) +end +function init!(self :: KVStore, key :: Int, vals :: Vector{NDArray}) + init!(self, Base.ones(Int, length(vals))*key, vals) +end +function init!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) + init!(self, _flatten_kvlist(keys, vals)...) +end +function init!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{NDArray}) + @assert length(keys) == length(vals) + keys = Cint[keys...] + vals = MX_handle[vals...] + @mxcall(:MXKVStoreInit, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}), + self, length(keys), keys, vals) +end + +import Base.push! +function push!(self :: KVStore, key :: Int, val :: NDArray; priority :: Int = 0) + push!(self, [key], [val]; priority = priority) +end +function push!(self :: KVStore, key :: Int, vals :: Vector{NDArray}; priority :: Int = 0) + push!(self, Base.ones(Int, length(vals))*key, vals; priority = priority) +end +function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}; priority::Int=0) + push!(self, _flatten_kvlist(keys, vals)...; priority = priority) +end +function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{NDArray}; priority::Int=0) + @assert length(keys) == length(vals) + keys = Cint[keys...] + vals = MX_handle[vals...] 
+ @mxcall(:MXKVStorePush, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), + self, length(keys), keys, vals, priority) +end + +function pull!(self :: KVStore, key :: Int, out :: NDArray; priority :: Int = 0) + pull!(self, [key], [out]; priority = priority) # forward priority like every other pull!/push! method +end +function pull!(self :: KVStore, key :: Int, outs :: Vector{NDArray}; priority :: Int = 0) + pull!(self, Base.ones(Int, length(outs))*key, outs; priority = priority) +end +function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{Vector{NDArray}}; priority::Int=0) + pull!(self, _flatten_kvlist(keys, outs)...; priority = priority) +end +function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{NDArray}; priority::Int=0) + @assert length(keys) == length(outs) + keys = Cint[keys...] + outs = MX_handle[outs...] + @mxcall(:MXKVStorePull, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), + self, length(keys), keys, outs, priority) +end + + +function get_type(self :: KVStore) + type_ref = Ref{char_p}(0) + @mxcall(:MXKVStoreGetType, (MX_handle, Ref{char_p}), self, type_ref) + return symbol(bytestring(type_ref[])) +end + +function get_num_workers(self :: KVStore) + ref_size = Ref{Cint}(0) + @mxcall(:MXKVStoreGetGroupSize, (MX_handle, Ref{Cint}), self, ref_size) + return Int(ref_size[]) +end + +function get_rank(self :: KVStore) + ref_rank = Ref{Cint}(0) + @mxcall(:MXKVStoreGetRank, (MX_handle, Ref{Cint}), self, ref_rank) + return Int(ref_rank[]) +end + + +# TODO: Currently Julia does not support closure in c-callbacks, so we are making use of the +# extra handle parameter of the API to pass the updater object around. Fix this when someday +# full closure cfunction is supported in Julia. 
+function _kvstore_update_wrapper(index::Cint, nd_recv::MX_handle, nd_local::MX_handle, updater::Ptr{Void}) + updater_func = unsafe_pointer_to_objref(updater) :: Function + updater_func(Int(index), NDArray(MX_NDArrayHandle(nd_recv)), NDArray(MX_NDArrayHandle(nd_local))) + return nothing +end +function set_updater(self :: KVStore, updater :: Function) + self.updater = updater # keep a reference to the julia object so that updater_c is kept valid + self.updater_c = cfunction(_kvstore_update_wrapper, Void, (Cint, MX_handle, MX_handle, Ptr{Void})) + + @mxcall(:MXKVStoreSetUpdater, (MX_handle, Ptr{Void}, Any), + self, self.updater_c, updater) +end + +function set_optimizer(self :: KVStore, optimizer :: AbstractOptimizer) + ref_is_worker = Ref{Cint}(0) + @mxcall(:MXKVStoreIsWorkerNode, (Ref{Cint},), ref_is_worker) + is_worker = ref_is_worker[] + + if ismatch(r"dist", string(get_type(self))) && is_worker + # TODO + else + set_updater(self, get_updater(optimizer)) + end +end diff --git a/src/metric.jl-e b/src/metric.jl-e new file mode 100644 index 000000000000..c88239ab8cc8 --- /dev/null +++ b/src/metric.jl-e @@ -0,0 +1,37 @@ +abstract AbstractEvalMetric + +type Accuracy <: AbstractEvalMetric + acc_sum :: Float64 + n_sample :: Int + + Accuracy() = new(0.0, 0) +end + +function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) + label = copy(label) + pred = copy(pred) + + n_sample = size(pred)[end] + metric.n_sample += n_sample + for i = 1:n_sample + klass = indmax(pred[:,i]) + metric.acc_sum += (klass-1) == label[i] + end +end + +function update!(metric :: Accuracy, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + @assert length(labels) == length(preds) + for i = 1:length(labels) + _update_single_output(metric, labels[i], preds[i]) + end +end + +import Base: get +function get(metric :: Accuracy) + return [(:accuracy, metric.acc_sum / metric.n_sample)] +end + +function reset!(metric :: Accuracy) + metric.acc_sum = 0.0 + metric.n_sample = 0 
+end diff --git a/src/model.jl b/src/model.jl index 93189124d9b0..1a9d11facbe2 100644 --- a/src/model.jl +++ b/src/model.jl @@ -23,7 +23,7 @@ abstract AbstractModel that handles sequential data explicitly, please use **TODO**... =# type FeedForward <: AbstractModel - arch :: Node + arch :: SymbolicNode ctx :: Vector{Context} arg_params :: Dict{Base.Symbol, NDArray} @@ -32,7 +32,7 @@ type FeedForward <: AbstractModel pred_exec :: Union{Executor, Void} # leave the rest fields undefined - FeedForward(arch :: Node, ctx :: Vector{Context}) = new(arch, ctx) + FeedForward(arch :: SymbolicNode, ctx :: Vector{Context}) = new(arch, ctx) end """Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector @@ -52,14 +52,14 @@ function _split_inputs(batch_size :: Int, n_split :: Int) end #=doc -.. function:: FeedForward(arch :: Node, ctx) +.. function:: FeedForward(arch :: SymbolicNode, ctx) :param arch: the architecture of the network constructed using the symbolic API. :param ctx: the devices on which this model should do computation. It could be a single :class:`Context` or a list of :class:`Context` objects. In the latter case, data parallelization will be used for training. If no context is provided, the default context ``cpu()`` will be used. 
=# -function FeedForward(arch :: Node; context :: Union{Context, Vector{Context}, Void} = nothing) +function FeedForward(arch :: SymbolicNode; context :: Union{Context, Vector{Context}, Void} = nothing) if isa(context, Void) context = [Context(CPU)] elseif isa(context, Context) @@ -514,7 +514,7 @@ end function save_checkpoint(self :: FeedForward, prefix :: AbstractString, state :: OptimizationState) save_checkpoint(self.arch, self.arg_params, self.aux_params, prefix, state.curr_epoch) end -function save_checkpoint(sym :: Node, arg_params :: Dict{Base.Symbol, NDArray}, +function save_checkpoint(sym :: SymbolicNode, arg_params :: Dict{Base.Symbol, NDArray}, aux_params :: Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) save("$prefix-symbol.json", sym) save_dict = merge(Dict([symbol("arg:$k") => v for (k,v) in arg_params]), @@ -525,7 +525,7 @@ function save_checkpoint(sym :: Node, arg_params :: Dict{Base.Symbol, NDArray}, end function load_checkpoint(prefix :: AbstractString, epoch :: Int) - arch = load("$prefix-symbol.json", Node) + arch = load("$prefix-symbol.json", SymbolicNode) saved_dict = load(format("{1}-{2:04d}.params", prefix, epoch), NDArray) arg_params = Dict{Base.Symbol, NDArray}() aux_params = Dict{Base.Symbol, NDArray}() diff --git a/src/model.jl-e b/src/model.jl-e new file mode 100644 index 000000000000..93189124d9b0 --- /dev/null +++ b/src/model.jl-e @@ -0,0 +1,566 @@ +#=doc +Models +====== + +The model API provides convenient high-level interface to do training and predicting on +a network described using the symbolic API. +=# + +#=doc +.. class:: AbstractModel + + The abstract super type of all models in MXNet.jl. +=# +abstract AbstractModel + +#=doc +.. class:: FeedForward + + The feedforward model provides convenient interface to train and predict on + feedforward architectures like multi-layer MLP, ConvNets, etc. 
There is no + explicitly handling of *time index*, but it is relatively easy to implement + unrolled RNN / LSTM under this framework (**TODO**: add example). For models + that handles sequential data explicitly, please use **TODO**... +=# +type FeedForward <: AbstractModel + arch :: Node + ctx :: Vector{Context} + + arg_params :: Dict{Base.Symbol, NDArray} + aux_params :: Dict{Base.Symbol, NDArray} + + pred_exec :: Union{Executor, Void} + + # leave the rest fields undefined + FeedForward(arch :: Node, ctx :: Vector{Context}) = new(arch, ctx) +end + +"""Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector + of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that + piece. +""" +function _split_inputs(batch_size :: Int, n_split :: Int) + @assert(batch_size >= n_split) + per_split = floor(Int, batch_size / n_split) + counts = Base.zeros(Int, n_split)+per_split + extra = batch_size - sum(counts) + counts[1:extra] += 1 + + cum = [0, cumsum(counts)...] + idx = [cum[i-1]+1:cum[i] for i = 2:length(cum)] + return idx +end + +#=doc +.. function:: FeedForward(arch :: Node, ctx) + + :param arch: the architecture of the network constructed using the symbolic API. + :param ctx: the devices on which this model should do computation. It could be a single :class:`Context` + or a list of :class:`Context` objects. In the latter case, data parallelization will be used + for training. If no context is provided, the default context ``cpu()`` will be used. +=# +function FeedForward(arch :: Node; context :: Union{Context, Vector{Context}, Void} = nothing) + if isa(context, Void) + context = [Context(CPU)] + elseif isa(context, Context) + context = [context] + end + FeedForward(arch, context) +end + +#=doc +.. function:: init_model(self, initializer; overwrite=false, input_shapes...) + + Initialize the weights in the model. + + This method will be called automatically when training a model. 
So there is usually no + need to call this method unless one needs to inspect a model with only randomly initialized + weights. + + :param FeedForward self: the model to be initialized. + :param AbstractInitializer initializer: an initializer describing how the weights should be initialized. + :param Bool overwrite: keyword argument, force initialization even when weights already exists. + :param input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. + For example, ``data=(28,28,1,100), label=(100,)``. +=# +function init_model(self :: FeedForward, initializer :: AbstractInitializer; overwrite::Bool=false, input_shapes...) + # all arg names, including data, label, and parameters + arg_names = list_arguments(self.arch) + + input_names = [x[1] for x in input_shapes] + + param_names = setdiff(arg_names, input_names) + aux_names = list_auxiliary_states(self.arch) + + arg_defined = true + aux_defined = true + + arg_shapes, out_shapes, aux_shapes = infer_shape(self.arch; input_shapes...) + if !isdefined(self, :arg_params) + param_name_shapes = filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) + self.arg_params = Dict([name => empty(shape) for (name,shape) in param_name_shapes]) + arg_defined = false + end + if !isdefined(self, :aux_params) + self.aux_params = Dict([name => empty(shape) for (name,shape) in zip(aux_names,aux_shapes)]) + aux_defined = false + end + + # initialize the contents of the parameters + if !arg_defined || overwrite + for (k,v) in self.arg_params + initializer(k, v) + end + end + if !aux_defined || overwrite + for (k,v) in self.aux_params + initializer(k, v) + end + end + + return (arg_names, param_names, aux_names) +end + +function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_shapes...) 
+ if !isdefined(self, :pred_exec) || isa(self.pred_exec, Void) || overwrite + if !isdefined(self, :arg_params) || !isdefined(self, :aux_params) + @assert(false, "Model weights not defined, please init or train the model, or load from file") + end + + # the predictor use only the first device + self.pred_exec = simple_bind(self.arch, self.ctx[1]; grad_req=GRAD_NOP, data_shapes...) + copy_params_from(self.pred_exec, self.arg_params, self.aux_params) + else + # make sure the new setup is compatible with the existing one + for (d_name, d_shape) in data_shapes + @assert(d_shape == size(self.pred_exec.arg_dict[d_name]), + "Shape of $d_name mismatch with existing predictor, use overwrite=true overwrite existing predictor") + end + end +end + +#=doc +.. function:: + predict(self, data; overwrite=false, callback=nothing) + + Predict using an existing model. The model should be already initialized, or trained or loaded from + a checkpoint. There is an overloaded function that allows to pass the callback as the first argument, + so it is possible to do + + .. code-block:: julia + + predict(model, data) do batch_output + # consume or write batch_output to file + end + + :param FeedForward self: the model. + :param AbstractDataProvider data: the data to perform prediction on. + :param Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory + allocation of the :class:`Executor` depends on the mini-batch size of the test + data provider. If you call predict twice with data provider of the same batch-size, + then the executor can be re-used. Otherwise, if ``overwrite`` is false (default), + an error will be raised; if ``overwrite`` is set to true, a new :class:`Executor` + will be created to replace the old one. + + .. note:: + + Prediction is computationally much less costly than training, so the bottleneck sometimes becomes the IO + for copying mini-batches of data. 
Since there is no concern about convergence in prediction, it is better + to set the mini-batch size as large as possible (limited by your device memory) if prediction speed is a + concern. + + For the same reason, currently prediction will only use the first device even if multiple devices are + provided to construct the model. + + :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` +=# +function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = false) + predict(self, data; overwrite = overwrite, callback=callback) +end +function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=false, callback::Union{Function,Void}=nothing) + data_shapes = provide_data(data) + data_names = [x[1] for x in data_shapes] + _setup_predictor(self, overwrite; data_shapes...) + + batch_size = get_batch_size(data) + data_arrays = [self.pred_exec.arg_dict[name] for name in data_names] + output_list = [Array{MX_float}[] for i=1:length(self.pred_exec.outputs)] + for batch in eachbatch(data) + load_data!(data, batch, data_arrays) + forward(self.pred_exec, is_train=false) + if isa(callback, Void) + # no callback, accumulate the data and return at the end + for (o_list, o_nd) in zip(output_list, self.pred_exec.outputs) + push!(o_list, copy(slice(o_nd, 1:count_samples(data, batch)))) + end + else + outputs = self.pred_exec.outputs + if length(outputs) == 1 + outputs = outputs[1] + end + callback(outputs) + end + end + + if !isa(callback, Void) + # callback exists, do not accumulate data + return nothing + end + + if isempty(output_list) + # maybe model does not have outputs + return nothing + end + if isempty(output_list[1]) + # maybe no output because data is empty + return length(output_list) == 1 ? output_list[1] : output_list + end + + # concatenate along mini-batches + output_arrays = [cat(ndims(x[1]), x...) 
for x in output_list] + if length(output_arrays) == 1 + # only 1 output, return it directly, instead of a list + output_arrays = output_arrays[1] + end + return output_arrays +end + +function _init_model(self :: FeedForward, data :: AbstractDataProvider, initializer :: AbstractInitializer, overwrite :: Bool) + init_model(self, initializer; overwrite=overwrite, [provide_data(data)..., provide_label(data)...]...) +end + +function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) + if num_device == 1 && !ismatch(r"dist", string(kv_type)) + kv = nothing + else + if kv_type == :local + max_size = maximum([prod(size(param)) for (k,param) in arg_params]) + if max_size < 1024 * 1024 * 16 + kv_type = :local_update_cpu + else + kv_type = :local_allreduce_cpu + end + info("Auto-select kvstore type = $kv_type") + end + kv = KVStore(kv_type) + end + + update_on_kvstore = true + if isa(kv, Void) || ismatch(r"local_allreduce", string(get_type(kv))) + update_on_kvstore = false + end + + return (kv, update_on_kvstore) +end + +@defstruct TrainingOptions Any ( + initializer :: AbstractInitializer = UniformInitializer(0.01), + n_epoch :: Int = 10, + eval_data :: Union{Void, AbstractDataProvider} = nothing, + eval_metric :: AbstractEvalMetric = Accuracy(), + kvstore :: Union{Base.Symbol, KVStore} = :local, + force_init :: Bool = false, + callbacks :: Vector{AbstractCallback} = AbstractCallback[], +) + +function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, + state::OptimizationState, type_filter::Type) + map(callbacks) do cb + if isa(cb, type_filter) + if type_filter == AbstractEpochCallback + # epoch callback have extra access to the model object + cb(self, state) + else + cb(state) + end + end + end +end + +#=doc +.. function:: train(model :: FeedForward, ...) + + Alias to :func:`fit`. +=# +function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) 
+ fit(self, optimizer, data; kwargs...) +end + +#=doc +.. function:: fit(model :: FeedForward, optimizer, data; kwargs...) + + Train the ``model`` on ``data`` with the ``optimizer``. + + :param FeedForward model: the model to be trained. + :param AbstractOptimizer optimizer: the optimization algorithm to use. + :param AbstractDataProvider data: the training data provider. + :param Int n_epoch: default 10, the number of full data-passes to run. + :param AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for + the validation set. + :param AbstractEvalMetric eval_metric: keyword argument, default ``Accuracy()``. The metric used + to evaluate the training performance. If ``eval_data`` is provided, the same metric is also + calculated on the validation set. + :param kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients + and parameters when multiple devices are used for training. + :type kvstore: :class:`KVStore` or ``Base.Symbol`` + :param AbstractInitializer initializer: keyword argument, default ``UniformInitializer(0.01)``. + :param Bool force_init: keyword argument, default false. By default, the random initialization using the + provided ``initializer`` will be skipped if the model weights already exists, maybe from a previous + call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When + this option is set, it will always do random initialization at the begining of training. + :param callbacks: keyword argument, default ``[]``. Callbacks to be invoked at each epoch or mini-batch, + see :class:`AbstractCallback`. + :type callbacks: ``Vector{AbstractCallback}`` +=# +function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) + opts = TrainingOptions(; kwargs...) 
+ + info("Start training on $(self.ctx)") + + batch_size = get_batch_size(data) + num_dev = length(self.ctx) + slices = _split_inputs(batch_size, num_dev) + + # initialize parameters + info("Initializing parameters...") + arg_names, param_names, aux_names = _init_model(self, data, opts.initializer, opts.force_init) + + # setup kvstore + kvstore = opts.kvstore + if isa(kvstore, Base.Symbol) + info("Creating KVStore...") + kvstore, update_on_kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params) + end + + train_execs = Array(Executor, num_dev) + for i = 1:num_dev + data_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)] + label_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)] + train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=GRAD_WRITE, data_shapes..., label_shapes...) + + copy_params_from(train_execs[i], self.arg_params, self.aux_params) + end + + # set up input data structures + data_names = [x[1] for x in provide_data(data)] + label_names = [x[1] for x in provide_label(data)] + + data_arrays = [SlicedNDArray[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] + for name in data_names] + label_arrays = [SlicedNDArray[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] + for name in label_names] + + param_idx = filter(i -> in(arg_names[i], param_names), 1:length(arg_names)) + + param_arrays = [NDArray[exec.arg_arrays[i] for exec in train_execs] for i in param_idx] + grad_arrays = [NDArray[exec.grad_arrays[i] for exec in train_execs] for i in param_idx] + aux_arrays = [NDArray[exec.aux_arrays[i] for exec in train_execs] for i = 1:length(aux_names)] + + op_state = OptimizationState(batch_size) + optimizer.state = op_state + + if !update_on_kvstore + updater = get_updater(optimizer) + end + + if !isa(kvstore, Void) + if update_on_kvstore + set_optimizer(kvstore, optimizer) + end + + info("Initializing KVStore...") + # init kv 
with gradients + for idx = 1:length(param_arrays) + param_on_devs = param_arrays[idx] + + init!(kvstore, idx, self.arg_params[param_names[idx]]) + + if update_on_kvstore + # pull weights back + pull!(kvstore, idx, param_on_devs, priority=-idx) + end + end + end + + # set up output and labels in CPU for evaluation metric + output_shapes = [tuple(size(x)[1:end-1]...,batch_size) for x in train_execs[1].outputs] + cpu_dev = Context(CPU) + cpu_output_arrays = [empty(shape, cpu_dev) for shape in output_shapes] + cpu_label_arrays = [empty(shape, cpu_dev) for (name,shape) in provide_label(data)] + + # invoke callbacks on epoch 0 + _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) + + # now start training... + for i_epoch = 1:opts.n_epoch + time_start = time() + reset!(opts.eval_metric) + + op_state.curr_epoch = i_epoch + op_state.curr_batch = 0 + + # invoke callbacks on iteration 0 + _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) + + for batch in eachbatch(data) + load_data!(data, batch, data_arrays) + load_label!(data, batch, label_arrays) + + # forward and backward + for (texec, islice) in zip(train_execs, slices) + forward(texec, is_train=true) + + # copy outputs into cpu ndarray, for evaluation metric + for (cpu_out, dev_out) in zip(cpu_output_arrays, texec.outputs) + copy!(slice(cpu_out, islice), dev_out) + end + + backward(texec) + end + + op_state.curr_iter += 1 + op_state.curr_batch += 1 + optimizer.state = op_state + + # update parameters + for idx = 1:length(param_names) + # gradient synchronization + if !isa(kvstore, Void) + # push gradient, priority is negative index + push!(kvstore, idx, grad_arrays[idx], priority=-idx) + if update_on_kvstore + # pull back the weights + pull!(kvstore, idx, param_arrays[idx], priority=-idx) + else + # pull back the sum-ed gradients, to the same locations + pull!(kvstore, idx, grad_arrays[idx], priority=-idx) + end + end + + if !update_on_kvstore + # manual updating + for i_dev = 
1:num_dev + # create a fake index, so that the updater create states + # for different param AND different devices, TODO(mli) + # use a better solution later + fake_idx = idx * num_dev + i_dev + updater(fake_idx, grad_arrays[idx][i_dev], param_arrays[idx][i_dev]) + end + end + end + + # invoke callbacks after finishing each iteration + _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) + + # update evaluation metric on training set + load_label!(data, batch, cpu_label_arrays) + update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) + end # end of one epoch + + time_stop = time() + info(format("== Epoch {1:0>3d} ==========", i_epoch)) + info("## Training summary") + for (name, value) in get(opts.eval_metric) + info(format("{1:>15s} = {2:.4f}", name, value)) + end + info(format("{1:>15s} = {2:.4f} seconds", "time", time_stop-time_start)) + + # evaluation on validation set + if !isa(opts.eval_data, Void) + # because we are re-using the memory allocated for the training network, + # the batch_size of the validation dataset must be the same as the training + # batch_size + @assert(get_batch_size(opts.eval_data) == batch_size) + + reset!(opts.eval_metric) + for batch in eachbatch(opts.eval_data) + load_data!(opts.eval_data, batch, data_arrays) + + # forward and backward + for (texec, islice) in zip(train_execs, slices) + forward(texec, is_train=true) + + # copy outputs into cpu ndarray, for evaluation metric + for (cpu_out, dev_out) in zip(cpu_output_arrays, texec.outputs) + copy!(slice(cpu_out, islice), dev_out) + end + end + load_label!(opts.eval_data, batch, cpu_label_arrays) + update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) + end + + info("## Validation summary") + for (name, value) in get(opts.eval_metric) + info(format("{1:>15s} = {2:.4f}", name, value)) + end + end + + if i_epoch == opts.n_epoch || any(x->isa(x, AbstractEpochCallback), opts.callbacks) + # copy data back to cpu + for (name, weights) in zip(param_names, 
param_arrays) + # average parameters across devices + weight = +([copy(w, cpu()) for w in weights]...) / length(weights) + copy!(self.arg_params[name], weight) + end + for (name, aux_devs) in zip(aux_names, aux_arrays) + aux_avg = +([copy(aux, cpu()) for aux in aux_devs]...) / length(aux_devs) + copy!(self.aux_params[name], aux_avg) + end + end + _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) + end # end of all epochs +end + +function save_checkpoint(self :: FeedForward, prefix :: AbstractString, state :: OptimizationState) + save_checkpoint(self.arch, self.arg_params, self.aux_params, prefix, state.curr_epoch) +end +function save_checkpoint(sym :: Node, arg_params :: Dict{Base.Symbol, NDArray}, + aux_params :: Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) + save("$prefix-symbol.json", sym) + save_dict = merge(Dict([symbol("arg:$k") => v for (k,v) in arg_params]), + Dict([symbol("aux:$k") => v for (k,v) in aux_params])) + save_filename = format("{1}-{2:04d}.params", prefix, epoch) + save(save_filename, save_dict) + info("Saved checkpoint to '$save_filename'") +end + +function load_checkpoint(prefix :: AbstractString, epoch :: Int) + arch = load("$prefix-symbol.json", Node) + saved_dict = load(format("{1}-{2:04d}.params", prefix, epoch), NDArray) + arg_params = Dict{Base.Symbol, NDArray}() + aux_params = Dict{Base.Symbol, NDArray}() + for (k,v) in saved_dict + tp, name = split(string(k), ':') + name = symbol(name) + if tp == "arg" + arg_params[name] = v + else + aux_params[name] = v + end + end + + return (arch, arg_params, aux_params) +end + +function load_checkpoint(prefix :: AbstractString, epoch :: Int, ::Type{FeedForward}) + arch, arg_params, aux_params = load_checkpoint(prefix, epoch) + model = FeedForward(arch) + model.arg_params = arg_params + model.aux_params = aux_params + return model +end + +function load_checkpoint(self :: FeedForward, prefix :: AbstractString, epoch :: Int; overwrite :: Bool = true) + if 
isdefined(self, :arg_params) && isdefined(self, :aux_params) && !overwrite + info("model weights already exists, skip loading... (call with overwrite=true if needed)") + return self + end + + arch, arg_params, aux_params = load_checkpoint(prefix, epoch) + # TODO: is there better way to compare two symbols + @assert(to_json(self.arch) == to_json(arch), "Cannot load from a checkpoint with different network architecture") + self.arg_params = arg_params + self.aux_params = aux_params + return self +end + diff --git a/src/name.jl-e b/src/name.jl-e new file mode 100644 index 000000000000..5ebf10917ce6 --- /dev/null +++ b/src/name.jl-e @@ -0,0 +1,44 @@ +abstract AbstractNameManager +typealias NameType Union{Base.Symbol, AbstractString} +typealias NameCounter Dict{Base.Symbol, Int} + +import Base: get! + +# Default implementation for generating a name for a symbol. +# When a name is specified by the user, it will be used. Otherwise, a name +# is automatically generated based on the hint string. 
+function _default_get_name!(counter :: NameCounter, name :: NameType, hint :: NameType) + if isa(name, Base.Symbol) || !isempty(name) + return symbol(name) + end + + hint = symbol(hint) + if !haskey(counter, hint) + counter[hint] = 0 + end + name = symbol("$hint$(counter[hint])") + counter[hint] += 1 + return name +end + +type BasicNameManager <: AbstractNameManager + counter :: NameCounter +end +BasicNameManager() = BasicNameManager(NameCounter()) + +function get!(manager :: BasicNameManager, name :: NameType, hint :: NameType) + _default_get_name!(manager.counter, name, hint) +end + +type PrefixNameManager <: AbstractNameManager + prefix :: Base.Symbol + counter :: NameCounter +end +PrefixNameManager(prefix :: NameType) = PrefixNameManager(symbol(prefix), NameCounter()) + +function get!(manager :: PrefixNameManager, name :: NameType, hint :: NameType) + name = _default_get_name!(manager.counter, name, hint) + return symbol("$(manager.prefix)$name") +end + +DEFAULT_NAME_MANAGER = BasicNameManager() diff --git a/src/ndarray.jl-e b/src/ndarray.jl-e new file mode 100644 index 000000000000..82293d2fdbe9 --- /dev/null +++ b/src/ndarray.jl-e @@ -0,0 +1,800 @@ +#=doc +NDArray API +=========== +=# + +# create a NDArray handle of specific shape +function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) + h_ref = Ref{MX_handle}(0) + shape = flipdim(MX_uint[shape...],1) + @mxcall(:MXNDArrayCreate, (Ptr{MX_uint}, MX_uint, Cint, Cint, Cint, Ref{MX_handle}), + shape, length(shape), ctx.device_type, ctx.device_id, delay_alloc, h_ref) + handle = MX_NDArrayHandle(h_ref[]) + return handle +end + +# create a handle to an empty NDArray, this handle can be used to hold +# results returned by libmx API calls +function _ndarray_alloc() + h_ref = Ref{MX_handle}(0) + @mxcall(:MXNDArrayCreateNone, (Ref{MX_handle},), h_ref) + return MX_NDArrayHandle(h_ref[]) +end + +################################################################################ +# NDArray 
Type +################################################################################ +#=doc +.. class:: NDArray + + Wrapper of the ``NDArray`` type in ``libmxnet``. This is the basic building block + of tensor-based computation. + + .. _ndarray-shape-note: + + .. note:: + + since C/C++ use row-major ordering for arrays while Julia follows a + column-major ordering. To keep things consistent, we keep the underlying data + in their original layout, but use *language-native* convention when we talk + about shapes. For example, a mini-batch of 100 MNIST images is a tensor of + C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory + have shape (28,28,1,100). +=# +type NDArray + handle :: MX_NDArrayHandle + writable :: Bool + + function NDArray(handle, writable=true) + new(handle, writable) + end +end + +function Base.show(io :: IO, arr :: NDArray) + print(io, "mx.NDArray$(size(arr))") +end + +function NDArray{T<:Real}(data :: Array{T}) + copy(data, cpu()) +end + +function Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) + Base.unsafe_convert(MX_handle, obj.handle) +end +Base.convert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) +Base.cconvert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) + +################################################################################ +# NDArray functions exported to the users +################################################################################ +#=doc +.. function:: context(arr :: NDArray) + + Get the context that this :class:`NDArray` lives on. +=# +function context(arr :: NDArray) + ref_typeid = Ref{Cint}(0) + ref_devid = Ref{Cint}(0) + @mxcall(:MXNDArrayGetContext, (MX_handle, Ref{Cint}, Ref{Cint}), + arr, ref_typeid, ref_devid) + return Context(ref_typeid[], ref_devid[]) +end + +#=doc +.. function:: + empty(shape :: Tuple, ctx :: Context) + empty(shape :: Tuple) + empty(dim1, dim2, ...) 
+ + Allocate memory for an uninitialized :class:`NDArray` with specific shape. +=# +function empty{N}(shape :: NTuple{N, Int}) + empty(shape, cpu()) +end +function empty{N}(shape :: NTuple{N, Int}, ctx :: Context) + NDArray(_ndarray_alloc(shape, ctx, false)) +end +function empty(shape :: Int...) + empty(shape) +end + +#=doc +Interface functions similar to Julia Arrays +------------------------------------------- +=# + +#=doc +.. function:: + zeros(shape :: Tuple, ctx :: Context) + zeros(shape :: Tuple) + zeros(dim1, dim2, ...) + + Create zero-ed :class:`NDArray` with specific shape. +=# +function zeros{N}(shape :: NTuple{N, Int}) + zeros(shape, cpu()) +end +function zeros{N}(shape :: NTuple{N, Int}, ctx :: Context) + arr = empty(shape, ctx) + arr[:] = 0 + return arr +end +function zeros(shape :: Int...) + zeros(shape) +end + +#=doc +.. function:: + ones(shape :: Tuple, ctx :: Context) + ones(shape :: Tuple) + ones(dim1, dim2, ...) + + Create an :class:`NDArray` with specific shape and initialize with 1. +=# +function ones{N}(shape :: NTuple{N, Int}) + ones(shape, cpu()) +end +function ones{N}(shape :: NTuple{N, Int}, ctx :: Context) + arr = empty(shape, ctx) + arr[:] = 1 + return arr +end +function ones(shape :: Int...) + ones(shape) +end + +import Base: size, length, ndims, eltype + +#=doc +.. function:: + size(arr :: NDArray) + size(arr :: NDArray, dim :: Int) + + Get the shape of an :class:`NDArray`. The shape is in Julia's column-major convention. See + also the :ref:`notes on NDArray shapes `. +=# +function size(arr :: NDArray) + ref_ndim = Ref{MX_uint}(0) + ref_shape = Ref{Ptr{MX_uint}}(0) + @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), + arr, ref_ndim, ref_shape) + tuple(map(Int, flipdim(pointer_to_array(ref_shape[], ref_ndim[]),1))...) +end +function size(arr :: NDArray, dim :: Int) + size(arr)[dim] +end + +#=doc +.. function:: length(arr :: NDArray) + + Get the number of elements in an :class:`NDArray`. 
+=# +function length(arr :: NDArray) + prod(size(arr)) +end + +#=doc +.. function:: ndims(arr :: NDArray) + + Get the number of dimensions of an :class:`NDArray`. Is equivalent to ``length(size(arr))``. +=# +function ndims(arr :: NDArray) + length(size(arr)) +end + +#=doc +.. function:: eltype(arr :: NDArray) + + Get the element type of an :class:`NDArray`. Currently the element type is always ``mx.MX_float``. +=# +function eltype(arr :: NDArray) + MX_float +end + + +import Base: slice +#=doc +.. function:: slice(arr :: NDArray, start:stop) + + Create a view into a sub-slice of an :class:`NDArray`. Note only slicing at the slowest + changing dimension is supported. In Julia's column-major perspective, this is the last + dimension. For example, given an :class:`NDArray` of shape (2,3,4), ``slice(array, 2:3)`` will create + a :class:`NDArray` of shape (2,3,2), sharing the data with the original array. This operation is + used in data parallelization to split mini-batch into sub-batches for different devices. +=# +function slice(arr :: NDArray, ::Colon) + arr +end +function slice(arr :: NDArray, slice::UnitRange{Int}) + dim1 = size(arr)[end] + @assert(1 <= slice.start <= slice.stop <= dim1) + if slice.start == 1 && slice.stop == dim1 + return arr + end + + hdr_ref = Ref{MX_handle}(0) + # note Julia is 1-based, inclusive-inclusive indexing, while C++ is + # 0-based, inclusive-exclusive indexing. So 1:3 in Julia should + # translates into 0:3 in C++. + @mxcall(:MXNDArraySlice, (MX_handle, MX_uint, MX_uint, Ref{MX_handle}), + arr, slice.start-1, slice.stop, hdr_ref) + return NDArray(MX_NDArrayHandle(hdr_ref[]), arr.writable) +end + +import Base: setindex! + +#=doc +.. function:: setindex!(arr :: NDArray, val, idx) + + Assign values to an :class:`NDArray`. 
Elementwise assignment is not implemented, only the following + scenarios are supported + + - ``arr[:] = val``: whole array assignment, ``val`` could be a scalar or an array (Julia ``Array`` + or :class:`NDArray`) of the same shape. + - ``arr[start:stop] = val``: assignment to a *slice*, ``val`` could be a scalar or an array of + the same shape to the slice. See also :func:`slice`. +=# +function setindex!(arr :: NDArray, val :: Real, ::Colon) + @assert(arr.writable) + _set_value(val, arr) + return arr +end +function setindex!{T<:Real}(arr :: NDArray, val :: Array{T}, ::Colon) + copy!(arr, val) +end +function setindex!(arr :: NDArray, val :: NDArray, ::Colon) + copy!(arr, val) +end +function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, idx::UnitRange{Int}) + setindex!(slice(arr, idx), val, Colon()) +end + +#=doc +.. function:: getindex(arr :: NDArray, idx) + + Shortcut for :func:`slice`. A typical use is to write + + .. code-block:: julia + + arr[:] += 5 + + which translates into + + .. code-block:: julia + + arr[:] = arr[:] + 5 + + which furthur translates into + + .. code-block:: julia + + setindex!(getindex(arr, Colon()), 5, Colon()) + + .. note:: + + The behavior is quite different from indexing into Julia's ``Array``. For example, ``arr[2:5]`` + create a **copy** of the sub-array for Julia ``Array``, while for :class:`NDArray`, this is + a *slice* that shares the memory. +=# +import Base: getindex +"""Shortcut for `slice`. **NOTE** the behavior for Julia's built-in index slicing is to create a +copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. +""" +function getindex(arr :: NDArray, ::Colon) + return arr +end +function getindex(arr :: NDArray, idx::UnitRange{Int}) + slice(arr, idx) +end + +#=doc +Copying functions +----------------- +=# +import Base: copy!, copy, convert +#=doc +.. 
function::
+   copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array})
+
+   Copy contents of ``src`` into ``dst`` and return ``dst``.
+=#
+function copy!(dst :: NDArray, src :: NDArray)
+  @assert(dst.writable)
+  if dst.handle == src.handle
+    warn("Copying an NDArray to itself")
+    # nothing to transfer, but still hand back ``dst`` like every other path of ``copy!``
+    return dst
+  end
+
+  _copyto(src, dst)
+  return dst
+end
+
+# NDArray -> Julia Array of MX_float: synchronous copy straight into the memory of ``dst``.
+# The shapes must match exactly.
+function copy!(dst :: Array{MX_float}, src :: NDArray)
+  @assert size(dst) == size(src)
+  @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{MX_float}, Csize_t),
+          src, pointer(dst), length(dst))
+  return dst
+end
+# NDArray -> Julia Array of any other Real element type: materialize ``src`` as a Julia
+# Array via ``copy(src)`` and let the Array-to-Array ``copy!`` do the element conversion.
+function copy!{T<:Real}(dst :: Array{T}, src :: NDArray)
+  copy!(dst, copy(src))
+end
+
+# Julia Array -> NDArray. ``dst`` must be writable and have exactly the shape of ``src``.
+function copy!{T<:Real}(dst :: NDArray, src :: Array{T})
+  @assert dst.writable
+  @assert size(dst) == size(src)
+  src = convert(Array{MX_float}, src) # this might involve copying
+  @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t),
+          dst.handle, pointer(src), length(src))
+  return dst
+end
+
+# Julia Array -> NDArray, like ``copy!`` above, except that only the number of elements
+# has to agree; the shape of ``src`` is not checked.
+function copy_ignore_shape!{T<:Real}(dst :: NDArray, src :: Array{T})
+  @assert dst.writable
+  @assert length(dst) == length(src)
+  src = convert(Array{MX_float}, src) # this might involve copying
+  @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t),
+          dst.handle, pointer(src), length(src))
+  return dst
+end
+
+
+#=doc
+.. function::
+   copy(arr :: NDArray)
+   copy(arr :: NDArray, ctx :: Context)
+   copy(arr :: Array, ctx :: Context)
+
+   Create a copy of an array. When no :class:`Context` is given, create a Julia ``Array``.
+   Otherwise, create an :class:`NDArray` on the specified context.
+=#
+# NDArray -> freshly allocated Julia Array of MX_float
+copy(arr :: NDArray) = copy!(Array(MX_float, size(arr)), arr)
+
+# NDArray -> new NDArray of the same shape allocated in the given context
+function copy(arr :: NDArray, ctx :: Context)
+  target = NDArray(_ndarray_alloc(size(arr), ctx, true))
+  return copy!(target, arr)
+end
+
+# Julia Array -> new NDArray of the same shape allocated in the given context
+copy{T<:Real}(arr :: Array{T}, ctx :: Context) = copy!(empty(size(arr), ctx), arr)
+
+#=doc
+.. function:: convert(::Type{Array{T}}, arr :: NDArray)
+
+   Convert an :class:`NDArray` into a Julia ``Array`` of specific type.
+=#
+# The data is first copied out into a Julia Array, which is then converted to the
+# requested Array type.
+convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) = convert(t, copy(arr))
+
+
+#=doc
+Basic arithmetics
+-----------------
+=#
+
+#=doc
+.. function:: @inplace
+
+   Julia does not support redefinition of the ``+=`` operator (like ``__iadd__`` in Python).
+   When one writes ``a += b``, it gets translated to ``a = a+b``. ``a+b`` will allocate new
+   memory for the results, and the newly allocated :class:`NDArray` object is then assigned
+   back to ``a``, while the original contents of ``a`` are discarded. This is very inefficient
+   when we want to do an inplace update.
+
+   This macro is a simple utility to implement this behavior. Writing
+
+   .. code-block:: julia
+
+      @mx.inplace a += b
+
+   will translate into
+
+   .. code-block:: julia
+
+      mx.add_to!(a, b)
+
+   which will do inplace adding of the contents of ``b`` into ``a``.
+=#
+macro inplace(stmt)
+  # Only update-assignments can be translated. Anything that is not an expression (a bare
+  # symbol or a literal) has no ``head`` to inspect, so it is rejected with the same message.
+  isa(stmt, Expr) || error("unsupported inplace translation for $stmt")
+  if stmt.head == :+= || stmt.head == :.+=
+    Expr(:call, :add_to!, esc(stmt.args[1]), esc(stmt.args[2]))
+  elseif stmt.head == :-= || stmt.head == :.-=
+    Expr(:call, :sub_from!, esc(stmt.args[1]), esc(stmt.args[2]))
+  elseif stmt.head == :.*=
+    Expr(:call, :mul_to!, esc(stmt.args[1]), esc(stmt.args[2]))
+  elseif stmt.head == :./=
+    Expr(:call, :div_from!, esc(stmt.args[1]), esc(stmt.args[2]))
+  else
+    error("unsupported inplace translation for $stmt")
+  end
+end
+
+#=doc
+.. function:: add_to!(dst :: NDArray, args :: Union{Real, NDArray}...)
+
+   Add a bunch of arguments into ``dst``. Inplace updating.
+=#
+function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...)
+  @assert dst.writable
+  for arg in args
+    # ``dst`` is both the first input and the output of every step
+    if isa(arg, Real)
+      _plus_scalar(dst, arg, dst)
+    else
+      _plus(dst, arg, dst)
+    end
+  end
+  return dst
+end
+
+#=doc
+.. function::
+   +(args...)
+   .+(args...)
+
+   Summation. Multiple arguments of either scalar or :class:`NDArray` could be
+   added together. Note at least the first or second argument needs to be an :class:`NDArray` to
+   avoid ambiguity of built-in summation.
+=#
+import Base: +, .+
+function +(arg0 :: NDArray, args :: Union{Real, NDArray}...)
+  # accumulate into a copy in the same context, so ``arg0`` itself is not modified
+  ret = copy(arg0, context(arg0))
+  add_to!(ret, args...)
+end
+function .+(arg0 :: NDArray, args :: Union{Real, NDArray}...)
+  +(arg0, args...)
+end
+function +(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...)
+  # swap the first two arguments so that the NDArray method above handles the sum
+  +(arg1, arg0, args...)
+end
+function .+(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...)
+  .+(arg1, arg0, args...)
+end
+
+#=doc
+.. function:: sub_from!(dst :: NDArray, arg :: Union{Real, NDArray})
+
+   Subtract a scalar or an :class:`NDArray` from ``dst``. Inplace updating.
+=#
+function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray})
+  @assert dst.writable
+  if isa(arg, Real)
+    _minus_scalar(dst, arg, dst)
+  else
+    _minus(dst, arg, dst)
+  end
+  # return the destination explicitly, like ``add_to!`` and ``mul_to!`` do
+  return dst
+end
+
+#=doc
+.. 
function::
+   -(arg0, arg1)
+   -(arg0)
+   .-(arg0, arg1)
+
+   Subtraction ``arg0 - arg1`` of scalars and/or :class:`NDArray` objects, or the
+   negation of ``arg0`` when called with a single argument.
+=#
+import Base: -, .-
+function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray})
+  # subtract from a copy in the same context, so ``arg0`` itself is not modified
+  diff = copy(arg0, context(arg0))
+  return sub_from!(diff, arg1)
+end
+function .-(arg0 :: NDArray, arg1 :: Union{Real, NDArray})
+  return arg0 - arg1
+end
+function -(arg0 :: Real, arg1 :: NDArray)
+  # scalar - array is computed as (-array) + scalar
+  return add_to!(-arg1, arg0)
+end
+function .-(arg0 :: Real, arg1 :: NDArray)
+  return arg0 - arg1
+end
+
+# Unary minus: scale by -1 through the two-argument (output-less) form of ``_mul_scalar``.
+function -(arg0 :: NDArray)
+  return _mul_scalar(arg0, -1.0)
+end
+
+#=doc
+.. function:: mul_to!(dst :: NDArray, arg :: Union{Real, NDArray})
+
+   Elementwise multiplication of ``dst`` by either a scalar or an :class:`NDArray` of the same shape.
+   Inplace updating.
+=#
+function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray})
+  @assert dst.writable
+  # ``dst`` is both the first input and the output
+  isa(arg, Real) ? _mul_scalar(dst, arg, dst) : _mul(dst, arg, dst)
+  return dst
+end
+
+#=doc
+.. function::
+   .*(arg0, arg1)
+
+   Elementwise multiplication of ``arg0`` and ``arg1``; each could be either a scalar or an :class:`NDArray`.
+=#
+import Base: .*, *
+function .*(arg0 :: NDArray, arg :: Union{Real, NDArray})
+  product = copy(arg0, context(arg0))
+  return mul_to!(product, arg)
+end
+function .*(arg0 :: Real, arg :: NDArray)
+  return arg .* arg0
+end
+
+#=doc
+.. function::
+   *(arg0, arg1)
+
+   Currently only multiplication of a scalar with an :class:`NDArray` is implemented. Matrix multiplication
+   is to be added soon.
+=#
+function *(arg0 :: NDArray, arg :: Real)
+  scaled = copy(arg0, context(arg0))
+  return mul_to!(scaled, arg)
+end
+function *(arg0 :: Real, arg :: NDArray)
+  return arg * arg0
+end
+
+#=doc
+.. function:: div_from!(dst :: NDArray, arg :: Union{Real, NDArray})
+
+   Elementwise divide ``dst`` by a scalar or an :class:`NDArray` of the same shape. Inplace updating.
+=#
+function div_from!(dst :: NDArray, arg :: Union{Real, NDArray})
+  @assert dst.writable
+  if isa(arg, Real)
+    _div_scalar(dst, arg, dst)
+  else
+    _div(dst, arg, dst)
+  end
+  # return the destination explicitly, like ``add_to!`` and ``mul_to!`` do
+  return dst
+end
+
+import Base: ./, /
+#=doc
+.. function:: ./(arg0 :: NDArray, arg :: Union{Real, NDArray})
+
+   Elementwise dividing an :class:`NDArray` by a scalar or another :class:`NDArray` of the same shape.
+=#
+function ./(arg0 :: NDArray, arg :: Union{Real, NDArray})
+  # divide a copy in the same context, so ``arg0`` itself is not modified
+  ret = copy(arg0, context(arg0))
+  div_from!(ret, arg)
+end
+
+#=doc
+.. function:: /(arg0 :: NDArray, arg :: Real)
+
+   Divide an :class:`NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet.
+=#
+function /(arg0 :: NDArray, arg :: Real)
+  ./(arg0, arg)
+end
+
+#=doc
+IO
+--
+=#
+#=doc
+.. function:: load(filename, ::Type{NDArray})
+
+   Load NDArrays from binary file.
+
+   :param AbstractString filename: the path of the file to load. It could be an S3 or HDFS address
+          if the ``libmxnet`` is built with the corresponding component enabled. Examples
+
+          * ``s3://my-bucket/path/my-s3-ndarray``
+          * ``hdfs://my-bucket/path/my-hdfs-ndarray``
+          * ``/path-to/my-local-ndarray``
+
+   :return: Either ``Dict{Base.Symbol, NDArray}`` (when the file stores names) or ``Vector{NDArray}``.
+=#
+function load(filename::AbstractString, ::Type{NDArray})
+  out_size = Ref{MX_uint}(0)
+  out_hdrs = Ref{Ptr{MX_handle}}(0)
+  out_name_size = Ref{MX_uint}(0)
+  out_names = Ref{char_pp}(0)
+  @mxcall(:MXNDArrayLoad, (char_p, Ref{MX_uint}, Ref{Ptr{MX_handle}}, Ref{MX_uint}, Ref{char_pp}),
+          filename, out_size, out_hdrs, out_name_size, out_names)
+  out_name_size = out_name_size[]
+  out_size = out_size[]
+  if out_name_size == 0
+    # no names were reported: return the arrays as a plain vector
+    return [NDArray(MX_NDArrayHandle(hdr)) for hdr in pointer_to_array(out_hdrs[], out_size)]
+  else
+    # names were reported: there must be exactly one per array
+    @assert out_size == out_name_size
+    return Dict([(symbol(bytestring(k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in
+                 zip(pointer_to_array(out_names[], out_size), pointer_to_array(out_hdrs[], out_size))])
+  end
+end
+
+#=doc
+.. 
function:: save(filename :: AbstractString, data)
+
+   Save NDArrays to binary file. Filename could be an S3 or HDFS address, if ``libmxnet`` is built
+   with corresponding support.
+
+   :param AbstractString filename: path to the binary file to write to.
+   :param data: data to save to file.
+   :type data: :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``.
+=#
+# a single array is saved as a one-element vector
+function save(filename::AbstractString, data::NDArray)
+  save(filename, [data])
+end
+# unnamed arrays: a null pointer is passed in place of the list of names
+function save(filename::AbstractString, data::Vector{NDArray})
+  @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp),
+          filename, length(data), MX_handle[data...], char_pp(0))
+end
+# named arrays: keys and handles are collected in the same order before being handed over
+function save(filename::AbstractString, data::Dict{Base.Symbol,NDArray})
+  names = [k for k in keys(data)]
+  arrays = MX_handle[data[k] for k in names]
+  names = AbstractString[string(k) for k in names]
+
+  @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp),
+          filename, length(names), arrays, names)
+end
+
+#=doc
+libmxnet APIs
+-------------
+=#
+################################################################################
+# NDArray functions dynamically imported from libmxnet
+################################################################################
+# Thin wrapper around ``MXFuncInvoke``: calls the libmxnet function behind ``func_handle``
+# with the given input handles, scalars and output handles.
+function _invoke_mxfunction(func_handle::MX_handle, use_vars, scalars, mut_vars)
+  @mxcall(:MXFuncInvoke,
+          (MX_handle, Ptr{MX_handle}, Ptr{MX_float}, Ptr{MX_handle}),
+          func_handle, use_vars, scalars, mut_vars)
+end
+
+# Bit flags tested against the type mask that ``MXFuncDescribe`` reports for each function.
+@enum(LIBMX_FUNC_TYPE_MASK,
+  NDARRAY_ARG_BEFORE_SCALAR = 1,
+  ACCEPT_EMPTY_MUTATE_TARGET = (1 << 2)
+)
+
+# Import corresponding math functions from base so the automatically defined libmxnet
+# functions can overload them
+import Base: sqrt
+
+#=doc
+The libmxnet APIs are automatically imported from ``libmxnet.so``. The functions listed
+here operate on :class:`NDArray` objects. The arguments to the functions are typically ordered
+as
+
+.. 
code-block:: julia
+
+   func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...)
+
+unless ``NDARRAY_ARG_BEFORE_SCALAR`` is not set. In this case, the scalars are put before the input arguments:
+
+.. code-block:: julia
+
+   func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...)
+
+
+If ``ACCEPT_EMPTY_MUTATE_TARGET`` is set, an overloaded function without the output arguments will also be defined:
+
+.. code-block:: julia
+
+   func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...)
+
+Upon calling, the output arguments will be automatically initialized with empty NDArrays.
+
+Those functions always return the output arguments. If there is only one output (the typical situation), that
+object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned.
+
+**autogen:EMBED:ndarray:EMBED:autogen**
+=#
+function _import_ndarray_functions(;gen_docs=false)
+  n_ref = Ref{MX_uint}(0)
+  h_ref = Ref{Ptr{MX_handle}}(0)
+  @mxcall(:MXListFunctions, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref)
+
+  n_funcs = n_ref[]
+  h_funcs = pointer_to_array(h_ref[], n_funcs)
+
+  # with gen_docs=true nothing is defined; the docstrings are collected and returned instead
+  if gen_docs
+    docs = Dict{Base.Symbol, AbstractString}()
+  end
+
+  for i = 1:n_funcs
+    func_handle = h_funcs[i]
+
+    #----------------------------------------
+    # get function information (human readable)
+    ref_name = Ref{char_p}(0)
+    ref_desc = Ref{char_p}(0)
+    ref_narg = Ref{MX_uint}(0)
+
+    ref_arg_names = Ref{char_pp}(0)
+    ref_arg_types = Ref{char_pp}(0)
+    ref_arg_descs = Ref{char_pp}(0)
+
+    @mxcall(:MXFuncGetInfo,
+            (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}),
+            func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs)
+
+    func_name = symbol(bytestring(ref_name[]))
+
+    if gen_docs
+      # generate document only
+      f_desc = bytestring(ref_desc[]) * "\n\n"
+      f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs)
+      docs[func_name] = f_desc
+    else
+      #----------------------------------------
+      # get function specification
+      ref_n_use_vars = Ref{MX_uint}(0)
+      ref_n_scalars = Ref{MX_uint}(0)
+      ref_n_mut_vars = Ref{MX_uint}(0)
+      ref_type_mask = Ref{Cint}(0)
+      @mxcall(:MXFuncDescribe,
+              (MX_handle, Ref{MX_uint}, Ref{MX_uint}, Ref{MX_uint}, Ref{Cint}),
+              func_handle, ref_n_use_vars, ref_n_scalars, ref_n_mut_vars, ref_type_mask)
+
+      #----------------------------------------
+      # prepare function definition
+      n_used_vars = ref_n_use_vars[]
+      n_scalars = ref_n_scalars[]
+      n_mutate_vars = ref_n_mut_vars[]
+      type_mask = ref_type_mask[]
+      accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0
+      arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0
+
+      # general ndarray function: typed argument list (in1::NDArray, ..., sca1::Real, ...,
+      # out1::NDArray, ...), with inputs and scalars ordered according to the type mask
+      if arg_before_scalar
+        args = vcat([Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars],
+                    [Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars],
+                    [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars])
+      else
+        args = vcat([Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars],
+                    [Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars],
+                    [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars])
+      end
+
+      # the body packs the arguments into typed arrays and forwards them to libmxnet
+      _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...)
+      _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...)
+      _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...)
+      stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars)
+      if n_mutate_vars == 1
+        stmt_ret = :(return out1)
+      else
+        stmt_ret = Expr(:return, Expr(:tuple, [symbol("out$i") for i=1:n_mutate_vars]...))
+      end
+
+      func_body = Expr(:block, stmt_call, stmt_ret)
+      func_head = Expr(:call, func_name, args...)
+
+      func_def = Expr(:function, func_head, func_body)
+      eval(func_def)
+
+      if accept_empty_mutate
+        # overload without output arguments: allocate empty outputs and forward to the
+        # full method defined above
+        args0 = args[1:n_used_vars+n_scalars]
+        func_head0 = Expr(:call, func_name, args0...)
+        _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars]
+        stmt_call0 = Expr(:call, func_name, args0..., _mut_vars0...)
+        func_body0 = Expr(:block, stmt_call0)
+
+        func_def0 = Expr(:function, func_head0, func_body0)
+        eval(func_def0)
+      end
+    end
+  end
+
+  if gen_docs
+    return docs
+  end
+end
+
diff --git a/src/optimizer.jl-e b/src/optimizer.jl-e
new file mode 100644
index 000000000000..a5f0bfd5ec60
--- /dev/null
+++ b/src/optimizer.jl-e
@@ -0,0 +1,226 @@
+#=doc
+Optimizers
+==========
+
+Common interfaces
+-----------------
+=#
+
+
+#=doc
+.. class:: AbstractOptimizer
+
+   Base type for all optimizers.
+=#
+abstract AbstractOptimizer
+
+#=doc
+.. class:: AbstractLearningRateScheduler
+
+   Base type for all learning rate schedulers.
+=#
+abstract AbstractLearningRateScheduler
+
+#=doc
+.. class:: AbstractMomentumScheduler
+
+   Base type for all momentum schedulers.
+=#
+abstract AbstractMomentumScheduler
+
+
+
+#=doc
+.. class:: OptimizationState
+
+   .. attribute:: batch_size
+
+      The size of the mini-batch used in stochastic training.
+
+   .. attribute:: curr_epoch
+
+      The current epoch count. Epoch 0 means no training yet, during the first
+      pass through the data, the epoch will be 1; during the second pass, the
+      epoch count will be 2, and so on.
+
+   .. attribute:: curr_batch
+
+      The current mini-batch count. The batch count is reset during every epoch.
+      The batch count 0 means the beginning of each epoch, with no mini-batch
+      seen yet. During the first mini-batch, the mini-batch count will be 1.
+
+   .. attribute:: curr_iter
+
+      The current iteration count. One iteration corresponds to one mini-batch,
+      but unlike the mini-batch count, the iteration count does **not** reset
+      in each epoch.
So it tracks the *total* number of mini-batches seen so far.
+=#
+type OptimizationState
+  batch_size :: Int
+  curr_epoch :: Int
+  curr_batch :: Int
+  curr_iter :: Int
+end
+# A fresh state: only the batch size is given, all three counters start at 0.
+OptimizationState(batch_size::Int) = OptimizationState(batch_size, 0, 0, 0)
+
+
+#=doc
+.. function:: get_learning_rate(scheduler, state)
+
+   :param AbstractLearningRateScheduler scheduler: a learning rate scheduler.
+   :param OptimizationState state: the current state about epoch, mini-batch and iteration count.
+   :return: the current learning rate.
+=#
+function get_learning_rate
+end
+
+################################################################################
+# The learning rate module
+module LearningRate
+import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate
+
+#=doc
+.. class:: LearningRate.Fixed
+
+   Fixed learning rate scheduler always returns the same learning rate.
+=#
+type Fixed <: AbstractLearningRateScheduler
+  learning_rate :: Float64
+end
+function get_learning_rate(self :: Fixed, state :: OptimizationState)
+  return self.learning_rate
+end
+
+#=doc
+.. class:: LearningRate.Exp
+
+   :math:`\eta_t = \eta_0\gamma^t`. Here :math:`t` is the epoch count, or the iteration
+   count if ``decay_on_iteration`` is set to true.
+=#
+type Exp <: AbstractLearningRateScheduler
+  learning_rate :: Float64
+  gamma :: Float64
+  on_iteration :: Bool
+end
+function Exp(base_lr::Real; gamma::Real=0.9, decay_on_iteration::Bool=false)
+  # the decay factor must lie strictly between 0 and 1
+  @assert(0 < gamma < 1)
+  return Exp(Float64(base_lr), Float64(gamma), decay_on_iteration)
+end
+function get_learning_rate(self :: Exp, state :: OptimizationState)
+  # the exponent is the iteration count or the epoch count, depending on the scheduler setup
+  t = self.on_iteration ? state.curr_iter : state.curr_epoch
+  return self.learning_rate * self.gamma ^ t
+end
+
+end # module LearningRate
+################################################################################
+function get_lr_scheduler(scheduler :: Any, lr :: Real)
+  # an explicit scheduler wins; anything else falls back to a fixed rate of ``lr``
+  isa(scheduler, AbstractLearningRateScheduler) ? scheduler : LearningRate.Fixed(lr)
+end
+
+
+#=doc
+.. 
function:: get_momentum(scheduler, state)
+
+   :param AbstractMomentumScheduler scheduler: the momentum scheduler.
+   :param OptimizationState state: the state about current epoch, mini-batch and iteration count.
+   :return: the current momentum.
+=#
+function get_momentum
+end
+
+
+################################################################################
+# The Momentum module
+module Momentum
+import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum
+
+#=doc
+.. class:: Momentum.Null
+
+   The null momentum scheduler always returns 0 for momentum. It is also used to
+   explicitly indicate momentum should not be used.
+=#
+type Null <: AbstractMomentumScheduler
+end
+function get_momentum(self :: Null, state :: OptimizationState)
+  return 0.0
+end
+
+#=doc
+.. class:: Momentum.Fixed
+
+   Fixed momentum scheduler always returns the same value.
+=#
+type Fixed <: AbstractMomentumScheduler
+  momentum :: Float64
+end
+function get_momentum(self :: Fixed, state :: OptimizationState)
+  return self.momentum
+end
+end # module Momentum
+################################################################################
+function get_momentum_scheduler(scheduler :: Any, momentum :: Real)
+  # in order of precedence: an explicit scheduler, no momentum at all, a fixed momentum
+  isa(scheduler, AbstractMomentumScheduler) && return scheduler
+  momentum == 0 && return Momentum.Null()
+  return Momentum.Fixed(momentum)
+end
+
+
+#=doc
+.. function:: get_updater(optimizer)
+
+   :param AbstractOptimizer optimizer: the underlying optimizer.
+
+   A utility function to create an updater function that uses its closure to
+   store all the states needed for each weight.
+=#
+function get_updater(optimizer :: AbstractOptimizer)
+  # per-weight optimizer state, keyed by the weight index and captured by the closure below
+  states = Dict{Int,Any}()
+  function updater(index :: Int, grad :: NDArray, weight :: NDArray)
+    # the state is created lazily, the first time a given index is seen
+    haskey(states, index) || (states[index] = create_state(optimizer, index, weight))
+    update(optimizer, index, weight, grad, states[index])
+  end
+  updater
+end
+
+################################################################################
+#=doc
+Built-in optimizers
+-------------------
+=#
+
+#=doc
+.. class:: AbstractOptimizerOptions
+
+   Base class for all optimizer options.
+=#
+abstract AbstractOptimizerOptions
+
+#=doc
+.. function:: normalized_gradient(opts, state, weight, grad)
+
+   :param AbstractOptimizerOptions opts: options for the optimizer, should contain the fields
+          ``grad_scale``, ``grad_clip`` and ``weight_decay``.
+   :param OptimizationState state: the current optimization state.
+   :param NDArray weight: the trainable weights.
+   :param NDArray grad: the original gradient of the weights.
+
+   Get the properly normalized gradient (re-scaled and clipped if necessary).
+=#
+function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState,
+                             weight::NDArray, grad::NDArray)
+  # the user-supplied scale is additionally divided by the mini-batch size
+  grad_scale = opts.grad_scale / state.batch_size
+
+  # rebinds the local name only; the scaled gradient is a new array
+  grad = grad_scale * grad
+  # a non-positive ``grad_clip`` disables clipping
+  if opts.grad_clip > 0
+    grad = clip(grad, -opts.grad_clip, opts.grad_clip)
+  end
+  # the weight decay term is added in place to the rescaled (and possibly clipped) gradient
+  @inplace grad += opts.weight_decay * weight
+
+  return grad
+end
+
+include("optimizers/sgd.jl")
+include("optimizers/adam.jl")
diff --git a/src/random.jl-e b/src/random.jl-e
new file mode 100644
index 000000000000..79a8b6e9e20b
--- /dev/null
+++ b/src/random.jl-e
@@ -0,0 +1,25 @@
+# Fill ``out`` through ``_random_uniform`` (presumably uniform samples between ``low`` and
+# ``high`` -- confirm against libmxnet).
+function rand!(low::Real, high::Real, out::NDArray)
+  _random_uniform(low, high, out)
+end
+# Without an explicit context the new array is created on ``cpu()``.
+function rand{N}(low::Real, high::Real, shape::NTuple{N, Int})
+  rand(low, high, shape, cpu())
+end
+# Allocate an array of the given shape on ``ctx`` and fill it with ``rand!``.
+function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context)
+  out = empty(shape, ctx)
+  rand!(low, high, out)
+end
+
+# Fill ``out`` through ``_random_gaussian`` (presumably normal samples with the given mean
+# and standard deviation -- confirm against libmxnet).
+function randn!(mean::Real, stdvar::Real, out::NDArray)
+  _random_gaussian(mean, stdvar, out)
+end
+# Without an explicit context the new array is created on ``cpu()``.
+function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int})
+  randn(mean, stdvar, shape, cpu())
+end
+# Allocate an array of the given shape on ``ctx`` and fill it with ``randn!``.
+function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context)
+  out = empty(shape, ctx)
+  randn!(mean, stdvar, out)
+end
+
+# Pass the seed on to libmxnet's ``MXRandomSeed``.
+function srand!(seed_state::Int)
+  @mxcall(:MXRandomSeed, (Cint,), seed_state)
+end
diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl
new file mode 100644
index 000000000000..0c3760240844
--- /dev/null
+++ b/src/symbolic-node.jl
@@ -0,0 +1,437 @@
+#=doc
+Symbolic API
+============
+=#
+
+#=doc
+.. class:: SymbolicNode
+
+   SymbolicNode is the basic building block of the symbolic graph in MXNet.jl.
+
+   .. note::
+
+      Throughout this documentation, ``SymbolicNode`` always refers to this :class:`SymbolicNode` type.
+      When we refer to Julia's built-in symbol type (e.g. ``typeof(:foo)``), we always
+      say ``Base.Symbol``.
+=#
+type SymbolicNode
+  handle :: MX_SymbolHandle
+end
+# Let a SymbolicNode be passed wherever an ``MX_handle`` is expected (e.g. in ``@mxcall``
+# argument lists and ``MX_handle[...]`` arrays) by unwrapping its ``handle`` field.
+function Base.unsafe_convert(::Type{MX_handle}, obj::SymbolicNode)
+  Base.unsafe_convert(MX_handle, obj.handle)
+end
+Base.convert(t::Type{MX_handle}, obj::SymbolicNode) = Base.unsafe_convert(t, obj)
+Base.cconvert(t::Type{MX_handle}, obj::SymbolicNode) = Base.unsafe_convert(t, obj)
+
+#=doc
+.. function:: deepcopy(self :: SymbolicNode)
+
+   Make a deep copy of a SymbolicNode.
+=#
+function Base.deepcopy(self :: SymbolicNode)
+  ref_hdr = Ref{MX_handle}(0)
+  @mxcall(:MXSymbolCopy, (MX_handle, Ref{MX_handle}), self, ref_hdr)
+  return SymbolicNode(MX_SymbolHandle(ref_hdr[]))
+end
+
+#=doc
+.. function:: copy(self :: SymbolicNode)
+
+   Make a copy of a SymbolicNode. The same as making a deep copy.
+=#
+function Base.copy(self :: SymbolicNode)
+  Base.deepcopy(self)
+end
+
+# Calling a node composes a deep copy of it with the given inputs (positional or keyword),
+# so the node being called is left unmodified.
+function Base.call(self :: SymbolicNode, args :: SymbolicNode...)
+  s = deepcopy(self)
+  _compose!(s, args...)
+end
+function Base.call(self :: SymbolicNode; kwargs...)
+  s = deepcopy(self)
+  _compose!(s; kwargs...)
+end
+
+# Expands to code that calls the libmxnet listing function ``func_name`` on ``self`` and
+# returns the reported names as ``Base.Symbol``s. Note the expansion contains a ``return``,
+# so it returns from the function the macro is used in.
+macro _list_symbol_info(self, func_name)
+  quote
+    ref_sz = Ref{MX_uint}(0)
+    ref_names = Ref{char_pp}(0)
+    @mxcall($func_name, (MX_handle, Ref{MX_uint}, Ref{char_pp}),
+            $self, ref_sz, ref_names)
+    narg = ref_sz[]
+    names = pointer_to_array(ref_names[], narg)
+    names = [symbol(bytestring(x)) for x in names]
+    return names
+  end
+end
+# List the names of the arguments of this node, as ``Base.Symbol``s.
+function list_arguments(self :: SymbolicNode)
+  @_list_symbol_info(self, :MXSymbolListArguments)
+end
+# List the names of the outputs of this node, as ``Base.Symbol``s.
+function list_outputs(self :: SymbolicNode)
+  @_list_symbol_info(self, :MXSymbolListOutputs)
+end
+"""List all auxiliary states in the symbol.
+
+Auxiliary states are special states of symbols that do not correspond to an argument,
+and do not have gradient. But they can still be useful for specific operations.
+A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm.
+Most operators do not have auxiliary states.
+"""
+function list_auxiliary_states(self :: SymbolicNode)
+  @_list_symbol_info(self, :MXSymbolListAuxiliaryStates)
+end
+
+"Get a new grouped SymbolicNode whose output contains all the internal outputs of this SymbolicNode."
+function get_internals(self :: SymbolicNode)
+  ref_hdr = Ref{MX_handle}(0)
+  @mxcall(:MXSymbolGetInternals, (MX_handle, Ref{MX_handle}), self, ref_hdr)
+  return SymbolicNode(MX_SymbolHandle(ref_hdr[]))
+end
+
+"Create a symbolic variable with the given name"
+function Variable(name :: Union{Base.Symbol, AbstractString})
+  hdr_ref = Ref{MX_handle}(0)
+  @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref)
+  SymbolicNode(MX_SymbolHandle(hdr_ref[]))
+end
+
+"Create a SymbolicNode that groups symbols together"
+function Group(symbols :: SymbolicNode...)
+  handles = MX_handle[symbols...]
+  ref_hdr = Ref{MX_handle}(0)
+  @mxcall(:MXSymbolCreateGroup, (MX_uint, Ptr{MX_handle}, Ref{MX_handle}),
+          length(handles), handles, ref_hdr)
+  SymbolicNode(MX_SymbolHandle(ref_hdr[]))
+end
+
+# Shared body of the two ``infer_shape`` methods below. The quoted code refers to the names
+# ``self``, ``keys``, ``indptr`` and ``sdata`` directly instead of interpolating the macro
+# arguments, so call sites have to use exactly these variable names. The expansion contains
+# ``return`` statements and therefore returns from the function the macro is used in:
+# ``(nothing, nothing, nothing)`` when libmxnet reports the inference as incomplete,
+# otherwise the ``(argument, output, auxiliary)`` shapes, each a ``Vector{Tuple}``.
+macro _infer_shape(self, keys, indptr, sdata)
+  quote
+    ref_arg_shape_size = Ref{MX_uint}(0)
+    ref_arg_shape_ndim = Ref{Ptr{MX_uint}}(0)
+    ref_arg_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0)
+    ref_out_shape_size = Ref{MX_uint}(0)
+    ref_out_shape_ndim = Ref{Ptr{MX_uint}}(0)
+    ref_out_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0)
+    ref_aux_shape_size = Ref{MX_uint}(0)
+    ref_aux_shape_ndim = Ref{Ptr{MX_uint}}(0)
+    ref_aux_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0)
+    ref_complete = Ref{Cint}(0)
+    @mxcall(:MXSymbolInferShape,
+            (MX_handle, MX_uint, char_pp, Ptr{MX_uint}, Ptr{MX_uint},
+             Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}},
+             Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}},
+             Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}},
+             Ref{Cint}),
+            self, length(indptr)-1, keys, indptr, sdata,
+            ref_arg_shape_size, ref_arg_shape_ndim, ref_arg_shape_data,
+            ref_out_shape_size, ref_out_shape_ndim, ref_out_shape_data,
+            ref_aux_shape_size, ref_aux_shape_ndim, ref_aux_shape_data,
+            ref_complete)
+    if ref_complete[] == 0
+      return (nothing, nothing, nothing)
+    else
+      function build_shapes(shape_size::MX_uint, shape_ndim::Ptr{MX_uint}, shape_data::Ptr{Ptr{MX_uint}})
+        shape_ndim = pointer_to_array(shape_ndim, shape_size)
+        shape_data = pointer_to_array(shape_data, shape_size)
+        shapes = map(1:shape_size) do i
+          my_shape = pointer_to_array(shape_data[i], shape_ndim[i])
+          # the dimension order reported by libmxnet is reversed for the Julia side
+          tuple(flipdim(Int[my_shape...],1)...)
+        end
+        convert(Vector{Tuple}, shapes)
+      end
+      return (
+        build_shapes(ref_arg_shape_size[], ref_arg_shape_ndim[], ref_arg_shape_data[]),
+        build_shapes(ref_out_shape_size[], ref_out_shape_ndim[], ref_out_shape_data[]),
+        build_shapes(ref_aux_shape_size[], ref_aux_shape_ndim[], ref_aux_shape_data[])
+      )
+    end
+  end
+end
+# Infer shapes from known argument shapes given by name, e.g. ``infer_shape(node, data=(10,64))``.
+# All shapes are concatenated (each one reversed) into ``sdata``; ``indptr`` records where
+# every shape ends, so shape ``i`` occupies ``sdata[indptr[i]+1 : indptr[i+1]]``.
+function infer_shape(self :: SymbolicNode; kwargs...)
+  sdata = MX_uint[]
+  indptr = MX_uint[0]
+  for (k,v) in kwargs
+    append!(sdata, flipdim([v...],1))
+    push!(indptr, length(sdata))
+  end
+  keys = AbstractString[string(x[1]) for x in kwargs]
+  @_infer_shape(self, keys, indptr, sdata)
+end
+# Infer shapes from argument shapes given by position; pass ``nothing`` for an argument
+# whose shape is not known.
+function infer_shape(self :: SymbolicNode, args :: Union{Tuple, Void}...)
+  sdata = MX_uint[]
+  indptr = MX_uint[0]
+  for arg in args
+    if !isa(arg, Void)
+      append!(sdata, flipdim([arg...],1))
+    end
+    # Always advance ``indptr``, also for ``nothing``: without keys the shapes are matched
+    # to the arguments by position, so an unknown shape has to occupy its slot as an empty
+    # range, otherwise all following shapes would shift onto the wrong arguments.
+    push!(indptr, length(sdata))
+  end
+  keys = Ptr{char_p}(0)
+  @_infer_shape(self, keys, indptr, sdata)
+end
+
+# Pick one output of a node by name; the name must match exactly one entry of ``list_outputs``.
+function Base.getindex(self :: SymbolicNode, idx :: Union{Base.Symbol, AbstractString})
+  idx = symbol(idx)
+  i_idx = find(idx .== list_outputs(self))
+  @assert(length(i_idx) > 0, "Cannot find output with name '$idx'")
+  @assert(length(i_idx) < 2, "Found duplicated output with name '$idx'")
+  Base.getindex(self, i_idx[1])
+end
+# Pick one output of a node by its (1-based) position.
+function Base.getindex(self :: SymbolicNode, idx :: Int)
+  ref_hdr = Ref{MX_handle}(0)
+  # note Julia is 1-based, while MXNet is 0-based
+  @mxcall(:MXSymbolGetOutput, (MX_handle, MX_uint, Ref{MX_handle}), self, idx-1, ref_hdr)
+  return SymbolicNode(MX_SymbolHandle(ref_hdr[]))
+end
+
+import Base: +, .+
+# Sum of nodes, built as a left-to-right chain of binary ``_Plus`` nodes.
+function +(self :: SymbolicNode, args :: SymbolicNode...)
+  ret = self
+  for arg in args
+    ret = _Plus(ret, arg)
+  end
+  ret
+end
+function .+(self :: SymbolicNode, args :: SymbolicNode...)
+  +(self, args...)
+end
+
+import Base: -, .-
+function -(self :: SymbolicNode, arg :: SymbolicNode)
+  _Minus(self, arg)
+end
+function .-(self :: SymbolicNode, arg :: SymbolicNode)
+  -(self, arg)
+end
+
+import Base: .*
+# Elementwise product of nodes, built as a left-to-right chain of binary ``_Mul`` nodes.
+function .*(self :: SymbolicNode, args :: SymbolicNode...)
+  ret = self
+  for arg in args
+    ret = _Mul(ret, arg)
+  end
+  ret
+end
+
+import Base: ./
+function ./(self :: SymbolicNode, arg :: SymbolicNode)
+  _Div(self, arg)
+end
+
+# Compose ``sym`` in place with inputs given as keyword arguments. The keyword ``name`` is
+# not an input: it is passed on as the name of the composed node. Returns ``sym``.
+function _compose!(sym :: SymbolicNode; kwargs...)
+  name = char_p(0)
+  arg_keys = AbstractString[]
+  arg_vals = MX_handle[]
+
+  for (k,v) in kwargs
+    if k == :name
+      name = string(v)
+    else
+      @assert(isa(v, SymbolicNode), "Compose expect `SymbolicNode` as arguments")
+      push!(arg_keys, string(k))
+      push!(arg_vals, v)
+    end
+  end
+
+  @mxcall(:MXSymbolCompose,
+          (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}),
+          sym, name, length(arg_keys), arg_keys, arg_vals)
+  return sym
+end
+# Compose ``sym`` in place with positional inputs and no name (a null name pointer).
+function _compose!(sym :: SymbolicNode, args::SymbolicNode...)
+  _compose!(sym, char_p(0), args...)
+end
+# Compose ``sym`` in place with positional inputs and the given name; a null pointer is
+# passed in place of the argument keys. Returns ``sym``.
+function _compose!(sym :: SymbolicNode, name :: Union{Base.Symbol, char_p}, args::SymbolicNode...)
+  if isa(name, Base.Symbol); name = string(name); end
+  arg_keys = Ptr{char_p}(0)
+  arg_vals = MX_handle[args...]
+
+  @mxcall(:MXSymbolCompose,
+          (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}),
+          sym, name, length(arg_vals), arg_keys, arg_vals)
+  return sym
+end
+
+"""Save SymbolicNode into a JSON string"""
+function to_json(self :: SymbolicNode)
+  ref_json = Ref{char_p}(0)
+  @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json)
+  return bytestring(ref_json[])
+end
+
+"""Load SymbolicNode from a JSON string representation."""
+function from_json(repr :: AbstractString, ::Type{SymbolicNode})
+  ref_hdr = Ref{MX_handle}(0)
+  @mxcall(:MXSymbolCreateFromJSON, (char_p, Ref{MX_handle}), repr, ref_hdr)
+  return SymbolicNode(MX_SymbolHandle(ref_hdr[]))
+end
+
+"""Load SymbolicNode from a JSON file."""
+function load(filename :: AbstractString, ::Type{SymbolicNode})
+  ref_hdr = Ref{MX_handle}(0)
+  @mxcall(:MXSymbolCreateFromFile, (char_p, Ref{MX_handle}), filename, ref_hdr)
+  return SymbolicNode(MX_SymbolHandle(ref_hdr[]))
+end
+# Save a SymbolicNode to a file through ``MXSymbolSaveToFile``.
+function save(filename :: AbstractString, sym :: SymbolicNode)
+  @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), sym, filename)
+end
+
+#=doc
+libmxnet APIs
+-------------
+
+**autogen:EMBED:SymbolicNode:EMBED:autogen**
+=#
+################################################################################
+# Atomic SymbolicNode functions dynamically imported from libmxnet
+################################################################################
+# Define (via ``eval``) the Julia function that creates the atomic symbol behind ``hdr``.
+# With ``gen_docs=true`` nothing is defined; ``(func_name, docstring)`` is returned instead.
+function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false)
+  ref_name = Ref{char_p}(0)
+  ref_desc = Ref{char_p}(0)
+  ref_kv_nargs = Ref{char_p}(0)
+  ref_nargs = Ref{MX_uint}(0)
+  ref_arg_names = Ref{char_pp}(0)
+  ref_arg_types = Ref{char_pp}(0)
+  ref_arg_descs = Ref{char_pp}(0)
+
+  @mxcall(:MXSymbolGetAtomicSymbolInfo,
+          (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp},
+           Ref{char_pp}, Ref{char_p}),
+          hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, ref_kv_nargs)
+
+  func_name = symbol(bytestring(ref_name[]))
+  # Rendered once, outside the quote below: a ``"$func_name ..."`` literal inside the quoted
+  # body would be interpolated when the generated function runs, where no variable called
+  # ``func_name`` exists.
+  func_name_s = string(func_name)
+  # A non-empty ``kv_nargs`` is the name of the parameter that carries the number of
+  # positional inputs, i.e. the operator takes a variable number of SymbolicNode inputs.
+  kv_nargs_s = bytestring(ref_kv_nargs[])
+  kv_nargs = symbol(kv_nargs_s)
+
+  if gen_docs
+    f_desc = bytestring(ref_desc[]) * "\n\n"
+    if !isempty(kv_nargs_s)
+      f_desc *= "This function support variable length positional :class:`SymbolicNode` inputs.\n\n"
+    end
+    f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs)
+    f_desc *= ":param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional.\n\n"
+    f_desc *= ":return: the constructed :class:`SymbolicNode`.\n\n"
+    return (func_name, f_desc)
+  end
+
+  # function $func_name(args...; kwargs...)
+  func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args))
+  func_body = quote
+    idx = findfirst(x -> x[1] == :name, kwargs)
+    if idx > 0
+      name = kwargs[idx][2]
+    else
+      name = ""
+    end
+
+    param_keys = AbstractString[]
+    param_vals = AbstractString[]
+    symbol_kws = Dict{Base.Symbol, SymbolicNode}()
+
+    # SymbolicNode keyword arguments are inputs; every other keyword (except ``name``)
+    # is an operator parameter and is passed on as a string
+    for (k,v) in kwargs
+      if k == :name; continue; end
+      if isa(v, SymbolicNode)
+        symbol_kws[k] = v
+      else
+        push!(param_keys, string(k))
+        push!(param_vals, dump_mx_param(v))
+      end
+    end
+
+    if length(args) != 0 && length(symbol_kws) != 0
+      @assert(false, $func_name_s * " only accepts Symbols either as positional or keyword arguments, not both.")
+    end
+    $(if kv_nargs != symbol("")
+      quote
+        if length(symbol_kws) > 0
+          @assert(false, $func_name_s * " takes variable number of SymbolicNode arguments, please pass input Symbols " *
+                         "via positional arguments, instead of keyword arguments.")
+        end
+        # Fill in the number of positional inputs unless the caller gave it explicitly.
+        # This has to run after the keyword arguments were collected above, otherwise
+        # ``param_keys`` is still empty and the check can never find the key.
+        if !in($kv_nargs_s, param_keys)
+          push!(param_keys, $kv_nargs_s)
+          push!(param_vals, string(length(args)))
+        end
+      end
+    end)
+
+    # create the SymbolicNode
+    ref_sym_hdr = Ref{MX_handle}()
+    @mxcall(:MXSymbolCreateAtomicSymbol,
+            (MX_handle, MX_uint, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}),
+            $hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr)
+    sym_hdr = ref_sym_hdr[]
+
+    sym = SymbolicNode(MX_SymbolHandle(sym_hdr))
+    hint = lowercase(string($func_name))
+    name = get!(DEFAULT_NAME_MANAGER, name, hint)
+
+    if length(args) != 0
+      _compose!(sym, name, args...)
+    else
+      _compose!(sym; name=name, symbol_kws...)
+    end
+
+    return sym
+  end
+
+  func_def = Expr(:function, func_head, Expr(:block, func_body))
+  eval(func_def)
+end
+
+# Define a creator function for every atomic symbol listed by libmxnet. With
+# ``gen_docs=true`` nothing is defined and a ``Dict`` from function name to docstring is
+# returned instead.
+function _import_atomic_symbol_creators(;gen_docs=false)
+  n_ref = Ref{MX_uint}(0)
+  h_ref = Ref{Ptr{MX_handle}}(0)
+  @mxcall(:MXSymbolListAtomicSymbolCreators, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref)
+
+  n_creators = n_ref[]
+  h_creators = pointer_to_array(h_ref[], n_creators)
+
+  if gen_docs
+    docs = Dict{Base.Symbol, AbstractString}()
+  end
+
+  for i = 1:n_creators
+    creator_hdr = h_creators[i]
+    ret = _define_atomic_symbol_creator(creator_hdr, gen_docs=gen_docs)
+    if gen_docs
+      docs[ret[1]] = ret[2]
+    end
+  end
+
+  if gen_docs
+    return docs
+  end
+end
+
+################################################################################
+# Utility macros to chain up symbols
+################################################################################
+macro chain(layers)
+  exprs = []
+  last_layer = nothing
+  function _chain_layer(layer, last_layer)
+    if isa(last_layer, Void)
+      esc(layer)
+    else
+      @assert(isa(layer, Expr) && layer.head == :call, "Do not know how to chain up $layer")
+      return Expr(:call, esc(layer.args[1]), last_layer, map(esc, layer.args[2:end])...)
+    end
+  end
+  while true
+    if layers.head == :(=>)
+      new_layer = gensym()
+      push!(exprs, :($new_layer = $(_chain_layer(layers.args[1], last_layer))))
+      last_layer = new_layer
+      layers = layers.args[2]
+    else
+      push!(exprs, _chain_layer(layers, last_layer))
+      break
+    end
+  end
+  return Expr(:block, exprs...)
+end + diff --git a/src/node.jl b/src/symbolic-node.jl-e similarity index 100% rename from src/node.jl rename to src/symbolic-node.jl-e diff --git a/src/util.jl-e b/src/util.jl-e new file mode 100644 index 000000000000..4ca613cbf7d1 --- /dev/null +++ b/src/util.jl-e @@ -0,0 +1,70 @@ +################################################################################ +# Dataset related utilities +################################################################################ +function get_data_dir() + data_dir = joinpath(Pkg.dir("MXNet"), "data") + mkpath(data_dir) + data_dir +end + +function get_mnist_ubyte() + data_dir = get_data_dir() + mnist_dir = joinpath(data_dir, "mnist") + mkpath(mnist_dir) + filenames = Dict(:train_data => "train-images-idx3-ubyte", + :train_label => "train-labels-idx1-ubyte", + :test_data => "t10k-images-idx3-ubyte", + :test_label => "t10k-labels-idx1-ubyte") + filenames = [k => joinpath(mnist_dir, v) for (k,v) in filenames] + if !all(isfile, values(filenames)) + cd(mnist_dir) do + run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip`) + run(`unzip -u mnist.zip`) + end + end + return filenames +end + +function get_cifar10() + data_dir = get_data_dir() + cifar10_dir = joinpath(data_dir, "cifar10") + mkpath(cifar10_dir) + filenames = Dict(:train => "cifar/train.rec", :test => "cifar/test.rec") + filenames = [k => joinpath(cifar10_dir, v) for (k,v) in filenames] + if !all(isfile, values(filenames)) + cd(cifar10_dir) do + run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/cifar10.zip`) + run(`unzip -u cifar10.zip`) + end + end + + filenames[:mean] = joinpath(cifar10_dir, "cifar/cifar_mean.bin") + return filenames +end + + +################################################################################ +# Internal Utilities +################################################################################ +const DOC_EMBED_ANCHOR = "**autogen:EMBED:{1}:EMBED:autogen**" +function _format_docstring(narg::Int, arg_names::Ref{char_pp}, 
arg_types::Ref{char_pp}, arg_descs::Ref{char_pp}, remove_dup::Bool=true) + param_keys = Set{AbstractString}() + + arg_names = pointer_to_array(arg_names[], narg) + arg_types = pointer_to_array(arg_types[], narg) + arg_descs = pointer_to_array(arg_descs[], narg) + docstrings = AbstractString[] + + for i = 1:narg + arg_name = bytestring(arg_names[i]) + if arg_name ∈ param_keys && remove_dup + continue + end + push!(param_keys, arg_name) + + arg_type = bytestring(arg_types[i]) + arg_desc = bytestring(arg_descs[i]) + push!(docstrings, ":param $arg_name: $arg_desc\n:type $arg_name: $arg_type\n\n") + end + return join(docstrings, "\n") +end diff --git a/test/unittest/node.jl b/test/unittest/symbolic-node.jl similarity index 90% rename from test/unittest/node.jl rename to test/unittest/symbolic-node.jl index f7e9b51e60f0..33948adfcd40 100644 --- a/test/unittest/node.jl +++ b/test/unittest/symbolic-node.jl @@ -1,4 +1,4 @@ -module TestNode +module TestSymbolicNode using MXNet using Base.Test @@ -8,7 +8,7 @@ using ..Main: mlp2 # Test Implementations ################################################################################ function test_basic() - info("Node::basic") + info("SymbolicNode::basic") model = mlp2() @test mx.list_arguments(model) == [:data,:fc1_weight,:fc1_bias,:fc2_weight,:fc2_bias] @@ -17,7 +17,7 @@ function test_basic() end function test_internal() - info("Node::internal") + info("SymbolicNode::internal") data = mx.Variable(:data) oldfc = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) @@ -31,7 +31,7 @@ function test_internal() end function test_compose() - info("Node::compose") + info("SymbolicNode::compose") data = mx.Variable(:data) net1 = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) @@ -47,7 +47,7 @@ function test_compose() end function test_infer_shape() - info("Node::infer_shape::mlp2") + info("SymbolicNode::infer_shape::mlp2") model = mlp2() data_shape = (100, 100) @@ -61,7 +61,7 @@ function test_infer_shape() end function 
test_infer_shape_error() - info("Node::infer_shape::throws") + info("SymbolicNode::infer_shape::throws") model = mlp2() weight_shape = (100, 1) @@ -70,12 +70,12 @@ function test_infer_shape_error() end function test_saveload() - info("Node::saveload::mlp2") + info("SymbolicNode::saveload::mlp2") model = mlp2() fname = tempname() mx.save(fname, model) - model2 = mx.load(fname, mx.Node) + model2 = mx.load(fname, mx.SymbolicNode) @test mx.to_json(model) == mx.to_json(model2) rm(fname) From aab8784c12724e39976e5ac597b895ede55e5629 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 15:25:17 -0500 Subject: [PATCH 186/630] upate doc for refactoring --- docs/api/executor.rst | 6 +- docs/api/io.rst | 2 +- docs/api/model.rst | 2 +- docs/api/{symbol.rst => symbolic-node.rst} | 132 ++-- docs/build-api.jl | 4 +- docs/index.rst | 2 +- src/MXNet.jl-e | 35 - src/base.jl-e | 212 ------ src/callback.jl-e | 142 ---- src/context.jl-e | 44 -- src/executor.jl-e | 197 ----- src/initializer.jl-e | 117 --- src/io.jl-e | 641 ----------------- src/kvstore.jl-e | 132 ---- src/metric.jl-e | 37 - src/model.jl-e | 566 --------------- src/name.jl-e | 44 -- src/ndarray.jl-e | 800 --------------------- src/optimizer.jl-e | 226 ------ src/random.jl-e | 25 - src/symbolic-node.jl | 2 +- src/symbolic-node.jl-e | 437 ----------- src/util.jl-e | 70 -- 23 files changed, 75 insertions(+), 3800 deletions(-) rename docs/api/{symbol.rst => symbolic-node.rst} (69%) delete mode 100644 src/MXNet.jl-e delete mode 100644 src/base.jl-e delete mode 100644 src/callback.jl-e delete mode 100644 src/context.jl-e delete mode 100644 src/executor.jl-e delete mode 100644 src/initializer.jl-e delete mode 100644 src/io.jl-e delete mode 100644 src/kvstore.jl-e delete mode 100644 src/metric.jl-e delete mode 100644 src/model.jl-e delete mode 100644 src/name.jl-e delete mode 100644 src/ndarray.jl-e delete mode 100644 src/optimizer.jl-e delete mode 100644 src/random.jl-e delete mode 100644 src/symbolic-node.jl-e 
delete mode 100644 src/util.jl-e diff --git a/docs/api/executor.rst b/docs/api/executor.rst index 8887d4ce1d24..69c78137cd0e 100644 --- a/docs/api/executor.rst +++ b/docs/api/executor.rst @@ -7,7 +7,7 @@ Executor .. class:: Executor - An executor is a realization of a symbolic architecture defined by a :class:`Symbol`. + An executor is a realization of a symbolic architecture defined by a :class:`SymbolicNode`. The actual forward and backward computation specified by the network architecture can be carried out with an executor. @@ -16,9 +16,9 @@ Executor .. function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) - Create an :class:`Executor` by binding a :class:`Symbol` to concrete :class:`NDArray`. + Create an :class:`Executor` by binding a :class:`SymbolicNode` to concrete :class:`NDArray`. - :param Symbol sym: the network architecture describing the computation graph. + :param SymbolicNode sym: the network architecture describing the computation graph. :param Context ctx: the context on which the computation should run. :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete arrays for all the inputs in the network architecture. The inputs typically include diff --git a/docs/api/io.rst b/docs/api/io.rst index a7568a7b6f71..e9d9c04e9f3c 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -36,7 +36,7 @@ and split it into mini-batches so that the model can consume the data in a unifo training stage, both *data* and *label* will be feeded into the model, while during prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and of any shapes. The provided data and label names here should match the input names in a target - :class:`Symbol`. + :class:`SymbolicNode`. A data provider should also implement the Julia iteration interface, in order to allow iterating through the data set. 
The provider will be called in the following way: diff --git a/docs/api/model.rst b/docs/api/model.rst index ab330db9bcfa..d5245614061b 100644 --- a/docs/api/model.rst +++ b/docs/api/model.rst @@ -26,7 +26,7 @@ a network described using the symbolic API. -.. function:: FeedForward(arch :: Symbol, ctx) +.. function:: FeedForward(arch :: SymbolicNode, ctx) :param arch: the architecture of the network constructed using the symbolic API. :param ctx: the devices on which this model should do computation. It could be a single :class:`Context` diff --git a/docs/api/symbol.rst b/docs/api/symbolic-node.rst similarity index 69% rename from docs/api/symbol.rst rename to docs/api/symbolic-node.rst index e01ecb35980d..9386c10a8614 100644 --- a/docs/api/symbol.rst +++ b/docs/api/symbolic-node.rst @@ -5,29 +5,29 @@ Symbolic API -.. class:: Symbol +.. class:: SymbolicNode - Symbol is the basic building block of the symbolic graph in MXNet.jl. + SymbolicNode is the basic building block of the symbolic graph in MXNet.jl. .. note:: - Throughout this documentation, ``Symbol`` always refer to this :class:`Symbol` type. - When we refer to the Julia's build-in symbol type (e.g. ``typeof(:foo)``), we always + Throughout this documentation, ``SymbolicNode`` always refer to this :class:`SymbolicNode` type. + When we refer to the Julia's build-in SymbolicNode type (e.g. ``typeof(:foo)``), we always say ``Base.Symbol``. -.. function:: deepcopy(self :: Symbol) +.. function:: deepcopy(self :: SymbolicNode) - Make a deep copy of a symbol. + Make a deep copy of a SymbolicNode. -.. function:: copy(self :: Symbol) +.. function:: copy(self :: SymbolicNode) - Make a copy of a symbol. The same as making a deep copy. + Make a copy of a SymbolicNode. The same as making a deep copy. @@ -48,9 +48,9 @@ Public APIs :param act_type: Activation function to be applied. :type act_type: {'relu', 'sigmoid', 'tanh'}, required - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. 
+ :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -71,9 +71,9 @@ Public APIs :param momentum: Momentum for moving average :type momentum: float, optional, default=0.1 - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -86,9 +86,9 @@ Public APIs :param data: Input data. :type data: Symbol - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -98,14 +98,14 @@ Public APIs Perform an feature concat on channel dim (dim 1) over all the inputs. - This function support variable length positional :class:`Symbol` inputs. + This function support variable length positional :class:`SymbolicNode` inputs. :param num_args: Number of inputs to be concated. :type num_args: int, required - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -154,9 +154,9 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=False - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -205,9 +205,9 @@ Public APIs :param no_bias: Whether to disable bias parameter. 
:type no_bias: boolean, optional, default=True - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -224,9 +224,9 @@ Public APIs :param p: Fraction of the input that gets dropped out at training time :type p: float, optional, default=0.5 - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -236,14 +236,14 @@ Public APIs Perform an elementwise sum over all the inputs. - This function support variable length positional :class:`Symbol` inputs. + This function support variable length positional :class:`SymbolicNode` inputs. :param num_args: Number of inputs to be sumed. :type num_args: int, required - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -256,9 +256,9 @@ Public APIs :param data: Input data to flatten. :type data: Symbol - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -287,9 +287,9 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=False - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. 
+ :return: the constructed :class:`SymbolicNode`. @@ -318,9 +318,9 @@ Public APIs :param nsize: normalization window width in elements. :type nsize: int (non-negative), required - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -349,9 +349,9 @@ Public APIs :param upper_bound: Upper bound of random slope. (For rrelu only) :type upper_bound: float, optional, default=0.334 - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -368,9 +368,9 @@ Public APIs :param label: Input label to function. :type label: Symbol - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -388,9 +388,9 @@ Public APIs :param label: Input label to function. :type label: Symbol - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -419,9 +419,9 @@ Public APIs :param pad: pad for pooling: (y, x) :type pad: Shape(tuple), optional, default=(0, 0) - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. 
@@ -438,9 +438,9 @@ Public APIs :param target_shape: Target new shape :type target_shape: Shape(tuple), required - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -453,9 +453,9 @@ Public APIs :param num_outputs: Number of outputs to be sliced. :type num_outputs: int, required - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -476,9 +476,9 @@ Public APIs :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -499,9 +499,9 @@ Public APIs :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -514,9 +514,9 @@ Public APIs :param src: Source symbolic input to the function :type src: Symbol - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. 
`:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -529,9 +529,9 @@ Public APIs :param src: Source symbolic input to the function :type src: Symbol - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -544,9 +544,9 @@ Public APIs :param src: Source symbolic input to the function :type src: Symbol - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -559,9 +559,9 @@ Public APIs :param src: Source symbolic input to the function :type src: Symbol - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -577,9 +577,9 @@ Internal APIs Perform an elementwise div. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -589,9 +589,9 @@ Internal APIs Perform an elementwise minus. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -601,9 +601,9 @@ Internal APIs Perform an elementwise mul. - :param Base.Symbol name: The name of the symbol. (e.g. 
`:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -620,9 +620,9 @@ Internal APIs :param need_top_grad: Whether this layer needs out grad for backward. Should be false for loss layers. :type need_top_grad: boolean, optional, default=True - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. @@ -632,9 +632,9 @@ Internal APIs Perform an elementwise plus. - :param Base.Symbol name: The name of the symbol. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. - :return: the constructed :class:`Symbol`. + :return: the constructed :class:`SymbolicNode`. diff --git a/docs/build-api.jl b/docs/build-api.jl index b70c480c9d79..510426ee2004 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -79,8 +79,8 @@ extract_doc("context.rst", "context.jl") extract_doc("ndarray.rst", "ndarray.jl") embed_mxnet_api("ndarray.rst", "ndarray", mx._import_ndarray_functions) -extract_doc("symbol.rst", "symbol.jl") -embed_mxnet_api("symbol.rst", "symbol", mx._import_atomic_symbol_creators) +extract_doc("symbolic-node.rst", "symbolic-node.jl") +embed_mxnet_api("symbolic-node.rst", "symbolic-node", mx._import_atomic_symbol_creators) extract_doc("executor.rst", "executor.jl") diff --git a/docs/index.rst b/docs/index.rst index 7520047db11a..6203ad3a1af4 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -38,7 +38,7 @@ For more details, see documentation below. 
Please also checkout the `examples api/callback api/io api/ndarray - api/symbol + api/symbolic-node api/executor Indices and tables diff --git a/src/MXNet.jl-e b/src/MXNet.jl-e deleted file mode 100644 index f9f9e8664c4f..000000000000 --- a/src/MXNet.jl-e +++ /dev/null @@ -1,35 +0,0 @@ -__precompile__() - -module MXNet - -# we put everything in the namespace mx, because there are a lot of -# functions with the same names as built-in utilities like "zeros", etc. -export mx -module mx -using Formatting - -include("base.jl") -include("context.jl") - -include("ndarray.jl") -include("random.jl") - -include("name.jl") -include("symbolic-node.jl") -include("executor.jl") - -include("metric.jl") -include("optimizer.jl") -include("initializer.jl") - -include("io.jl") -include("kvstore.jl") - -include("callback.jl") -include("model.jl") - -include("util.jl") - -end # mx - -end # module MXNet diff --git a/src/base.jl-e b/src/base.jl-e deleted file mode 100644 index 0988400b9d31..000000000000 --- a/src/base.jl-e +++ /dev/null @@ -1,212 +0,0 @@ -"Exception thrown when an error occurred calling MXNet API." 
-immutable MXError <: Exception - msg :: AbstractString -end - -################################################################################ -# Common types used in MXNet API -################################################################################ -typealias MX_uint Cuint -typealias MX_float Cfloat -typealias MX_handle Ptr{Void} - -typealias char_p Ptr{UInt8} -typealias char_pp Ptr{char_p} - -################################################################################ -# Initialization and library API entrance -################################################################################ -const MXNET_LIB = Libdl.find_library(["libmxnet.so","libmxnet.dll"], - [joinpath("$(get(ENV,"MXNET_HOME",""))","lib"), - joinpath(Pkg.dir("MXNet"),"deps/usr/lib")]) -if isempty(MXNET_LIB) - # touch this file, so that after the user properly build libmxnet, the precompiled - # MXNet.ji will be re-compiled to get MXNET_LIB properly. - touch(@__FILE__) - error("Cannot find or load libmxnet.so. Please see the document on how to build it.") -end - -function __init__() - _import_ndarray_functions() - _import_atomic_symbol_creators() - _import_io_iterators() - - atexit() do - # notify libmxnet we are shutting down - ccall( ("MXNotifyShutdown", MXNET_LIB), Cint, () ) - end -end - -function mx_get_last_error() - msg = ccall( ("MXGetLastError", MXNET_LIB), char_p, () ) - if msg == C_NULL - throw(MXError("Failed to get last error message")) - end - return bytestring(msg) -end - -"Utility macro to call MXNet API functions" -macro mxcall(fv, argtypes, args...) - f = eval(fv) - args = map(esc, args) - quote - _mxret = ccall( ($(Meta.quot(f)), $MXNET_LIB), - Cint, $argtypes, $(args...) 
) - if _mxret != 0 - err_msg = mx_get_last_error() - throw(MXError(err_msg)) - end - end -end - -################################################################################ -# Handle types -################################################################################ -macro mx_define_handle_t(name, destructor) - name = esc(name) - quote - type $name - value :: MX_handle - - function $name(value = C_NULL) - hdr = new(value) - - $(if destructor != :nop - :(finalizer(hdr, delete!)) - end) - - return hdr - end - end - - $(if finalizer != :nop - quote - function delete!(h :: $name) - if h.value != C_NULL - @mxcall($(Meta.quot(destructor)), (MX_handle,), h.value) - h.value = C_NULL - end - end - end - end) - - function Base.unsafe_convert(::Type{MX_handle}, obj::$name) - obj.value - end - Base.convert(t::Type{MX_handle}, obj::$name) = Base.unsafe_convert(t, obj) - Base.cconvert(t::Type{MX_handle}, obj::$name) = Base.unsafe_convert(t, obj) - - function Base.isnull(obj::$name) obj.value == C_NULL end - end -end - -@mx_define_handle_t(MX_NDArrayHandle, MXNDArrayFree) -@mx_define_handle_t(MX_FunctionHandle, nop) -@mx_define_handle_t(MX_SymbolHandle, MXSymbolFree) -@mx_define_handle_t(MX_ExecutorHandle, MXExecutorFree) -@mx_define_handle_t(MX_DataIterHandle, MXDataIterFree) -@mx_define_handle_t(MX_KVStoreHandle, MXKVStoreFree) - -################################################################################ -# MXNet Params -# -# MXNet API use string to pass some common parameters like the configurations -# when defining layers. Typically, it is enough to use string(obj) to get a -# recognizable representation for libmxnet. However, there is currently a -# caveat: -# -# Because Julia use column-major ordering for tensors. In order to properly -# interact with Julia Arrays, the shape will look "reversed" from the Julia -# side. 
For example, a typical MNIST mini-batch tensor is of shape (28,28,1,100) -# from Julia side, while the shape information for the same piece of memory -# should be interpreted as (100,1,28,28) from C/C++/Python side. -# -# Therefore, when passing parameters to libmxnet, we should reverse the shape -# parameter. For example, when the user specify a non-square kernel size for -# a convolution or pooling layer. Unfortunately, those operators are automatically -# imported, and information about the type of each parameter is somehow limited. -# One hacky way is to match the type description for the string "Shape(tuple)" -# when importing operators. But currently we simply decided to reverse **all** -# NTuple{N, Int} passed to libmxnet. -# -# TODO: find a better solution in case this cause issues in the future. -################################################################################ -function dump_mx_param(val :: Any) - string(val) -end -function dump_mx_param{N,T<:Integer}(shape :: NTuple{N, T}) - string(tuple(flipdim([shape...],1)...)) -end - -"""A convenient macro copied from Mocha.jl that could be used to define structs -with default values and type checks. For example -```julia -@defstruct MyStruct Any ( - field1 :: Int = 0, - (field2 :: AbstractString = "", !isempty(field2)) -) -``` -where each field could be either -```julia -field_name :: field_type = default_value -``` -or put within a tuple, with the second element -specifying a validation check on the field value. -In the example above, the default value for -field2 does not satisfy the assertion, this -could be used to force user to provide a -valid value when no meaningful default value -is available. - -The macro will define a constructor that could accept -the keyword arguments. 
-""" -macro defstruct(name, super_name, fields) - @assert fields.head == :tuple - fields = fields.args - @assert length(fields) > 0 - name = esc(name) - super_name = esc(super_name) - - field_defs = Array(Expr, length(fields)) # :(field2 :: Int) - field_names = Array(Expr, length(fields)) # :field2 - field_defaults = Array(Expr, length(fields)) # :(field2 = 0) - field_types = Array(Expr, length(fields)) # Int - field_asserts = Array(Expr, length(fields)) # :(field2 >= 0) - - for i = 1:length(fields) - field = fields[i] - if field.head == :tuple - field_asserts[i] = esc(field.args[2]) - field = field.args[1] - end - field_defs[i] = esc(field.args[1]) - field_names[i] = esc(field.args[1].args[1]) - field_types[i] = esc(field.args[1].args[2]) - field_defaults[i] = Expr(:kw, field.args[1].args[1], esc(field.args[2])) - end - - # body of layer type, defining fields - type_body = Expr(:block, field_defs...) - - # constructor - converts = map(zip(field_names, field_types)) do param - f_name, f_type = param - :($f_name = convert($f_type, $f_name)) - end - asserts = map(filter(i -> isdefined(field_asserts,i), 1:length(fields))) do i - :(@assert($(field_asserts[i]))) - end - construct = Expr(:call, name, field_names...) - ctor_body = Expr(:block, converts..., asserts..., construct) - ctor_def = Expr(:call, name, Expr(:parameters, field_defaults...)) - ctor = Expr(:(=), ctor_def, ctor_body) - - quote - type $(name) <: $super_name - $type_body - end - - $ctor - end -end diff --git a/src/callback.jl-e b/src/callback.jl-e deleted file mode 100644 index 9f3d85b576ff..000000000000 --- a/src/callback.jl-e +++ /dev/null @@ -1,142 +0,0 @@ -#=doc -Callbacks in training -===================== -=# - -#=doc -.. class:: AbstractCallback - - Abstract type of callback functions used in training. -=# -abstract AbstractCallback - -#=doc -.. class:: AbstractBatchCallback - - Abstract type of callbacks to be called every mini-batch. 
-=# -abstract AbstractBatchCallback <: AbstractCallback - -#=doc -.. class:: AbstractEpochCallback - - Abstract type of callbacks to be called every epoch. -=# -abstract AbstractEpochCallback <: AbstractCallback - -type BatchCallback <: AbstractBatchCallback - frequency :: Int - call_on_0 :: Bool - callback :: Function -end - -#=doc -.. function:: every_n_batch(callback :: Function, n :: Int; call_on_0 = false) - - A convenient function to construct a callback that runs every ``n`` mini-batches. - - :param Int call_on_0: keyword argument, default false. Unless set, the callback - will **not** be run on batch 0. - - For example, the :func:`speedometer` callback is defined as - - .. code-block:: julia - - every_n_iter(frequency, call_on_0=true) do state :: OptimizationState - if state.curr_batch == 0 - # reset timer - else - # compute and print speed - end - end - - :seealso: :func:`every_n_epoch`, :func:`speedometer`. -=# -function every_n_batch(callback :: Function, n :: Int; call_on_0 :: Bool = false) - BatchCallback(n, call_on_0, callback) -end -function Base.call(cb :: BatchCallback, state :: OptimizationState) - if state.curr_batch == 0 - if cb.call_on_0 - cb.callback(state) - end - elseif state.curr_batch % cb.frequency == 0 - cb.callback(state) - end -end - -#=doc -.. function:: speedometer(; frequency=50) - - Create an :class:`AbstractBatchCallback` that measure the training speed - (number of samples processed per second) every k mini-batches. - - :param Int frequency: keyword argument, default 50. The frequency (number of - min-batches) to measure and report the speed. 
-=# -function speedometer(;frequency::Int=50) - cl_tic = 0 - every_n_batch(frequency, call_on_0=true) do state :: OptimizationState - if state.curr_batch == 0 - # reset timer - cl_tic = time() - else - speed = frequency * state.batch_size / (time() - cl_tic) - info(format("Speed: {1:>6.2f} samples/sec", speed)) - cl_tic = time() - end - end -end - - -type EpochCallback <: AbstractEpochCallback - frequency :: Int - call_on_0 :: Bool - callback :: Function -end - -#=doc -.. function:: every_n_epoch(callback :: Function, n :: Int; call_on_0 = false) - - A convenient function to construct a callback that runs every ``n`` full data-passes. - - :param Int call_on_0: keyword argument, default false. Unless set, the callback - will **not** be run on epoch 0. Epoch 0 means no training has been performed - yet. This is useful if you want to inspect the randomly initialized model - that has not seen any data yet. - - :seealso: :func:`every_n_iter`. -=# -function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) - EpochCallback(n, call_on_0, callback) -end -function Base.call(cb :: EpochCallback, model :: Any, state :: OptimizationState) - if state.curr_epoch == 0 - if cb.call_on_0 - cb.callback(model, state) - end - elseif state.curr_epoch % cb.frequency == 0 - cb.callback(model, state) - end -end - -#=doc -.. function:: do_checkpoint(prefix; frequency=1, save_epoch_0=false) - - Create an :class:`AbstractEpochCallback` that save checkpoints of the model to disk. - The checkpoints can be loaded back later on. - - :param AbstractString prefix: the prefix of the filenames to save the model. The model - architecture will be saved to prefix-symbol.json, while the weights will be saved - to prefix-0012.params, for example, for the 12-th epoch. - :param Int frequency: keyword argument, default 1. The frequency (measured in epochs) to - save checkpoints. - :param Bool save_epoch_0: keyword argument, default false. 
Whether we should save a - checkpoint for epoch 0 (model initialized but not seen any data yet). -=# -function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) - mkpath(dirname(prefix)) - every_n_epoch(frequency, call_on_0=save_epoch_0) do model, state - save_checkpoint(model, prefix, state) - end -end diff --git a/src/context.jl-e b/src/context.jl-e deleted file mode 100644 index 1e96c305fb04..000000000000 --- a/src/context.jl-e +++ /dev/null @@ -1,44 +0,0 @@ -#=doc -Context -======= -=# -@enum CONTEXT_TYPE CPU=1 GPU=2 CPU_PINNED=3 - -#=doc -.. class:: Context - - A context describes the device type and id on which computation should be carried on. -=# -immutable Context - device_type :: CONTEXT_TYPE - device_id :: Int -end -Context(dev_type :: Union{CONTEXT_TYPE, Int}, dev_id :: Int = 0) = - Context(convert(CONTEXT_TYPE, dev_type), dev_id) - -function Base.show(io :: IO, ctx :: Context) - print(io, "$(ctx.device_type)$(ctx.device_id)") -end - -#=doc -.. function:: cpu(dev_id=0) - - :param Int dev_id: the CPU id. - - Get a CPU context with a specific id. ``cpu()`` is usually the default context for many - operations when no context is specified. -=# -function cpu(dev_id::Int=0) - return Context(CPU, dev_id) -end - -#=doc -.. function:: gpu(dev_id=0) - - :param Int dev_id: the GPU device id. - - Get a GPU context with a specific id. The K GPUs on a node is typically numbered as 0,...,K-1. -=# -function gpu(dev_id::Int=0) - return Context(GPU, dev_id) -end diff --git a/src/executor.jl-e b/src/executor.jl-e deleted file mode 100644 index 6dea17763101..000000000000 --- a/src/executor.jl-e +++ /dev/null @@ -1,197 +0,0 @@ -#=doc -Executor -======== -=# - -#=doc -.. class:: Executor - - An executor is a realization of a symbolic architecture defined by a :class:`Node`. - The actual forward and backward computation specified by the network architecture can - be carried out with an executor. 
-=# -type Executor - handle :: MX_ExecutorHandle - symbol :: Node - arg_arrays :: Vector{NDArray} - grad_arrays :: Vector{Union{Void,NDArray}} - aux_arrays :: Vector{NDArray} - outputs :: Vector{NDArray} - arg_dict :: Dict{Base.Symbol, NDArray} - aux_dict :: Dict{Base.Symbol, NDArray} -end -function Executor(hdr :: MX_ExecutorHandle, symbol :: Node, - arg_arrays :: Vector{NDArray}, grad_arrays :: Vector{Union{Void,NDArray}}, - aux_arrays :: Vector{NDArray}) - # get output arrays - ref_size = Ref{MX_uint}(0) - ref_hdrs = Ref{Ptr{MX_handle}}(0) - @mxcall(:MXExecutorOutputs, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_handle}}), - hdr, ref_size, ref_hdrs) - out_hdrs = pointer_to_array(ref_hdrs[], ref_size[]) - out_arrays = [NDArray(MX_NDArrayHandle(x)) for x in out_hdrs] - - arg_names = list_arguments(symbol) - @assert(length(arg_names) == length(unique(arg_names)), "Duplicated names in arguments: $arg_names") - arg_dict = Dict{Base.Symbol,NDArray}(zip(arg_names, arg_arrays)) - - aux_names = list_auxiliary_states(symbol) - @assert(length(aux_names) == length(unique(aux_names)), "Duplicated names in auxiliary states: $aux_names") - aux_dict = Dict{Base.Symbol,NDArray}(zip(aux_names, aux_arrays)) - - Executor(hdr, symbol, arg_arrays, grad_arrays, aux_arrays, out_arrays, arg_dict, aux_dict) -end - -function Base.unsafe_convert(::Type{MX_handle}, obj::Executor) - Base.unsafe_convert(MX_handle, obj.handle) -end -Base.convert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) -Base.cconvert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) - -function _get_ndarray_inputs(arg_key::AbstractString, args::Vector{NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) - @assert(length(args) == length(arg_names), "Length of $arg_key does not match number of arguments") - return (MX_handle[args...], args) -end -function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) - 
args_vec = map(arg_names) do name - arr = get(args, name, nothing) - if !allow_missing - @assert(!isa(arr, Void), "Must specify all arguments in $arg_key ($name is missing)") - end - arr - end - # help the type inference - if allow_missing - args_vec = Union{NDArray,Void}[args_vec...] - else - args_vec = NDArray[args_vec...] - end - args_hdr = MX_handle[(isa(x,Void) ? MX_handle(0) : x) for x in args_vec] - return (args_hdr, args_vec) -end - -#=doc -.. function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) - - Create an :class:`Executor` by binding a :class:`Node` to concrete :class:`NDArray`. - - :param Node sym: the network architecture describing the computation graph. - :param Context ctx: the context on which the computation should run. - :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete - arrays for all the inputs in the network architecture. The inputs typically include - network parameters (weights, bias, filters, etc.), data and labels. See :func:`list_arguments` - and :func:`infer_shape`. 
- :param args_grad: TODO - :param aux_states: - :param grad_req: -=# -@enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 -function bind(self :: Node, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; - args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), - aux_states :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), - grad_req :: Union{GRAD_REQ,Vector{GRAD_REQ},Dict{Base.Symbol,GRAD_REQ}} = GRAD_WRITE) - - arg_names = list_arguments(self) - - args_hdr, args = _get_ndarray_inputs("args", args, arg_names, false) - args_grad_hdr, args_grad = _get_ndarray_inputs("args_grad", args_grad, arg_names, true) - aux_args_hdr, aux_states = _get_ndarray_inputs("aux_states", aux_states, list_auxiliary_states(self), false) - - if isa(grad_req, GRAD_REQ) - reqs = MX_uint[grad_req for i=1:length(args)] - elseif isa(grad_req, Vector{GRAD_REQ}) - @assert(length(grad_req) == length(args)) - reqs = MX_uint[grad_req...] - elseif isa(grad_req, Dict{Base.Symbol, GRAD_REQ}) - reqs = MX_uint[get(grad_req, name, GRAD_NOP) for name in arg_names] - end - - ref_hdr = Ref{MX_handle}(0) - @mxcall(:MXExecutorBind, - (MX_handle, Cint, Cint, MX_uint, Ptr{MX_handle}, Ptr{MX_handle}, Ptr{MX_uint}, - MX_uint, Ptr{MX_handle}, Ref{MX_handle}), - self, ctx.device_type, ctx.device_id, length(args), args_hdr, - args_grad_hdr, reqs, length(aux_states), aux_args_hdr, ref_hdr) - args_grad = convert(Vector{Union{Void,NDArray}}, args_grad) - executor = Executor(MX_ExecutorHandle(ref_hdr[]), self, - args, args_grad, aux_states) -end -function bind(self :: Node; kwargs...) - kwargs = Dict(kwargs) - @assert(haskey(kwargs, :args), "Must specify args") - args = pop!(kwargs, :args) - if haskey(kwargs, :context) - context = pop!(kwargs, :context) - else - context = cpu() - end - bind(self, context, args; kwargs...) -end - -function simple_bind(self :: Node, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) 
- arg_shapes, out_shapes, aux_shapes = infer_shape(self; kwargs...) - @assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") - - arg_arrays = NDArray[zeros(shape, ctx) for shape in arg_shapes] - arg_names = list_arguments(self) - if grad_req == GRAD_NOP - grad_arrays = Dict{Base.Symbol,NDArray}() - else - provided_data_names = [x[1] for x in kwargs] - grad_arrays = Dict{Base.Symbol,NDArray}() - for (name, shape) in zip(arg_names, arg_shapes) - # if not in provided data, should be parameters - if !in(name, provided_data_names) - grad_arrays[name] = zeros(shape, ctx) - end - end - end - - aux_arrays = [zeros(shape, ctx) for shape in aux_shapes] - return bind(self, ctx, arg_arrays, args_grad=grad_arrays, grad_req=grad_req, aux_states=aux_arrays) -end - - -function forward(self :: Executor; is_train::Bool=false, kwargs...) - for (k,v) in kwargs - @assert(k ∈ self.arg_dict, "Unknown argument $k") - @assert(isa(v, NDArray), "Keyword argument $k must be an NDArray") - copy!(self.arg_dict[k], v) - end - - @mxcall(:MXExecutorForward, (MX_handle, Cint), self, is_train) -end - -function backward(self :: Executor) - backward(self, NDArray[]) -end -function backward(self :: Executor, out_grad :: NDArray) - backward(self, [out_grad]) -end -function backward(self :: Executor, out_grads :: Vector{NDArray}) - out_grads = MX_handle[out_grads...] 
- @mxcall(:MXExecutorBackward, (MX_handle, MX_uint, Ptr{MX_handle}), self, length(out_grads), out_grads) -end - - -function copy_params_from(self::Executor, arg_params::Dict{Base.Symbol,NDArray}, - aux_params::Union{Void,Dict{Base.Symbol,NDArray}}=nothing; - allow_extra_params::Bool=false) - for (name, array) in arg_params - if haskey(self.arg_dict, name) - copy!(self.arg_dict[name], array) - else - @assert(allow_extra_params, "Extra params $name not in the arguments") - end - end - - if !isa(aux_params, Void) - for (name, array) in aux_params - if haskey(self.aux_dict, name) - copy!(self.aux_dict[name], array) - else - @assert(allow_extra_params, "Extra auxiliary state $name not recognized") - end - end - end -end diff --git a/src/initializer.jl-e b/src/initializer.jl-e deleted file mode 100644 index 8f78bfba9367..000000000000 --- a/src/initializer.jl-e +++ /dev/null @@ -1,117 +0,0 @@ -#=doc -Initializers -============ -Interface ---------- -=# - -#=doc -.. class:: AbstractInitializer - - The abstract base class for all initializers. - -To define a new initializer, it is -enough to derive a new type, and implement one or more of the following methods: - -.. function:: _init_weight(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. function:: _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. function:: _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. function:: _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - -Or, if full behavior customization is needed, override the following function - -.. 
function:: call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -=# -abstract AbstractInitializer - -function call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - strname = string(name) - if endswith(strname, "bias") - _init_bias(self, name, array) - elseif endswith(strname, "gamma") - _init_gamma(self, name, array) - elseif endswith(strname, "beta") - _init_beta(self, name, array) - elseif endswith(strname, "weight") - _init_weight(self, name, array) - elseif endswith(strname, "moving_mean") - _init_zero(self, name, array) - elseif endswith(strname, "moving_var") - _init_zero(self, name, array) - else - _init_default(self, name, array) - end -end - -function _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - array[:] = 0 -end -function _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - array[:] = 1 -end -function _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - array[:] = 0 -end -function _init_zero(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - array[:] = 0 -end - -#=doc -Built-in initializers ---------------------- -=# -#=doc -.. class:: UniformInitializer - - Initialize weights according to a uniform distribution within the provided scale. -=# -immutable UniformInitializer <: AbstractInitializer - scale :: AbstractFloat -end -#=doc -.. function UniformInitializer(scale=0.07) - - Construct a :class:`UniformInitializer` with the specified scale. -=# -UniformInitializer() = UniformInitializer(0.07) - -function _init_weight(self :: UniformInitializer, name :: Base.Symbol, array :: NDArray) - rand!(-self.scale, self.scale, array) -end - -#=doc -.. class:: NormalInitializer - - Initialize weights according to a univariate Gaussian distribution. -=# -immutable NormalInitializer <: AbstractInitializer - μ :: AbstractFloat - σ :: AbstractFloat -end -#=doc -.. 
function:: NormalIninitializer(; mu=0, sigma=0.01) - - Construct a :class:`NormalInitializer` with mean ``mu`` and variance ``sigma``. -=# -NormalInitializer(; mu=0, sigma=0.01) = NormalInitializer(mu, sigma) - -function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) - randn!(self.μ, self.σ, array) -end - -#=doc -.. class:: XaiverInitializer - - The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding - the difficulty of training deep feedforward neuralnetworks*. -=# -immutable XaiverInitializer <: AbstractInitializer -end - -function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) - dims = size(array) - fan_in = prod(dims[2:end]) - fan_out = dims[1] - scale = sqrt(3 / (fan_in + fan_out)) - rand!(-scale, scale, array) -end diff --git a/src/io.jl-e b/src/io.jl-e deleted file mode 100644 index 5c59e96bb611..000000000000 --- a/src/io.jl-e +++ /dev/null @@ -1,641 +0,0 @@ -#=doc -Data Providers -============== -Interface ---------- - -Data providers are wrappers that load external data, be it images, text, or general tensors, -and split it into mini-batches so that the model can consume the data in a uniformed way. -=# - -#=doc -.. class:: AbstractDataProvider - - The root type for all data provider. A data provider should implement the following interfaces: - - .. function:: get_batch_size(provider) -> Int - - :param AbstractDataProvider provider: the data provider. - :return: the mini-batch size of the provided data. All the provided data should have the - same mini-batch size (i.e. the last dimension). - - .. function:: provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} - - :param AbstractDataProvider provider: the data provider. - :return: a vector of (name, shape) pairs describing the names of the data it provides, and - the corresponding shapes. - - .. 
function:: provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} - - :param AbstractDataProvider provider: the data provider. - :return: a vector of (name, shape) pairs describing the names of the labels it provides, and - the corresponding shapes. - - The difference between *data* and *label* is that during - training stage, both *data* and *label* will be feeded into the model, while during - prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and - of any shapes. The provided data and label names here should match the input names in a target - :class:`Node`. - - A data provider should also implement the Julia iteration interface, in order to allow iterating - through the data set. The provider will be called in the following way: - - .. code-block:: julia - - for batch in eachbatch(provider) - data = get_data(provider, batch) - end - - which will be translated by Julia compiler into - - .. code-block:: julia - - state = Base.start(eachbatch(provider)) - while !Base.done(provider, state) - (batch, state) = Base.next(provider, state) - data = get_data(provider, batch) - end - - By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface - is implemented on the provider type itself. But the extra layer of abstraction allows us to - implement a data provider easily via a Julia ``Task`` coroutine. - The detailed interface function is listed below: - - .. function:: Base.eltype(provider) -> AbstractDataBatch - - :param AbstractDataProvider provider: the data provider. - :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. - - .. function:: Base.start(provider) -> AbstractDataProviderState - - :param AbstractDataProvider provider: the data provider. - - This function is always called before iterating into the dataset. It should initialize - the iterator, reset the index, and do data shuffling if needed. - - .. 
function:: Base.done(provider, state) -> Bool - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataProviderState state: the state returned by :func:`Base.start` :func:`Base.next`. - :return: true if there is no more data to iterate in this dataset. - - .. function:: Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) - - :param AbstractDataProvider provider: the data provider. - :return: the current data batch, and the state for the next iteration. - - Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that - is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this - case, you can safely assume that - - * :func:`Base.start` will always be called, and called only once before the iteration starts. - * :func:`Base.done` will always be called at the beginning of every iteration and always be called once. - * If :func:`Base.done` return true, the iteration will stop, until the next round, again, starting with - a call to :func:`Base.start`. - * :func:`Base.next` will always be called only once in each iteration. It will always be called after - one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will - not be called. - - With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation - of the built-in :class:`MXDataProvider` for example. - - .. caution:: - - Please do not use the one data provider simultaneously in two different places, either in parallel, - or in a nested loop. For example, the behavior for the following code is undefined - - .. code-block:: julia - - for batch in data - # updating the parameters - - # now let's test the performance on the training set - for b2 in data - # ... - end - end -=# -abstract AbstractDataProvider - -#=doc -.. class:: AbstractDataProviderState - - Base type for data provider states. 
-=# -abstract AbstractDataProviderState - -#=doc -.. class:: AbstractDataBatch - - Base type for a data mini-batch. It should implement the following interfaces: - - .. function:: count_samples(provider, batch) -> Int - - :param AbstractDataBatch batch: the data batch object. - :return: the number of samples in this batch. This number should be greater than 0, but - less than or equal to the batch size. This is used to indicate at the end of - the data set, there might not be enough samples for a whole mini-batch. - - .. function:: get_data(provider, batch) -> Vector{NDArray} - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :return: a vector of data in this batch, should be in the same order as declared in - :func:`provide_data() `. - - The last dimension of each :class:`NDArray` should always match the batch_size, even when - :func:`count_samples` returns a value less than the batch size. In this case, - the data provider is free to pad the remaining contents with any value. - - .. function:: get_label(provider, batch) -> Vector{NDArray} - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :return: a vector of labels in this batch. Similar to :func:`get_data`. - - - The following utility functions will be automatically defined. - - .. function:: get(provider, batch, name) -> NDArray - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :param Base.Symbol name: the name of the data to get, should be one of the names - provided in either :func:`provide_data() ` - or :func:`provide_label() `. - :return: the corresponding data array corresponding to that name. - - .. function:: load_data!(provider, batch, targets) - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. 
- :param targets: the targets to load data into. - :type targets: Vector{Vector{SlicedNDArray}} - - The targets is a list of the same length as number of data provided by this provider. - Each element in the list is a list of :class:`SlicedNDArray`. This list described a - spliting scheme of this data batch into different slices, each slice is specified by - a slice-ndarray pair, where *slice* specify the range of samples in the mini-batch - that should be loaded into the corresponding *ndarray*. - - This utility function is used in data parallelization, where a mini-batch is splited - and computed on several different devices. - - .. function:: load_label!(provider, batch, targets) - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :param targets: the targets to load label into. - :type targets: Vector{Vector{SlicedNDArray}} - - The same as :func:`load_data!`, except that this is for loading labels. -=# -abstract AbstractDataBatch - -#=doc -.. class:: DataBatch - - A basic subclass of :class:`AbstractDataBatch`, that implement the interface by - accessing member fields. -=# -type DataBatch <: AbstractDataBatch - data :: Vector{NDArray} - label :: Vector{NDArray} - count :: Int -end -count_samples(batch :: DataBatch) = batch.count -get_data(batch :: DataBatch) = batch.data -get_label(batch :: DataBatch) = batch.label - -#=doc -.. class:: SlicedNDArray - - A alias type of ``Tuple{UnitRange{Int},NDArray}``. 
-=# -typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} - -function _load_general!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, - targets :: Vector{Vector{SlicedNDArray}}, loader::Function) - data = loader(provider, batch) - for (d_src, d_targets) in zip(data, targets) - for (slice_idx, d_dst) in d_targets - copy!(d_dst, slice(d_src, slice_idx)) - end - end -end -function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, - targets :: Vector{Vector{SlicedNDArray}}) - _load_general!(provider, batch, targets, get_data) -end -function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, - targets :: Vector{Vector{SlicedNDArray}}) - _load_general!(provider, batch, targets, get_label) -end - -function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{NDArray}) - for (src, dst) in zip(get_data(provider, batch), targets) - copy!(dst, src) - end -end -function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{NDArray}) - for (src, dst) in zip(get_label(provider, batch), targets) - copy!(dst, src) - end -end - -import Base.get -function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name :: Base.Symbol) - for (idx, (k, s)) in enumerate(provide_data(provider)) - if name == k - return get_data(provider, batch)[idx] - end - end - for (idx, (k, s)) in enumerate(provide_label(provider)) - if name == k - return get_label(provider, batch)[idx] - end - end - error("$name is not provided by this data provider") -end - -eachbatch(provider :: AbstractDataProvider) = provider - -#=doc -Built-in data providers ------------------------ -=# - -################################################################################ -#=doc -.. class:: ArrayDataProvider - - A convenient tool to iterate :class:`NDArray` or Julia ``Array``. 
-=# -type ArrayDataProvider <: AbstractDataProvider - data_arrays :: Vector{Array{MX_float}} - data_names :: Vector{Base.Symbol} - label_arrays :: Vector{Array{MX_float}} - label_names :: Vector{Base.Symbol} - batch_size :: Int - sample_count :: Int - shuffle :: Bool - data_padding :: MX_float - label_padding :: MX_float - - data_batch :: Vector{NDArray} - label_batch :: Vector{NDArray} -end - -#=doc -.. function:: ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) - - Construct a data provider from :class:`NDArray` or Julia Arrays. - - :param data: the data, could be - - - a :class:`NDArray`, or a Julia Array. This is equivalent to ``:data => data``. - - a name-data pair, like ``:mydata => array``, where ``:mydata`` is the name of the data - and ``array`` is an :class:`NDArray` or a Julia Array. - - a list of name-data pairs. - - :param label: the same as the ``data`` parameter. When this argument is omitted, the constructed - provider will provide no labels. - :param Int batch_size: the batch size, default is 0, which means treating the whole array as a - single mini-batch. - :param Bool shuffle: turn on if the data should be shuffled at every epoch. - :param Real data_padding: when the mini-batch goes beyond the dataset boundary, there might - be less samples to include than a mini-batch. This value specify a scalar to pad the - contents of all the missing data points. - :param Real label_padding: the same as ``data_padding``, except for the labels. -=# -# Julia's type system is sometimes very frustrating. You cannot specify a function -# with argument Vector{Pair} to expect to be matched when calling with the parameter -# [:foo => zeros(2,3), :bar => zeros(3)] because the type inference gives very specific -# results, about the parametric type in the Pair{T1,T2} type, thus does not match the -# generic Pair type. In general, Int <: Number but Vector{Int} <: Vector{Number} is not -# true. So let us just use Any here... 
-function ArrayDataProvider(data::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) - ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle, data_padding=data_padding, label_padding=label_padding) -end -function ArrayDataProvider(data::Any, label::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) - asarr{T}(arr :: Array{T}) = convert(Array{MX_float}, arr) - asarr(arr :: NDArray) = copy(arr) - - if isa(data, Union{NDArray, Array}) && eltype(data) <: Real - data_names = [:data] - data_arrays = Array{MX_float}[asarr(data)] - elseif isa(data, Pair) - @assert isa(data.first, Base.Symbol) && isa(data.second, Union{NDArray, Array}) - data_names = [data.first] - data_arrays = Array{MX_float}[asarr(data.second)] - elseif isa(data, Vector) || isa(data, Tuple) - map(data) do d - @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) - end - data_names = Base.Symbol[d.first for d in data] - data_arrays = Array{MX_float}[asarr(d.second) for d in data] - else - error("Invalid data argument type") - end - - if isa(label, Union{NDArray, Array}) && eltype(label) <: Real - label_names = [:softmax_label] - label_arrays = Array{MX_float}[asarr(label)] - elseif isa(label, Pair) - @assert isa(label.first, Base.Symbol) && isa(label.second, Union{NDArray, Array}) - label_names = [label.first] - label_arrays = Array{MX_float}[asarr(label.second)] - elseif isa(label, Vector) || isa(label, Tuple) - map(label) do d - @assert isa(d, Pair) && isa(d.first, Base.Symbol) && isa(d.second, Union{NDArray, Array}) - end - label_names = Base.Symbol[d.first for d in label] - label_arrays = Array{MX_float}[asarr(d.second) for d in label] - else - error("Invalid label argument type") - end - - @assert length(data_arrays) > 0 - sample_count = size(data_arrays[1])[end] - for i = 1:length(data_names) - @assert(size(data_arrays[i])[end] == sample_count, - "Number of samples in 
$(data_names[i]) is mismatch with $(data_names[1])") - end - for i = 1:length(label_names) - @assert(size(label_arrays[i])[end] == sample_count, - "Number of samples in $(label_names[i]) is mismatch with $(data_names[1])") - end - - if batch_size == 0 - batch_size = sample_count - end - @assert 0 < batch_size <= sample_count - - function gen_batch_nds(arrs :: Vector{Array{MX_float}}, bsize :: Int) - map(arrs) do arr - shape = size(arr) - empty(shape[1:end-1]..., bsize) - end - end - - data_batch = gen_batch_nds(data_arrays, batch_size) - label_batch = gen_batch_nds(label_arrays, batch_size) - - # reshape data and labels into 2D tensors, so that it is easier to work with them - data_arrays = map(data_arrays) do arr - reshape(arr, prod(size(arr)[1:end-1]), size(arr)[end]) - end - label_arrays = map(label_arrays) do arr - reshape(arr, prod(size(arr)[1:end-1]), size(arr)[end]) - end - - ArrayDataProvider(data_arrays, data_names, label_arrays, label_names, batch_size, - sample_count, shuffle, data_padding, label_padding, data_batch, label_batch) -end - -function provide_data(provider::ArrayDataProvider) - return collect(zip(provider.data_names, map(size, provider.data_batch))) -end -function provide_label(provider::ArrayDataProvider) - return collect(zip(provider.label_names, map(size, provider.label_batch))) -end -get_batch_size(provider::ArrayDataProvider) = provider.batch_size - -immutable ArrayDataProviderState <: AbstractDataProviderState - curr_idx :: Int -end - -function Base.eltype(provider :: ArrayDataProvider) - ArrayDataProviderState -end - -function Base.start(provider :: ArrayDataProvider) - if provider.shuffle - # re-shuffle all data - idx_perm = randperm(provider.sample_count) - provider.data_arrays = map(x->x[:,idx_perm], provider.data_arrays) - provider.label_arrays = map(x->x[:,idx_perm], provider.label_arrays) - end - - return ArrayDataProviderState(1) -end - -function Base.done(provider::ArrayDataProvider, state :: ArrayDataProviderState) - return 
state.curr_idx > provider.sample_count -end - -immutable ArrayDataBatch <: AbstractDataBatch - idx :: UnitRange{Int} -end -function Base.next(provider :: ArrayDataProvider, state :: ArrayDataProviderState) - idx = state.curr_idx:min(state.curr_idx+provider.batch_size-1, provider.sample_count) - return (ArrayDataBatch(idx), ArrayDataProviderState(idx.stop+1)) -end - -function count_samples(provider :: ArrayDataProvider, batch :: ArrayDataBatch) - return length(batch.idx) -end - -function get_data(provider :: ArrayDataProvider, batch :: ArrayDataBatch) - for (src, dst) in zip(provider.data_arrays, provider.data_batch) - copy_ignore_shape!(dst[1:length(batch.idx)], src[:, batch.idx]) - if length(batch.idx) < provider.batch_size - dst[length(batch.idx)+1:provider.batch_size] = provider.data_padding - end - end - return provider.data_batch -end -function get_label(provider :: ArrayDataProvider, batch :: ArrayDataBatch) - for (src, dst) in zip(provider.label_arrays, provider.label_batch) - copy_ignore_shape!(dst[1:length(batch.idx)], src[:, batch.idx]) - if length(batch.idx) < provider.batch_size - dst[length(batch.idx)+1:provider.batch_size] = provider.label_padding - end - end - return provider.label_batch -end - - -#=doc -libmxnet data providers ------------------------ -=# - -################################################################################ -#=doc -.. class:: MXDataProvider - - A data provider that wrap built-in data iterators from libmxnet. See below for - a list of built-in data iterators. 
-=# -type MXDataProvider <: AbstractDataProvider - handle :: MX_DataIterHandle - data_shape :: Vector{Tuple{Base.Symbol, Tuple}} - label_shape:: Vector{Tuple{Base.Symbol, Tuple}} - batch_size :: Int - - # those two a auxiliary variables to help avoid calling reset - # but still pre-fetch first batch to get shape information - first_epoch:: Bool - first_batch:: Bool -end - -function _reset_data_iter(handle :: MX_DataIterHandle) - @mxcall(:MXDataIterBeforeFirst, (MX_handle,), handle) -end -function _iter_next(handle :: MX_DataIterHandle) - ref_ret = Ref{Cint}(0) - @mxcall(:MXDataIterNext, (MX_handle, Ref{Cint}), handle, ref_ret) - return Bool(ref_ret[]) -end -function _get_data(handle :: MX_DataIterHandle) - ref_hdr = Ref{MX_handle}(0) - @mxcall(:MXDataIterGetData, (MX_handle, Ref{MX_handle}), handle, ref_hdr) - return NDArray(MX_NDArrayHandle(ref_hdr[]), false) -end -function _get_label(handle :: MX_DataIterHandle) - ref_hdr = Ref{MX_handle}(0) - @mxcall(:MXDataIterGetLabel, (MX_handle, Ref{MX_handle}), handle, ref_hdr) - return NDArray(MX_NDArrayHandle(ref_hdr[]), false) -end - -function MXDataProvider(handle :: MX_DataIterHandle; - data_name :: Base.Symbol=:data, - label_name :: Union{Base.Symbol,Void}=:softmax_label, - kwargs...) 
# for convenience, we ignore the rest keyword arguments - # init iterator, load the first batch and get shapes - @assert(_iter_next(handle), "Failed to load the first batch in MXDataProvider") - data_shape = Tuple{Base.Symbol, Tuple}[(data_name, size(_get_data(handle)))] - if !isa(label_name, Void) - label_shape = Tuple{Base.Symbol, Tuple}[(label_name::Base.Symbol, size(_get_label(handle)))] - else - label_shape = Tuple{Base.Symbol, Tuple}[] - end - - MXDataProvider(handle, data_shape, label_shape, data_shape[1][2][end], true, true) -end - -provide_data(provider::MXDataProvider) = provider.data_shape -provide_label(provider::MXDataProvider) = provider.label_shape -get_batch_size(provider::MXDataProvider) = provider.batch_size - -type MXDataProviderState <: AbstractDataProviderState - has_next :: Bool -end -immutable MXDataBatch <: AbstractDataBatch -end - -function Base.eltype(provider :: MXDataProvider) - MXDataBatch -end -function Base.start(provider :: MXDataProvider) - if !provider.first_epoch - _reset_data_iter(provider.handle) - else - provider.first_epoch = false - end - - return MXDataProviderState(true) -end -function Base.done(provider :: MXDataProvider, state :: MXDataProviderState) - if provider.first_batch - state.has_next = true - provider.first_batch = false - else - state.has_next = _iter_next(provider.handle) - end - return !state.has_next -end -function Base.next(provider :: MXDataProvider, state :: MXDataProviderState) - return (MXDataBatch(), state) -end - -function get_data(provider :: MXDataProvider, batch :: MXDataBatch) - return NDArray[_get_data(provider.handle)] -end -function get_label(provider :: MXDataProvider, batch :: MXDataBatch) - return NDArray[_get_label(provider.handle)] -end -function count_samples(provider :: MXDataProvider, batch :: MXDataBatch) - ref_pad = Ref{Cint}(0) - @mxcall(:MXDataIterGetPadNum, (MX_handle, Ref{Cint}), provider.handle, ref_pad) - return provider.batch_size - Int(ref_pad[]) -end - -#=doc 
-**autogen:EMBED:io:EMBED:autogen** -=# -function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) - ref_name = Ref{char_p}(0) - ref_desc = Ref{char_p}(0) - ref_narg = Ref{MX_uint}(0) - ref_arg_names = Ref{char_pp}(0) - ref_arg_types = Ref{char_pp}(0) - ref_arg_descs = Ref{char_pp}(0) - - @mxcall(:MXDataIterGetIterInfo, - (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), - hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) - - iter_name = symbol(bytestring(ref_name[])) - - if gen_docs - if endswith(string(iter_name), "Iter") - f_desc = "Can also be called with the alias ``$(string(iter_name)[1:end-4] * "Provider")``.\n" - else - f_desc = "" - end - f_desc *= bytestring(ref_desc[]) * "\n\n" - f_desc *= ":param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data.\n" - f_desc *= ":param Base.Symbol label_name: keyword argument, default ``:softmax_label``. " * - "The name of the label. Could be ``nothing`` if no label is presented in this dataset.\n\n" - f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":return: the constructed :class:`MXDataProvider`." - return (iter_name, f_desc) - end - - defun = quote - function $iter_name(; kwargs...) - arg_keys = AbstractString[string(k) for (k,v) in kwargs] - arg_vals = AbstractString[dump_mx_param(v) for (k,v) in kwargs] - ref_hdr = Ref{MX_handle}(0) - - @mxcall(:MXDataIterCreateIter, (MX_handle, MX_uint, char_pp, char_pp, Ref{MX_handle}), - $hdr, length(arg_keys), arg_keys, arg_vals, ref_hdr) - - return MXDataProvider(MX_DataIterHandle(ref_hdr[]); kwargs...) 
- end - end - eval(defun) - - # add an alias XXXProvider => XXXIter - if endswith(string(iter_name), "Iter") - alias_name = symbol(string(iter_name)[1:end-4] * "Provider") - eval(:($alias_name = $iter_name)) - end -end - -function _import_io_iterators(;gen_docs::Bool=false) - n_ref = Ref{MX_uint}(0) - h_ref = Ref{Ptr{MX_handle}}(0) - @mxcall(:MXListDataIters, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) - - n_creators = n_ref[] - h_creators = pointer_to_array(h_ref[], n_creators) - - if gen_docs - docs = Dict{Base.Symbol, AbstractString}() - end - - for i = 1:n_creators - creator_hdr = h_creators[i] - ret = _define_data_iter_creator(creator_hdr; gen_docs=gen_docs) - if gen_docs - docs[ret[1]] = ret[2] - end - end - - if gen_docs - return docs - end -end diff --git a/src/kvstore.jl-e b/src/kvstore.jl-e deleted file mode 100644 index d52433f567b2..000000000000 --- a/src/kvstore.jl-e +++ /dev/null @@ -1,132 +0,0 @@ -type KVStore - handle :: MX_KVStoreHandle - updater_c :: Ptr{Void} - updater :: Function - - KVStore(hdr :: MX_KVStoreHandle) = new(hdr, Ptr{Void}(0)) -end - -function KVStore(kv_type::Base.Symbol = :local) - #@assert(kv_type ∈ [:local]) # TODO: update with allowed types - - ref_hdr = Ref{MX_handle}(0) - kv_type = string(kv_type) - @mxcall(:MXKVStoreCreate, (char_p, Ref{MX_handle}), kv_type, ref_hdr) - return KVStore(MX_KVStoreHandle(ref_hdr[])) -end -function Base.unsafe_convert(::Type{MX_handle}, obj::KVStore) - Base.unsafe_convert(MX_handle, obj.handle) -end -Base.convert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) -Base.cconvert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) - -function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) - @assert length(keys) == length(vals) - keys_flt = Int[] - vals_flt = NDArray[] - for (k,v) in zip(keys, vals) - append!(keys_flt, Base.ones(Int, length(v))*k) - append!(vals_flt, v) - end - return (keys_flt, vals_flt) -end - -function init!(self :: KVStore, 
key :: Int, val :: NDArray) - init!(self, [key], [val]) -end -function init!(self :: KVStore, key :: Int, vals :: Vector{NDArray}) - init!(self, Base.ones(Int, length(vals))*key, vals) -end -function init!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) - init!(self, _flatten_kvlist(keys, vals)...) -end -function init!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{NDArray}) - @assert length(keys) == length(vals) - keys = Cint[keys...] - vals = MX_handle[vals...] - @mxcall(:MXKVStoreInit, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}), - self, length(keys), keys, vals) -end - -import Base.push! -function push!(self :: KVStore, key :: Int, val :: NDArray; priority :: Int = 0) - push!(self, [key], [val]; priority = priority) -end -function push!(self :: KVStore, key :: Int, vals :: Vector{NDArray}; priority :: Int = 0) - push!(self, Base.ones(Int, length(vals))*key, vals; priority = priority) -end -function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}; priority::Int=0) - push!(self, _flatten_kvlist(keys, vals)...; priority = priority) -end -function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{NDArray}; priority::Int=0) - @assert length(keys) == length(vals) - keys = Cint[keys...] - vals = MX_handle[vals...] 
- @mxcall(:MXKVStorePush, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), - self, length(keys), keys, vals, priority) -end - -function pull!(self :: KVStore, key :: Int, out :: NDArray; priority :: Int = 0) - pull!(self, [key], [out]) -end -function pull!(self :: KVStore, key :: Int, outs :: Vector{NDArray}; priority :: Int = 0) - pull!(self, Base.ones(Int, length(outs))*key, outs; priority = priority) -end -function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{Vector{NDArray}}; priority::Int=0) - pull!(self, _flatten_kvlist(keys, outs)...; priority = priority) -end -function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{NDArray}; priority::Int=0) - @assert length(keys) == length(outs) - keys = Cint[keys...] - outs = MX_handle[outs...] - @mxcall(:MXKVStorePull, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), - self, length(keys), keys, outs, priority) -end - - -function get_type(self :: KVStore) - type_ref = Ref{char_p}(0) - @mxcall(:MXKVStoreGetType, (MX_handle, Ref{char_p}), self, type_ref) - return symbol(bytestring(type_ref[])) -end - -function get_num_workers(self :: KVStore) - ref_size = Ref{Cint}(0) - @mxcall(:MXKVStoreGetGroupSize, (MX_handle, Ref{Cint}), self, ref_size) - return Int(ref_size[]) -end - -function get_rank(self :: KVStore) - ref_rank = Ref{Cint}(0) - @mxcall(:MXKVStoreGetRank, (MX_handle, Ref{Cint}), self, ref_rank) - return Int(ref_rank[]) -end - - -# TODO: Currently Julia does not support closure in c-callbacks, so we are making use of the -# extra handle parameter of the API to pass the updater object around. Fix this when someday -# full closure cfunction is supported in Julia. 
-function _kvstore_update_wrapper(index::Cint, nd_recv::MX_handle, nd_local::MX_handle, updater::Ptr{Void}) - updater_func = unsafe_pointer_to_objref(updater) :: Function - updater_func(Int(index), NDArray(MX_NDArrayHandle(nd_recv)), NDArray(MX_NDArrayHandle(nd_local))) - return nothing -end -function set_updater(self :: KVStore, updater :: Function) - self.updater = updater # keep a reference to the julia object so that updater_c is kept valid - self.updater_c = cfunction(_kvstore_update_wrapper, Void, (Cint, MX_handle, MX_handle, Ptr{Void})) - - @mxcall(:MXKVStoreSetUpdater, (MX_handle, Ptr{Void}, Any), - self, self.updater_c, updater) -end - -function set_optimizer(self :: KVStore, optimizer :: AbstractOptimizer) - ref_is_worker = Ref{Cint}(0) - @mxcall(:MXKVStoreIsWorkerNode, (Ref{Cint},), ref_is_worker) - is_worker = ref_is_worker[] - - if ismatch(r"dist", string(get_type(self))) && is_worker - # TODO - else - set_updater(self, get_updater(optimizer)) - end -end diff --git a/src/metric.jl-e b/src/metric.jl-e deleted file mode 100644 index c88239ab8cc8..000000000000 --- a/src/metric.jl-e +++ /dev/null @@ -1,37 +0,0 @@ -abstract AbstractEvalMetric - -type Accuracy <: AbstractEvalMetric - acc_sum :: Float64 - n_sample :: Int - - Accuracy() = new(0.0, 0) -end - -function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) - label = copy(label) - pred = copy(pred) - - n_sample = size(pred)[end] - metric.n_sample += n_sample - for i = 1:n_sample - klass = indmax(pred[:,i]) - metric.acc_sum += (klass-1) == label[i] - end -end - -function update!(metric :: Accuracy, labels :: Vector{NDArray}, preds :: Vector{NDArray}) - @assert length(labels) == length(preds) - for i = 1:length(labels) - _update_single_output(metric, labels[i], preds[i]) - end -end - -import Base: get -function get(metric :: Accuracy) - return [(:accuracy, metric.acc_sum / metric.n_sample)] -end - -function reset!(metric :: Accuracy) - metric.acc_sum = 0.0 - metric.n_sample = 
0 -end diff --git a/src/model.jl-e b/src/model.jl-e deleted file mode 100644 index 93189124d9b0..000000000000 --- a/src/model.jl-e +++ /dev/null @@ -1,566 +0,0 @@ -#=doc -Models -====== - -The model API provides convenient high-level interface to do training and predicting on -a network described using the symbolic API. -=# - -#=doc -.. class:: AbstractModel - - The abstract super type of all models in MXNet.jl. -=# -abstract AbstractModel - -#=doc -.. class:: FeedForward - - The feedforward model provides convenient interface to train and predict on - feedforward architectures like multi-layer MLP, ConvNets, etc. There is no - explicitly handling of *time index*, but it is relatively easy to implement - unrolled RNN / LSTM under this framework (**TODO**: add example). For models - that handles sequential data explicitly, please use **TODO**... -=# -type FeedForward <: AbstractModel - arch :: Node - ctx :: Vector{Context} - - arg_params :: Dict{Base.Symbol, NDArray} - aux_params :: Dict{Base.Symbol, NDArray} - - pred_exec :: Union{Executor, Void} - - # leave the rest fields undefined - FeedForward(arch :: Node, ctx :: Vector{Context}) = new(arch, ctx) -end - -"""Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector - of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that - piece. -""" -function _split_inputs(batch_size :: Int, n_split :: Int) - @assert(batch_size >= n_split) - per_split = floor(Int, batch_size / n_split) - counts = Base.zeros(Int, n_split)+per_split - extra = batch_size - sum(counts) - counts[1:extra] += 1 - - cum = [0, cumsum(counts)...] - idx = [cum[i-1]+1:cum[i] for i = 2:length(cum)] - return idx -end - -#=doc -.. function:: FeedForward(arch :: Node, ctx) - - :param arch: the architecture of the network constructed using the symbolic API. - :param ctx: the devices on which this model should do computation. 
It could be a single :class:`Context` - or a list of :class:`Context` objects. In the latter case, data parallelization will be used - for training. If no context is provided, the default context ``cpu()`` will be used. -=# -function FeedForward(arch :: Node; context :: Union{Context, Vector{Context}, Void} = nothing) - if isa(context, Void) - context = [Context(CPU)] - elseif isa(context, Context) - context = [context] - end - FeedForward(arch, context) -end - -#=doc -.. function:: init_model(self, initializer; overwrite=false, input_shapes...) - - Initialize the weights in the model. - - This method will be called automatically when training a model. So there is usually no - need to call this method unless one needs to inspect a model with only randomly initialized - weights. - - :param FeedForward self: the model to be initialized. - :param AbstractInitializer initializer: an initializer describing how the weights should be initialized. - :param Bool overwrite: keyword argument, force initialization even when weights already exists. - :param input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. - For example, ``data=(28,28,1,100), label=(100,)``. -=# -function init_model(self :: FeedForward, initializer :: AbstractInitializer; overwrite::Bool=false, input_shapes...) - # all arg names, including data, label, and parameters - arg_names = list_arguments(self.arch) - - input_names = [x[1] for x in input_shapes] - - param_names = setdiff(arg_names, input_names) - aux_names = list_auxiliary_states(self.arch) - - arg_defined = true - aux_defined = true - - arg_shapes, out_shapes, aux_shapes = infer_shape(self.arch; input_shapes...) 
- if !isdefined(self, :arg_params) - param_name_shapes = filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) - self.arg_params = Dict([name => empty(shape) for (name,shape) in param_name_shapes]) - arg_defined = false - end - if !isdefined(self, :aux_params) - self.aux_params = Dict([name => empty(shape) for (name,shape) in zip(aux_names,aux_shapes)]) - aux_defined = false - end - - # initialize the contents of the parameters - if !arg_defined || overwrite - for (k,v) in self.arg_params - initializer(k, v) - end - end - if !aux_defined || overwrite - for (k,v) in self.aux_params - initializer(k, v) - end - end - - return (arg_names, param_names, aux_names) -end - -function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_shapes...) - if !isdefined(self, :pred_exec) || isa(self.pred_exec, Void) || overwrite - if !isdefined(self, :arg_params) || !isdefined(self, :aux_params) - @assert(false, "Model weights not defined, please init or train the model, or load from file") - end - - # the predictor use only the first device - self.pred_exec = simple_bind(self.arch, self.ctx[1]; grad_req=GRAD_NOP, data_shapes...) - copy_params_from(self.pred_exec, self.arg_params, self.aux_params) - else - # make sure the new setup is compatible with the existing one - for (d_name, d_shape) in data_shapes - @assert(d_shape == size(self.pred_exec.arg_dict[d_name]), - "Shape of $d_name mismatch with existing predictor, use overwrite=true overwrite existing predictor") - end - end -end - -#=doc -.. function:: - predict(self, data; overwrite=false, callback=nothing) - - Predict using an existing model. The model should be already initialized, or trained or loaded from - a checkpoint. There is an overloaded function that allows to pass the callback as the first argument, - so it is possible to do - - .. code-block:: julia - - predict(model, data) do batch_output - # consume or write batch_output to file - end - - :param FeedForward self: the model. 
- :param AbstractDataProvider data: the data to perform prediction on. - :param Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory - allocation of the :class:`Executor` depends on the mini-batch size of the test - data provider. If you call predict twice with data provider of the same batch-size, - then the executor can be re-used. Otherwise, if ``overwrite`` is false (default), - an error will be raised; if ``overwrite`` is set to true, a new :class:`Executor` - will be created to replace the old one. - - .. note:: - - Prediction is computationally much less costly than training, so the bottleneck sometimes becomes the IO - for copying mini-batches of data. Since there is no concern about convergence in prediction, it is better - to set the mini-batch size as large as possible (limited by your device memory) if prediction speed is a - concern. - - For the same reason, currently prediction will only use the first device even if multiple devices are - provided to construct the model. - - :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` -=# -function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = false) - predict(self, data; overwrite = overwrite, callback=callback) -end -function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=false, callback::Union{Function,Void}=nothing) - data_shapes = provide_data(data) - data_names = [x[1] for x in data_shapes] - _setup_predictor(self, overwrite; data_shapes...) 
- - batch_size = get_batch_size(data) - data_arrays = [self.pred_exec.arg_dict[name] for name in data_names] - output_list = [Array{MX_float}[] for i=1:length(self.pred_exec.outputs)] - for batch in eachbatch(data) - load_data!(data, batch, data_arrays) - forward(self.pred_exec, is_train=false) - if isa(callback, Void) - # no callback, accumulate the data and return at the end - for (o_list, o_nd) in zip(output_list, self.pred_exec.outputs) - push!(o_list, copy(slice(o_nd, 1:count_samples(data, batch)))) - end - else - outputs = self.pred_exec.outputs - if length(outputs) == 1 - outputs = outputs[1] - end - callback(outputs) - end - end - - if !isa(callback, Void) - # callback exists, do not accumulate data - return nothing - end - - if isempty(output_list) - # maybe model does not have outputs - return nothing - end - if isempty(output_list[1]) - # maybe no output because data is empty - return length(output_list) == 1 ? output_list[1] : output_list - end - - # concatenate along mini-batches - output_arrays = [cat(ndims(x[1]), x...) for x in output_list] - if length(output_arrays) == 1 - # only 1 output, return it directly, instead of a list - output_arrays = output_arrays[1] - end - return output_arrays -end - -function _init_model(self :: FeedForward, data :: AbstractDataProvider, initializer :: AbstractInitializer, overwrite :: Bool) - init_model(self, initializer; overwrite=overwrite, [provide_data(data)..., provide_label(data)...]...) 
-end - -function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) - if num_device == 1 && !ismatch(r"dist", string(kv_type)) - kv = nothing - else - if kv_type == :local - max_size = maximum([prod(size(param)) for (k,param) in arg_params]) - if max_size < 1024 * 1024 * 16 - kv_type = :local_update_cpu - else - kv_type = :local_allreduce_cpu - end - info("Auto-select kvstore type = $kv_type") - end - kv = KVStore(kv_type) - end - - update_on_kvstore = true - if isa(kv, Void) || ismatch(r"local_allreduce", string(get_type(kv))) - update_on_kvstore = false - end - - return (kv, update_on_kvstore) -end - -@defstruct TrainingOptions Any ( - initializer :: AbstractInitializer = UniformInitializer(0.01), - n_epoch :: Int = 10, - eval_data :: Union{Void, AbstractDataProvider} = nothing, - eval_metric :: AbstractEvalMetric = Accuracy(), - kvstore :: Union{Base.Symbol, KVStore} = :local, - force_init :: Bool = false, - callbacks :: Vector{AbstractCallback} = AbstractCallback[], -) - -function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, - state::OptimizationState, type_filter::Type) - map(callbacks) do cb - if isa(cb, type_filter) - if type_filter == AbstractEpochCallback - # epoch callback have extra access to the model object - cb(self, state) - else - cb(state) - end - end - end -end - -#=doc -.. function:: train(model :: FeedForward, ...) - - Alias to :func:`fit`. -=# -function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) - fit(self, optimizer, data; kwargs...) -end - -#=doc -.. function:: fit(model :: FeedForward, optimizer, data; kwargs...) - - Train the ``model`` on ``data`` with the ``optimizer``. - - :param FeedForward model: the model to be trained. - :param AbstractOptimizer optimizer: the optimization algorithm to use. - :param AbstractDataProvider data: the training data provider. 
- :param Int n_epoch: default 10, the number of full data-passes to run. - :param AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for - the validation set. - :param AbstractEvalMetric eval_metric: keyword argument, default ``Accuracy()``. The metric used - to evaluate the training performance. If ``eval_data`` is provided, the same metric is also - calculated on the validation set. - :param kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients - and parameters when multiple devices are used for training. - :type kvstore: :class:`KVStore` or ``Base.Symbol`` - :param AbstractInitializer initializer: keyword argument, default ``UniformInitializer(0.01)``. - :param Bool force_init: keyword argument, default false. By default, the random initialization using the - provided ``initializer`` will be skipped if the model weights already exists, maybe from a previous - call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When - this option is set, it will always do random initialization at the begining of training. - :param callbacks: keyword argument, default ``[]``. Callbacks to be invoked at each epoch or mini-batch, - see :class:`AbstractCallback`. - :type callbacks: ``Vector{AbstractCallback}`` -=# -function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) - opts = TrainingOptions(; kwargs...) 
- - info("Start training on $(self.ctx)") - - batch_size = get_batch_size(data) - num_dev = length(self.ctx) - slices = _split_inputs(batch_size, num_dev) - - # initialize parameters - info("Initializing parameters...") - arg_names, param_names, aux_names = _init_model(self, data, opts.initializer, opts.force_init) - - # setup kvstore - kvstore = opts.kvstore - if isa(kvstore, Base.Symbol) - info("Creating KVStore...") - kvstore, update_on_kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params) - end - - train_execs = Array(Executor, num_dev) - for i = 1:num_dev - data_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)] - label_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)] - train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=GRAD_WRITE, data_shapes..., label_shapes...) - - copy_params_from(train_execs[i], self.arg_params, self.aux_params) - end - - # set up input data structures - data_names = [x[1] for x in provide_data(data)] - label_names = [x[1] for x in provide_label(data)] - - data_arrays = [SlicedNDArray[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] - for name in data_names] - label_arrays = [SlicedNDArray[(slices[i], exec.arg_dict[name]) for (i,exec) in enumerate(train_execs)] - for name in label_names] - - param_idx = filter(i -> in(arg_names[i], param_names), 1:length(arg_names)) - - param_arrays = [NDArray[exec.arg_arrays[i] for exec in train_execs] for i in param_idx] - grad_arrays = [NDArray[exec.grad_arrays[i] for exec in train_execs] for i in param_idx] - aux_arrays = [NDArray[exec.aux_arrays[i] for exec in train_execs] for i = 1:length(aux_names)] - - op_state = OptimizationState(batch_size) - optimizer.state = op_state - - if !update_on_kvstore - updater = get_updater(optimizer) - end - - if !isa(kvstore, Void) - if update_on_kvstore - set_optimizer(kvstore, optimizer) - end - - info("Initializing KVStore...") - # init kv 
with gradients - for idx = 1:length(param_arrays) - param_on_devs = param_arrays[idx] - - init!(kvstore, idx, self.arg_params[param_names[idx]]) - - if update_on_kvstore - # pull weights back - pull!(kvstore, idx, param_on_devs, priority=-idx) - end - end - end - - # set up output and labels in CPU for evaluation metric - output_shapes = [tuple(size(x)[1:end-1]...,batch_size) for x in train_execs[1].outputs] - cpu_dev = Context(CPU) - cpu_output_arrays = [empty(shape, cpu_dev) for shape in output_shapes] - cpu_label_arrays = [empty(shape, cpu_dev) for (name,shape) in provide_label(data)] - - # invoke callbacks on epoch 0 - _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) - - # now start training... - for i_epoch = 1:opts.n_epoch - time_start = time() - reset!(opts.eval_metric) - - op_state.curr_epoch = i_epoch - op_state.curr_batch = 0 - - # invoke callbacks on iteration 0 - _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) - - for batch in eachbatch(data) - load_data!(data, batch, data_arrays) - load_label!(data, batch, label_arrays) - - # forward and backward - for (texec, islice) in zip(train_execs, slices) - forward(texec, is_train=true) - - # copy outputs into cpu ndarray, for evaluation metric - for (cpu_out, dev_out) in zip(cpu_output_arrays, texec.outputs) - copy!(slice(cpu_out, islice), dev_out) - end - - backward(texec) - end - - op_state.curr_iter += 1 - op_state.curr_batch += 1 - optimizer.state = op_state - - # update parameters - for idx = 1:length(param_names) - # gradient synchronization - if !isa(kvstore, Void) - # push gradient, priority is negative index - push!(kvstore, idx, grad_arrays[idx], priority=-idx) - if update_on_kvstore - # pull back the weights - pull!(kvstore, idx, param_arrays[idx], priority=-idx) - else - # pull back the sum-ed gradients, to the same locations - pull!(kvstore, idx, grad_arrays[idx], priority=-idx) - end - end - - if !update_on_kvstore - # manual updating - for i_dev = 
1:num_dev - # create a fake index, so that the updater create states - # for different param AND different devices, TODO(mli) - # use a better solution later - fake_idx = idx * num_dev + i_dev - updater(fake_idx, grad_arrays[idx][i_dev], param_arrays[idx][i_dev]) - end - end - end - - # invoke callbacks after finishing each iteration - _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) - - # update evaluation metric on training set - load_label!(data, batch, cpu_label_arrays) - update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) - end # end of one epoch - - time_stop = time() - info(format("== Epoch {1:0>3d} ==========", i_epoch)) - info("## Training summary") - for (name, value) in get(opts.eval_metric) - info(format("{1:>15s} = {2:.4f}", name, value)) - end - info(format("{1:>15s} = {2:.4f} seconds", "time", time_stop-time_start)) - - # evaluation on validation set - if !isa(opts.eval_data, Void) - # because we are re-using the memory allocated for the training network, - # the batch_size of the validation dataset must be the same as the training - # batch_size - @assert(get_batch_size(opts.eval_data) == batch_size) - - reset!(opts.eval_metric) - for batch in eachbatch(opts.eval_data) - load_data!(opts.eval_data, batch, data_arrays) - - # forward and backward - for (texec, islice) in zip(train_execs, slices) - forward(texec, is_train=true) - - # copy outputs into cpu ndarray, for evaluation metric - for (cpu_out, dev_out) in zip(cpu_output_arrays, texec.outputs) - copy!(slice(cpu_out, islice), dev_out) - end - end - load_label!(opts.eval_data, batch, cpu_label_arrays) - update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) - end - - info("## Validation summary") - for (name, value) in get(opts.eval_metric) - info(format("{1:>15s} = {2:.4f}", name, value)) - end - end - - if i_epoch == opts.n_epoch || any(x->isa(x, AbstractEpochCallback), opts.callbacks) - # copy data back to cpu - for (name, weights) in zip(param_names, 
param_arrays) - # average parameters across devices - weight = +([copy(w, cpu()) for w in weights]...) / length(weights) - copy!(self.arg_params[name], weight) - end - for (name, aux_devs) in zip(aux_names, aux_arrays) - aux_avg = +([copy(aux, cpu()) for aux in aux_devs]...) / length(aux_devs) - copy!(self.aux_params[name], aux_avg) - end - end - _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) - end # end of all epochs -end - -function save_checkpoint(self :: FeedForward, prefix :: AbstractString, state :: OptimizationState) - save_checkpoint(self.arch, self.arg_params, self.aux_params, prefix, state.curr_epoch) -end -function save_checkpoint(sym :: Node, arg_params :: Dict{Base.Symbol, NDArray}, - aux_params :: Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) - save("$prefix-symbol.json", sym) - save_dict = merge(Dict([symbol("arg:$k") => v for (k,v) in arg_params]), - Dict([symbol("aux:$k") => v for (k,v) in aux_params])) - save_filename = format("{1}-{2:04d}.params", prefix, epoch) - save(save_filename, save_dict) - info("Saved checkpoint to '$save_filename'") -end - -function load_checkpoint(prefix :: AbstractString, epoch :: Int) - arch = load("$prefix-symbol.json", Node) - saved_dict = load(format("{1}-{2:04d}.params", prefix, epoch), NDArray) - arg_params = Dict{Base.Symbol, NDArray}() - aux_params = Dict{Base.Symbol, NDArray}() - for (k,v) in saved_dict - tp, name = split(string(k), ':') - name = symbol(name) - if tp == "arg" - arg_params[name] = v - else - aux_params[name] = v - end - end - - return (arch, arg_params, aux_params) -end - -function load_checkpoint(prefix :: AbstractString, epoch :: Int, ::Type{FeedForward}) - arch, arg_params, aux_params = load_checkpoint(prefix, epoch) - model = FeedForward(arch) - model.arg_params = arg_params - model.aux_params = aux_params - return model -end - -function load_checkpoint(self :: FeedForward, prefix :: AbstractString, epoch :: Int; overwrite :: Bool = true) - if 
isdefined(self, :arg_params) && isdefined(self, :aux_params) && !overwrite - info("model weights already exists, skip loading... (call with overwrite=true if needed)") - return self - end - - arch, arg_params, aux_params = load_checkpoint(prefix, epoch) - # TODO: is there better way to compare two symbols - @assert(to_json(self.arch) == to_json(arch), "Cannot load from a checkpoint with different network architecture") - self.arg_params = arg_params - self.aux_params = aux_params - return self -end - diff --git a/src/name.jl-e b/src/name.jl-e deleted file mode 100644 index 5ebf10917ce6..000000000000 --- a/src/name.jl-e +++ /dev/null @@ -1,44 +0,0 @@ -abstract AbstractNameManager -typealias NameType Union{Base.Symbol, AbstractString} -typealias NameCounter Dict{Base.Symbol, Int} - -import Base: get! - -# Default implementation for generating a name for a symbol. -# When a name is specified by the user, it will be used. Otherwise, a name -# is automatically generated based on the hint string. 
-function _default_get_name!(counter :: NameCounter, name :: NameType, hint :: NameType) - if isa(name, Base.Symbol) || !isempty(name) - return symbol(name) - end - - hint = symbol(hint) - if !haskey(counter, hint) - counter[hint] = 0 - end - name = symbol("$hint$(counter[hint])") - counter[hint] += 1 - return name -end - -type BasicNameManager <: AbstractNameManager - counter :: NameCounter -end -BasicNameManager() = BasicNameManager(NameCounter()) - -function get!(manager :: BasicNameManager, name :: NameType, hint :: NameType) - _default_get_name!(manager.counter, name, hint) -end - -type PrefixNameManager <: AbstractNameManager - prefix :: Base.Symbol - counter :: NameCounter -end -PrefixNameManager(prefix :: NameType) = PrefixNameManager(symbol(prefix), NameCounter()) - -function get!(manager :: PrefixNameManager, name :: NameType, hint :: NameType) - name = _default_get_name!(manager.counter, name, hint) - return symbol("$(manager.prefix)$name") -end - -DEFAULT_NAME_MANAGER = BasicNameManager() diff --git a/src/ndarray.jl-e b/src/ndarray.jl-e deleted file mode 100644 index 82293d2fdbe9..000000000000 --- a/src/ndarray.jl-e +++ /dev/null @@ -1,800 +0,0 @@ -#=doc -NDArray API -=========== -=# - -# create a NDArray handle of specific shape -function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) - h_ref = Ref{MX_handle}(0) - shape = flipdim(MX_uint[shape...],1) - @mxcall(:MXNDArrayCreate, (Ptr{MX_uint}, MX_uint, Cint, Cint, Cint, Ref{MX_handle}), - shape, length(shape), ctx.device_type, ctx.device_id, delay_alloc, h_ref) - handle = MX_NDArrayHandle(h_ref[]) - return handle -end - -# create a handle to an empty NDArray, this handle can be used to hold -# results returned by libmx API calls -function _ndarray_alloc() - h_ref = Ref{MX_handle}(0) - @mxcall(:MXNDArrayCreateNone, (Ref{MX_handle},), h_ref) - return MX_NDArrayHandle(h_ref[]) -end - -################################################################################ -# 
NDArray Type -################################################################################ -#=doc -.. class:: NDArray - - Wrapper of the ``NDArray`` type in ``libmxnet``. This is the basic building block - of tensor-based computation. - - .. _ndarray-shape-note: - - .. note:: - - since C/C++ use row-major ordering for arrays while Julia follows a - column-major ordering. To keep things consistent, we keep the underlying data - in their original layout, but use *language-native* convention when we talk - about shapes. For example, a mini-batch of 100 MNIST images is a tensor of - C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory - have shape (28,28,1,100). -=# -type NDArray - handle :: MX_NDArrayHandle - writable :: Bool - - function NDArray(handle, writable=true) - new(handle, writable) - end -end - -function Base.show(io :: IO, arr :: NDArray) - print(io, "mx.NDArray$(size(arr))") -end - -function NDArray{T<:Real}(data :: Array{T}) - copy(data, cpu()) -end - -function Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) - Base.unsafe_convert(MX_handle, obj.handle) -end -Base.convert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) -Base.cconvert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) - -################################################################################ -# NDArray functions exported to the users -################################################################################ -#=doc -.. function:: context(arr :: NDArray) - - Get the context that this :class:`NDArray` lives on. -=# -function context(arr :: NDArray) - ref_typeid = Ref{Cint}(0) - ref_devid = Ref{Cint}(0) - @mxcall(:MXNDArrayGetContext, (MX_handle, Ref{Cint}, Ref{Cint}), - arr, ref_typeid, ref_devid) - return Context(ref_typeid[], ref_devid[]) -end - -#=doc -.. function:: - empty(shape :: Tuple, ctx :: Context) - empty(shape :: Tuple) - empty(dim1, dim2, ...) 
- - Allocate memory for an uninitialized :class:`NDArray` with specific shape. -=# -function empty{N}(shape :: NTuple{N, Int}) - empty(shape, cpu()) -end -function empty{N}(shape :: NTuple{N, Int}, ctx :: Context) - NDArray(_ndarray_alloc(shape, ctx, false)) -end -function empty(shape :: Int...) - empty(shape) -end - -#=doc -Interface functions similar to Julia Arrays -------------------------------------------- -=# - -#=doc -.. function:: - zeros(shape :: Tuple, ctx :: Context) - zeros(shape :: Tuple) - zeros(dim1, dim2, ...) - - Create zero-ed :class:`NDArray` with specific shape. -=# -function zeros{N}(shape :: NTuple{N, Int}) - zeros(shape, cpu()) -end -function zeros{N}(shape :: NTuple{N, Int}, ctx :: Context) - arr = empty(shape, ctx) - arr[:] = 0 - return arr -end -function zeros(shape :: Int...) - zeros(shape) -end - -#=doc -.. function:: - ones(shape :: Tuple, ctx :: Context) - ones(shape :: Tuple) - ones(dim1, dim2, ...) - - Create an :class:`NDArray` with specific shape and initialize with 1. -=# -function ones{N}(shape :: NTuple{N, Int}) - ones(shape, cpu()) -end -function ones{N}(shape :: NTuple{N, Int}, ctx :: Context) - arr = empty(shape, ctx) - arr[:] = 1 - return arr -end -function ones(shape :: Int...) - ones(shape) -end - -import Base: size, length, ndims, eltype - -#=doc -.. function:: - size(arr :: NDArray) - size(arr :: NDArray, dim :: Int) - - Get the shape of an :class:`NDArray`. The shape is in Julia's column-major convention. See - also the :ref:`notes on NDArray shapes `. -=# -function size(arr :: NDArray) - ref_ndim = Ref{MX_uint}(0) - ref_shape = Ref{Ptr{MX_uint}}(0) - @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), - arr, ref_ndim, ref_shape) - tuple(map(Int, flipdim(pointer_to_array(ref_shape[], ref_ndim[]),1))...) -end -function size(arr :: NDArray, dim :: Int) - size(arr)[dim] -end - -#=doc -.. function:: length(arr :: NDArray) - - Get the number of elements in an :class:`NDArray`. 
-=# -function length(arr :: NDArray) - prod(size(arr)) -end - -#=doc -.. function:: ndims(arr :: NDArray) - - Get the number of dimensions of an :class:`NDArray`. Is equivalent to ``length(size(arr))``. -=# -function ndims(arr :: NDArray) - length(size(arr)) -end - -#=doc -.. function:: eltype(arr :: NDArray) - - Get the element type of an :class:`NDArray`. Currently the element type is always ``mx.MX_float``. -=# -function eltype(arr :: NDArray) - MX_float -end - - -import Base: slice -#=doc -.. function:: slice(arr :: NDArray, start:stop) - - Create a view into a sub-slice of an :class:`NDArray`. Note only slicing at the slowest - changing dimension is supported. In Julia's column-major perspective, this is the last - dimension. For example, given an :class:`NDArray` of shape (2,3,4), ``slice(array, 2:3)`` will create - a :class:`NDArray` of shape (2,3,2), sharing the data with the original array. This operation is - used in data parallelization to split mini-batch into sub-batches for different devices. -=# -function slice(arr :: NDArray, ::Colon) - arr -end -function slice(arr :: NDArray, slice::UnitRange{Int}) - dim1 = size(arr)[end] - @assert(1 <= slice.start <= slice.stop <= dim1) - if slice.start == 1 && slice.stop == dim1 - return arr - end - - hdr_ref = Ref{MX_handle}(0) - # note Julia is 1-based, inclusive-inclusive indexing, while C++ is - # 0-based, inclusive-exclusive indexing. So 1:3 in Julia should - # translates into 0:3 in C++. - @mxcall(:MXNDArraySlice, (MX_handle, MX_uint, MX_uint, Ref{MX_handle}), - arr, slice.start-1, slice.stop, hdr_ref) - return NDArray(MX_NDArrayHandle(hdr_ref[]), arr.writable) -end - -import Base: setindex! - -#=doc -.. function:: setindex!(arr :: NDArray, val, idx) - - Assign values to an :class:`NDArray`. 
Elementwise assignment is not implemented, only the following - scenarios are supported - - - ``arr[:] = val``: whole array assignment, ``val`` could be a scalar or an array (Julia ``Array`` - or :class:`NDArray`) of the same shape. - - ``arr[start:stop] = val``: assignment to a *slice*, ``val`` could be a scalar or an array of - the same shape to the slice. See also :func:`slice`. -=# -function setindex!(arr :: NDArray, val :: Real, ::Colon) - @assert(arr.writable) - _set_value(val, arr) - return arr -end -function setindex!{T<:Real}(arr :: NDArray, val :: Array{T}, ::Colon) - copy!(arr, val) -end -function setindex!(arr :: NDArray, val :: NDArray, ::Colon) - copy!(arr, val) -end -function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, idx::UnitRange{Int}) - setindex!(slice(arr, idx), val, Colon()) -end - -#=doc -.. function:: getindex(arr :: NDArray, idx) - - Shortcut for :func:`slice`. A typical use is to write - - .. code-block:: julia - - arr[:] += 5 - - which translates into - - .. code-block:: julia - - arr[:] = arr[:] + 5 - - which furthur translates into - - .. code-block:: julia - - setindex!(getindex(arr, Colon()), 5, Colon()) - - .. note:: - - The behavior is quite different from indexing into Julia's ``Array``. For example, ``arr[2:5]`` - create a **copy** of the sub-array for Julia ``Array``, while for :class:`NDArray`, this is - a *slice* that shares the memory. -=# -import Base: getindex -"""Shortcut for `slice`. **NOTE** the behavior for Julia's built-in index slicing is to create a -copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. -""" -function getindex(arr :: NDArray, ::Colon) - return arr -end -function getindex(arr :: NDArray, idx::UnitRange{Int}) - slice(arr, idx) -end - -#=doc -Copying functions ------------------ -=# -import Base: copy!, copy, convert -#=doc -.. 
function:: - copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) - - Copy contents of ``src`` into ``dst``. -=# -function copy!(dst :: NDArray, src :: NDArray) - @assert(dst.writable) - if dst.handle == src.handle - warn("Copying an NDArray to itself") - return - end - - _copyto(src, dst) - return dst -end - -function copy!(dst :: Array{MX_float}, src :: NDArray) - @assert size(dst) == size(src) - @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{MX_float}, Csize_t), - src, pointer(dst), length(dst)) - return dst -end -function copy!{T<:Real}(dst :: Array{T}, src :: NDArray) - copy!(dst, copy(src)) -end - -function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) - @assert dst.writable - @assert size(dst) == size(src) - src = convert(Array{MX_float}, src) # this might involve copying - @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t), - dst.handle, pointer(src), length(src)) - return dst -end - -function copy_ignore_shape!{T<:Real}(dst :: NDArray, src :: Array{T}) - @assert dst.writable - @assert length(dst) == length(src) - src = convert(Array{MX_float}, src) # this might involve copying - @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t), - dst.handle, pointer(src), length(src)) - return dst -end - - -#=doc -.. function:: - copy(arr :: NDArray) - copy(arr :: NDArray, ctx :: Context) - copy(arr :: Array, ctx :: Context) - - Create a copy of an array. When no :class:`Context` is given, create a Julia ``Array``. - Otherwise, create an :class:`NDArray` on the specified context. 
-=# -# Create copy: NDArray -> Julia Array -function copy(arr :: NDArray) - j_arr = Array(MX_float, size(arr)) - copy!(j_arr, arr) -end - -# Create copy: NDArray -> NDArray in a given context -function copy(arr :: NDArray, ctx :: Context) - dst = NDArray(_ndarray_alloc(size(arr), ctx, true)) - copy!(dst, arr) -end - -# Create copy: Julia Array -> NDArray in a given context -function copy{T<:Real}(arr :: Array{T}, ctx :: Context) - dst = empty(size(arr), ctx) - copy!(dst, arr) -end - -#=doc -.. function:: convert(::Type{Array{T}}, arr :: NDArray) - - Convert an :class:`NDArray` into a Julia ``Array`` of specific type. -=# -# Convert copy: NDArray -> Julia Array -function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) - convert(t, copy(arr)) -end - - -#=doc -Basic arithmetics ------------------ -=# - -#=doc -.. function:: @inplace - - Julia does not support re-definiton of ``+=`` operator (like ``__iadd__`` in python), - When one write ``a += b``, it gets translated to ``a = a+b``. ``a+b`` will allocate new - memory for the results, and the newly allocated :class:`NDArray` object is then assigned - back to a, while the original contents in a is discarded. This is very inefficient - when we want to do inplace update. - - This macro is a simple utility to implement this behavior. Write - - .. code-block:: julia - - @mx.inplace a += b - - will translate into - - .. code-block:: julia - - mx.add_to!(a, b) - - which will do inplace adding of the contents of ``b`` into ``a``. 
-=# -macro inplace(stmt) - if stmt.head == :+= || stmt.head == :.+= - Expr(:call, :add_to!, esc(stmt.args[1]), esc(stmt.args[2])) - elseif stmt.head == :-= || stmt.head == :.-= - Expr(:call, :sub_from!, esc(stmt.args[1]), esc(stmt.args[2])) - elseif stmt.head == :.*= - Expr(:call, :mul_to!, esc(stmt.args[1]), esc(stmt.args[2])) - elseif stmt.head == :./= - Expr(:call, :div_from!, esc(stmt.args[1]), esc(stmt.args[2])) - else - error("unsupported inplace translation for $stmt") - end -end - -#=doc -.. function:: add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) - - Add a bunch of arguments into ``dst``. Inplace updating. -=# -function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) - @assert dst.writable - for arg in args - if isa(arg, Real) - _plus_scalar(dst, arg, dst) - else - _plus(dst, arg, dst) - end - end - return dst -end - -#=doc -.. function:: - +(args...) - .+(args...) - - Summation. Multiple arguments of either scalar or :class:`NDArray` could be - added together. Note at least the first or second argument needs to be an :class:`NDArray` to - avoid ambiguity of built-in summation. -=# -import Base: +, .+ -function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) - ret = copy(arg0, context(arg0)) - add_to!(ret, args...) -end -function .+(arg0 :: NDArray, args :: Union{Real, NDArray}...) - +(arg0, args...) -end -function +(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...) - +(arg1, arg0, args...) -end -function .+(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...) - .+(arg1, arg0, args...) -end - -#=doc -.. function:: sub_from!(dst :: NDArray, args :: Union{Real, NDArray}...) - - Subtract a bunch of arguments from ``dst``. Inplace updating. -=# -function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) - @assert dst.writable - if isa(arg, Real) - _minus_scalar(dst, arg, dst) - else - _minus(dst, arg, dst) - end -end - -#=doc -.. 
function:: - -(arg0, arg1) - -(arg0) - .-(arg0, arg1) - - Subtraction ``arg0 - arg1``, of scalar types or :class:`NDArray`. Or create - the negative of ``arg0``. -=# -import Base: -, .- -function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) - ret = copy(arg0, context(arg0)) - sub_from!(ret, arg1) -end -function .-(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) - -(arg0, arg1) -end -function -(arg0 :: Real, arg1 :: NDArray) - ret = -arg1 - add_to!(ret, arg0) - return ret -end -function .-(arg0 :: Real, arg1 :: NDArray) - -(arg0, arg1) -end - -function -(arg0 :: NDArray) - _mul_scalar(arg0, -1.0) -end - -#=doc -.. function:: mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) - - Elementwise multiplication into ``dst`` of either a scalar or an :class:`NDArray` of the same shape. - Inplace updating. -=# -function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) - @assert dst.writable - if isa(arg, Real) - _mul_scalar(dst, arg, dst) - else - _mul(dst, arg, dst) - end - return dst -end - -#=doc -.. function:: - .*(arg0, arg1) - - Elementwise multiplication of ``arg0`` and ``arg``, could be either scalar or :class:`NDArray`. -=# -import Base: .*, * -function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) - ret = copy(arg0, context(arg0)) - mul_to!(ret, arg) -end -function .*(arg0 :: Real, arg :: NDArray) - .*(arg, arg0) -end - -#=doc -.. function:: - *(arg0, arg1) - - Currently only multiplication a scalar with an :class:`NDArray` is implemented. Matrix multiplication - is to be added soon. -=# -function *(arg0 :: NDArray, arg :: Real) - ret = copy(arg0, context(arg0)) - mul_to!(ret, arg) -end -function *(arg0 :: Real, arg :: NDArray) - *(arg, arg0) -end - -#=doc -.. function:: div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) - - Elementwise divide a scalar or an :class:`NDArray` of the same shape from ``dst``. Inplace updating. 
-=# -function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) - @assert dst.writable - if isa(arg, Real) - _div_scalar(dst, arg, dst) - else - _div(dst, arg, dst) - end -end - -import Base: ./, / -#=doc -.. function:: ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) - - Elementwise dividing an :class:`NDArray` by a scalar or another :class:`NDArray` of the same shape. -=# -function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) - ret = copy(arg0, context(arg0)) - div_from!(ret, arg) -end - -#=doc -.. function:: /(arg0 :: NDArray, arg :: Real) - - Divide an :class:`NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. -=# -function /(arg0 :: NDArray, arg :: Real) - ./(arg0, arg) -end - -#=doc -IO --- -=# -#=doc -.. function:: load(filename, ::Type{NDArray}) - - Load NDArrays from binary file. - - :param AbstractString filename: the path of the file to load. It could be S3 or HDFS address. - :return: Either ``Dict{Base.Symbol, NDArray}`` or ``Vector{NDArray}``. - - If the ``libmxnet`` is built with the corresponding component enabled. Examples - - * ``s3://my-bucket/path/my-s3-ndarray`` - * ``hdfs://my-bucket/path/my-hdfs-ndarray`` - * ``/path-to/my-local-ndarray`` -=# -function load(filename::AbstractString, ::Type{NDArray}) - out_size = Ref{MX_uint}(0) - out_hdrs = Ref{Ptr{MX_handle}}(0) - out_name_size = Ref{MX_uint}(0) - out_names = Ref{char_pp}(0) - @mxcall(:MXNDArrayLoad, (char_p, Ref{MX_uint}, Ref{Ptr{MX_handle}}, Ref{MX_uint}, Ref{char_pp}), - filename, out_size, out_hdrs, out_name_size, out_names) - out_name_size = out_name_size[] - out_size = out_size[] - if out_name_size == 0 - return [NDArray(MX_NDArrayHandle(hdr)) for hdr in pointer_to_array(out_hdrs[], out_size)] - else - @assert out_size == out_name_size - return Dict([(symbol(bytestring(k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in - zip(pointer_to_array(out_names[], out_size), pointer_to_array(out_hdrs[], out_size))]) - end -end - -#=doc -.. 
function:: save(filename :: AbstractString, data) - - Save NDarrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built - with corresponding support. - - :param AbstractString filename: path to the binary file to write to. - :param data: data to save to file. - :type data: :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. -=# -function save(filename::AbstractString, data::NDArray) - save(filename, [data]) -end -function save(filename::AbstractString, data::Vector{NDArray}) - @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), - filename, length(data), MX_handle[data...], char_pp(0)) -end -function save(filename::AbstractString, data::Dict{Base.Symbol,NDArray}) - names = [k for k in keys(data)] - arrays = MX_handle[data[k] for k in names] - names = AbstractString[string(k) for k in names] - - @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), - filename, length(names), arrays, names) -end - -#=doc -libmxnet APIs -------------- -=# -################################################################################ -# NDArray functions dynamically imported from libmxnet -################################################################################ -function _invoke_mxfunction(func_handle::MX_handle, use_vars, scalars, mut_vars) - @mxcall(:MXFuncInvoke, - (MX_handle, Ptr{MX_handle}, Ptr{MX_float}, Ptr{MX_handle}), - func_handle, use_vars, scalars, mut_vars) -end - -@enum(LIBMX_FUNC_TYPE_MASK, - NDARRAY_ARG_BEFORE_SCALAR = 1, - ACCEPT_EMPTY_MUTATE_TARGET = (1 << 2) -) - -# Import corresponding math functions from base so the automatically defined libmxnet -# functions can overload them -import Base: sqrt - -#=doc -The libxmnet APIs are automatically imported from ``libmxnet.so``. The functions listed -here operate on :class:`NDArray` objects. The arguments to the functions are typically ordered -as - -.. 
code-block:: julia - - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) - -unless ``NDARRAY_ARG_BEFORE_SCALAR`` is not set. In this case, the scalars are put before the input arguments: - -.. code-block:: julia - - func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) - - -If ``ACCEPT_EMPTY_MUTATE_TARGET`` is set. An overloaded function without the output arguments will also be defined: - -.. code-block:: julia - - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) - -Upon calling, the output arguments will be automatically initialized with empty NDArrays. - -Those functions always return the output arguments. If there is only one output (the typical situation), that -object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. - -**autogen:EMBED:ndarray:EMBED:autogen** -=# -function _import_ndarray_functions(;gen_docs=false) - n_ref = Ref{MX_uint}(0) - h_ref = Ref{Ptr{MX_handle}}(0) - @mxcall(:MXListFunctions, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) - - n_funcs = n_ref[] - h_funcs = pointer_to_array(h_ref[], n_funcs) - - if gen_docs - docs = Dict{Base.Symbol, AbstractString}() - end - - for i = 1:n_funcs - func_handle = h_funcs[i] - - #---------------------------------------- - # get function information (human readable) - ref_name = Ref{char_p}(0) - ref_desc = Ref{char_p}(0) - ref_narg = Ref{MX_uint}(0) - - ref_arg_names = Ref{char_pp}(0) - ref_arg_types = Ref{char_pp}(0) - ref_arg_descs = Ref{char_pp}(0) - - @mxcall(:MXFuncGetInfo, - (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), - func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) - - func_name = symbol(bytestring(ref_name[])) - - if gen_docs - # generate document only - f_desc = bytestring(ref_desc[]) * "\n\n" - f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) - 
docs[func_name] = f_desc - else - #---------------------------------------- - # get function specification - ref_n_use_vars = Ref{MX_uint}(0) - ref_n_scalars = Ref{MX_uint}(0) - ref_n_mut_vars = Ref{MX_uint}(0) - ref_type_mask = Ref{Cint}(0) - @mxcall(:MXFuncDescribe, - (MX_handle, Ref{MX_uint}, Ref{MX_uint}, Ref{MX_uint}, Ref{Cint}), - func_handle, ref_n_use_vars, ref_n_scalars, ref_n_mut_vars, ref_type_mask) - - #---------------------------------------- - # prepare function definition - n_used_vars = ref_n_use_vars[] - n_scalars = ref_n_scalars[] - n_mutate_vars = ref_n_mut_vars[] - type_mask = ref_type_mask[] - accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 - arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 - - # general ndarray function - if arg_before_scalar - args = vcat([Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - else - args = vcat([Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - end - - _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...) - _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...) - _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...) - stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars) - if n_mutate_vars == 1 - stmt_ret = :(return out1) - else - stmt_ret = Expr(:return, Expr(:tuple, [symbol("out$i") for i=1:n_mutate_vars]...)) - end - - func_body = Expr(:block, stmt_call, stmt_ret) - func_head = Expr(:call, func_name, args...) 
- - func_def = Expr(:function, func_head, func_body) - eval(func_def) - - if accept_empty_mutate - args0 = args[1:n_used_vars+n_scalars] - func_head0 = Expr(:call, func_name, args0...) - _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] - stmt_call0 = Expr(:call, func_name, args0..., _mut_vars0...) - func_body0 = Expr(:block, stmt_call0) - func_head0 = Expr(:call, func_name, args0...) - - func_def0 = Expr(:function, func_head0, func_body0) - eval(func_def0) - end - end - end - - if gen_docs - return docs - end -end - diff --git a/src/optimizer.jl-e b/src/optimizer.jl-e deleted file mode 100644 index a5f0bfd5ec60..000000000000 --- a/src/optimizer.jl-e +++ /dev/null @@ -1,226 +0,0 @@ -#=doc -Optimizers -========== - -Common interfaces ------------------ -=# - - -#=doc -.. class:: AbstractOptimizer - - Base type for all optimizers. -=# -abstract AbstractOptimizer - -#=doc -.. class:: AbstractLearningRateScheduler - - Base type for all learning rate scheduler. -=# -abstract AbstractLearningRateScheduler - -#=doc -.. class:: AbstractMomentumScheduler - - Base type for all momentum scheduler. -=# -abstract AbstractMomentumScheduler - - - -#=doc -.. class:: OptimizationState - - .. attribute:: batch_size - - The size of the mini-batch used in stochastic training. - - .. attribute:: curr_epoch - - The current epoch count. Epoch 0 means no training yet, during the first - pass through the data, the epoch will be 1; during the second pass, the - epoch count will be 1, and so on. - - .. attribute:: curr_batch - - The current mini-batch count. The batch count is reset during every epoch. - The batch count 0 means the beginning of each epoch, with no mini-batch - seen yet. During the first mini-batch, the mini-batch count will be 1. - - .. attribute:: curr_iter - - The current iteration count. One iteration corresponds to one mini-batch, - but unlike the mini-batch count, the iteration count does **not** reset - in each epoch. 
So it track the *total* number of mini-batches seen so far. -=# -type OptimizationState - batch_size :: Int - curr_epoch :: Int - curr_batch :: Int - curr_iter :: Int -end -OptimizationState(batch_size::Int) = OptimizationState(batch_size, 0, 0, 0) - - -#=doc -.. function:: get_learning_rate(scheduler, state) - - :param AbstractLearningRateScheduler scheduler: a learning rate scheduler. - :param OptimizationState state: the current state about epoch, mini-batch and iteration count. - :return: the current learning rate. -=# -function get_learning_rate -end - -################################################################################ -# The learning rate module -module LearningRate -import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate - -#=doc -.. class:: LearningRate.Fixed - - Fixed learning rate scheduler always return the same learning rate. -=# -type Fixed <: AbstractLearningRateScheduler - learning_rate :: Float64 -end -get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rate - -#=doc -.. class:: LearningRate.Exp - - :math:`\eta_t = \eta_0\gamma^t`. Here :math:`t` is the epoch count, or the iteration - count if ``decay_on_iteration`` is set to true. -=# -type Exp <: AbstractLearningRateScheduler - learning_rate :: Float64 - gamma :: Float64 - on_iteration :: Bool -end -function Exp(base_lr::Real; gamma::Real=0.9, decay_on_iteration::Bool=false) - @assert(0 < gamma < 1) - Exp(Float64(base_lr), Float64(gamma), decay_on_iteration) -end -get_learning_rate(self :: Exp, state :: OptimizationState) = - self.learning_rate * self.gamma ^ (self.on_iteration ? state.curr_iter : state.curr_epoch) - -end # module LearningRate -################################################################################ -function get_lr_scheduler(scheduler :: Any, lr :: Real) - if isa(scheduler, AbstractLearningRateScheduler) - return scheduler - else - return LearningRate.Fixed(lr) - end -end - - -#=doc -.. 
function:: get_momentum(scheduler, state) - - :param AbstractMomentumScheduler scheduler: the momentum scheduler. - :param OptimizationState state: the state about current epoch, mini-batch and iteration count. - :return: the current momentum. -=# -function get_momentum -end - - -################################################################################ -# The Momentum module -module Momentum -import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum - -#=doc -.. class:: Momentum.Null - - The null momentum scheduler always returns 0 for momentum. It is also used to - explicitly indicate momentum should not be used. -=# -type Null <: AbstractMomentumScheduler -end -get_momentum(self :: Null, state :: OptimizationState) = 0.0 - -#=doc -.. class:: Momentum.Fixed - - Fixed momentum scheduler always returns the same value. -=# -type Fixed <: AbstractMomentumScheduler - momentum :: Float64 -end -get_momentum(self :: Fixed, state :: OptimizationState) = self.momentum -end # module Momentum -################################################################################ -function get_momentum_scheduler(scheduler :: Any, momentum :: Real) - if isa(scheduler, AbstractMomentumScheduler) - return scheduler - elseif momentum == 0 - return Momentum.Null() - else - return Momentum.Fixed(momentum) - end -end - - -#=doc -.. function:: get_updater(optimizer) - - :param AbstractOptimizer optimizer: the underlying optimizer. - - A utility function to create an updater function, that uses its closure to - store all the states needed for each weights. 
-=# -function get_updater(optimizer :: AbstractOptimizer) - states = Dict{Int,Any}() - function updater(index :: Int, grad :: NDArray, weight :: NDArray) - if !haskey(states, index) - states[index] = create_state(optimizer, index, weight) - end - update(optimizer, index, weight, grad, states[index]) - end - return updater -end - -################################################################################ -#=doc -Built-in optimizers -------------------- -=# - -#=doc -.. class:: AbstractOptimizerOptions - - Base class for all optimizer options. -=# -abstract AbstractOptimizerOptions - -#=doc -.. function:: normalized_gradient(opts, state, grad) - - :param AbstractOptimizerOptions opts: options for the optimizer, should contain the field - ``grad_scale``, ``grad_clip`` and ``weight_decay``. - :param OptimizationState state: the current optimization state. - :param NDArray weight: the trainable weights. - :param NDArray grad: the original gradient of the weights. - - Get the properly normalized gradient (re-scaled and clipped if necessary). 
-=# -function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState, - weight::NDArray, grad::NDArray) - grad_scale = opts.grad_scale / state.batch_size - - grad = grad_scale * grad - if opts.grad_clip > 0 - grad = clip(grad, -opts.grad_clip, opts.grad_clip) - end - @inplace grad += opts.weight_decay * weight - - return grad -end - -include("optimizers/sgd.jl") -include("optimizers/adam.jl") diff --git a/src/random.jl-e b/src/random.jl-e deleted file mode 100644 index 79a8b6e9e20b..000000000000 --- a/src/random.jl-e +++ /dev/null @@ -1,25 +0,0 @@ -function rand!(low::Real, high::Real, out::NDArray) - _random_uniform(low, high, out) -end -function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}) - rand(low, high, shape, cpu()) -end -function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context) - out = empty(shape, ctx) - rand!(low, high, out) -end - -function randn!(mean::Real, stdvar::Real, out::NDArray) - _random_gaussian(mean, stdvar, out) -end -function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}) - randn(mean, stdvar, shape, cpu()) -end -function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context) - out = empty(shape, ctx) - randn!(mean, stdvar, out) -end - -function srand!(seed_state::Int) - @mxcall(:MXRandomSeed, (Cint,), seed_state) -end diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 0c3760240844..b33c89c18616 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -279,7 +279,7 @@ end libmxnet APIs ------------- -**autogen:EMBED:SymbolicNode:EMBED:autogen** +**autogen:EMBED:symbolic-node:EMBED:autogen** =# ################################################################################ # Atomic SymbolicNode functions dynamically imported from libmxnet diff --git a/src/symbolic-node.jl-e b/src/symbolic-node.jl-e deleted file mode 100644 index 337d50864684..000000000000 --- a/src/symbolic-node.jl-e +++ /dev/null @@ -1,437 +0,0 @@ -#=doc -Symbolic API 
-============ -=# - -#=doc -.. class:: Node - - Node is the basic building block of the symbolic graph in MXNet.jl. - - .. note:: - - Throughout this documentation, ``Node`` always refer to this :class:`Node` type. - When we refer to the Julia's build-in Node type (e.g. ``typeof(:foo)``), we always - say ``Base.Symbol``. -=# -type Node - handle :: MX_SymbolHandle -end -function Base.unsafe_convert(::Type{MX_handle}, obj::Node) - Base.unsafe_convert(MX_handle, obj.handle) -end -Base.convert(t::Type{MX_handle}, obj::Node) = Base.unsafe_convert(t, obj) -Base.cconvert(t::Type{MX_handle}, obj::Node) = Base.unsafe_convert(t, obj) - -#=doc -.. function:: deepcopy(self :: Node) - - Make a deep copy of a Node. -=# -function Base.deepcopy(self :: Node) - ref_hdr = Ref{MX_handle}(0) - @mxcall(:MXSymbolCopy, (MX_handle, Ref{MX_handle}), self, ref_hdr) - return Node(MX_SymbolHandle(ref_hdr[])) -end - -#=doc -.. function:: copy(self :: Node) - - Make a copy of a Node. The same as making a deep copy. -=# -function Base.copy(self :: Node) - Base.deepcopy(self) -end - -function Base.call(self :: Node, args :: Node...) - s = deepcopy(self) - _compose!(s, args...) -end -function Base.call(self :: Node; kwargs...) - s = deepcopy(self) - _compose!(s; kwargs...) -end - -macro _list_symbol_info(self, func_name) - quote - ref_sz = Ref{MX_uint}(0) - ref_names = Ref{char_pp}(0) - @mxcall($func_name, (MX_handle, Ref{MX_uint}, Ref{char_pp}), - $self, ref_sz, ref_names) - narg = ref_sz[] - names = pointer_to_array(ref_names[], narg) - names = [symbol(bytestring(x)) for x in names] - return names - end -end -function list_arguments(self :: Node) - @_list_symbol_info(self, :MXSymbolListArguments) -end -function list_outputs(self :: Node) - @_list_symbol_info(self, :MXSymbolListOutputs) -end -"""List all auxiliary states in the symbool. - -Auxiliary states are special states of symbols that do not corresponds to an argument, -and do not have gradient. 
But still be useful for the specific operations. -A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. -Most operators do not have Auxiliary states. -""" -function list_auxiliary_states(self :: Node) - @_list_symbol_info(self, :MXSymbolListAuxiliaryStates) -end - -"Get a new grouped Node whose output contains all the internal outputs of this Node." -function get_internals(self :: Node) - ref_hdr = Ref{MX_handle}(0) - @mxcall(:MXSymbolGetInternals, (MX_handle, Ref{MX_handle}), self, ref_hdr) - return Node(MX_SymbolHandle(ref_hdr[])) -end - -"Create a symbolic variable with the given name" -function Variable(name :: Union{Base.Symbol, AbstractString}) - hdr_ref = Ref{MX_handle}(0) - @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) - Node(MX_SymbolHandle(hdr_ref[])) -end - -"Create a Node that groups symbols together" -function Group(symbols :: Node...) - handles = MX_handle[symbols...] - ref_hdr = Ref{MX_handle}(0) - @mxcall(:MXSymbolCreateGroup, (MX_uint, Ptr{MX_handle}, Ref{MX_handle}), - length(handles), handles, ref_hdr) - Node(MX_SymbolHandle(ref_hdr[])) -end - -macro _infer_shape(self, keys, indptr, sdata) - quote - ref_arg_shape_size = Ref{MX_uint}(0) - ref_arg_shape_ndim = Ref{Ptr{MX_uint}}(0) - ref_arg_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) - ref_out_shape_size = Ref{MX_uint}(0) - ref_out_shape_ndim = Ref{Ptr{MX_uint}}(0) - ref_out_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) - ref_aux_shape_size = Ref{MX_uint}(0) - ref_aux_shape_ndim = Ref{Ptr{MX_uint}}(0) - ref_aux_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) - ref_complete = Ref{Cint}(0) - @mxcall(:MXSymbolInferShape, - (MX_handle, MX_uint, char_pp, Ptr{MX_uint}, Ptr{MX_uint}, - Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, - Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, - Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, - Ref{Cint}), - self, length(indptr)-1, keys, indptr, sdata, - ref_arg_shape_size, ref_arg_shape_ndim, 
ref_arg_shape_data, - ref_out_shape_size, ref_out_shape_ndim, ref_out_shape_data, - ref_aux_shape_size, ref_aux_shape_ndim, ref_aux_shape_data, - ref_complete) - if ref_complete[] == 0 - return (nothing, nothing, nothing) - else - function build_shapes(shape_size::MX_uint, shape_ndim::Ptr{MX_uint}, shape_data::Ptr{Ptr{MX_uint}}) - shape_ndim = pointer_to_array(shape_ndim, shape_size) - shape_data = pointer_to_array(shape_data, shape_size) - shapes = map(1:shape_size) do i - my_shape = pointer_to_array(shape_data[i], shape_ndim[i]) - tuple(flipdim(Int[my_shape...],1)...) - end - convert(Vector{Tuple}, shapes) - end - return ( - build_shapes(ref_arg_shape_size[], ref_arg_shape_ndim[], ref_arg_shape_data[]), - build_shapes(ref_out_shape_size[], ref_out_shape_ndim[], ref_out_shape_data[]), - build_shapes(ref_aux_shape_size[], ref_aux_shape_ndim[], ref_aux_shape_data[]) - ) - end - end -end -function infer_shape(self :: Node; kwargs...) - sdata = MX_uint[] - indptr = MX_uint[0] - for (k,v) in kwargs - append!(sdata, flipdim([v...],1)) - push!(indptr, length(sdata)) - end - keys = AbstractString[string(x[1]) for x in kwargs] - @_infer_shape(self, keys, indptr, sdata) -end -function infer_shape(self :: Node, args :: Union{Tuple, Void}...) 
- sdata = MX_uint[] - indptr = MX_uint[0] - for arg in args - if isa(arg, Void); continue; end - append!(sdata, flipdim([arg...],1)) - push!(indptr, length(sdata)) - end - keys = Ptr{char_p}(0) - @_infer_shape(self, keys, indptr, sdata) -end - -function Base.getindex(self :: Node, idx :: Union{Base.Symbol, AbstractString}) - idx = symbol(idx) - i_idx = find(idx .== list_outputs(self)) - @assert(length(i_idx) > 0, "Cannot find output with name '$idx'") - @assert(length(i_idx) < 2, "Found duplicated output with name '$idx'") - Base.getindex(self, i_idx[1]) -end -function Base.getindex(self :: Node, idx :: Int) - ref_hdr = Ref{MX_handle}(0) - # note Julia is 1-based, while MXNet is 0-based - @mxcall(:MXSymbolGetOutput, (MX_handle, MX_uint, Ref{MX_handle}), self, idx-1, ref_hdr) - return Node(MX_SymbolHandle(ref_hdr[])) -end - -import Base: +, .+ -function +(self :: Node, args :: Node...) - ret = self - for arg in args - ret = _Plus(ret, arg) - end - ret -end -function .+(self :: Node, args :: Node...) - +(self, args...) -end - -import Base: -, .- -function -(self :: Node, arg :: Node) - _Minus(self, arg) -end -function .-(self :: Node, arg :: Node) - -(self, arg) -end - -import Base: .* -function .*(self :: Node, args :: Node...) - ret = self - for arg in args - ret = _Mul(ret, arg) - end - ret -end - -import Base: ./ -function ./(self :: Node, arg :: Node) - _Div(self, arg) -end - -function _compose!(sym :: Node; kwargs...) - name = char_p(0) - arg_keys = AbstractString[] - arg_vals = MX_handle[] - - for (k,v) in kwargs - if k == :name - name = string(v) - else - @assert(isa(v, Node), "Compose expect `Node` as arguments") - push!(arg_keys, string(k)) - push!(arg_vals, v) - end - end - - @mxcall(:MXSymbolCompose, - (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}), - sym, name, length(arg_keys), arg_keys, arg_vals) - return sym -end -function _compose!(sym :: Node, args::Node...) - _compose!(sym, char_p(0), args...) 
-end -function _compose!(sym :: Node, name :: Union{Base.Symbol, char_p}, args::Node...) - if isa(name, Base.Symbol); name = string(name); end - arg_keys = Ptr{char_p}(0) - arg_vals = MX_handle[args...] - - @mxcall(:MXSymbolCompose, - (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}), - sym, name, length(arg_vals), arg_keys, arg_vals) - return sym -end - -"""Save Node into a JSON string""" -function to_json(self :: Node) - ref_json = Ref{char_p}(0) - @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json) - return bytestring(ref_json[]) -end - -"""Load Node from a JSON string representation.""" -function from_json(repr :: AbstractString, ::Type{Node}) - ref_hdr = Ref{MX_handle}(0) - @mxcall(:MXSymbolCreateFromJSON, (char_p, Ref{MX_handle}), repr, ref_hdr) - return Node(MX_SymbolHandle(ref_hdr[])) -end - -"""Load Node from a JSON file.""" -function load(filename :: AbstractString, ::Type{Node}) - ref_hdr = Ref{MX_handle}(0) - @mxcall(:MXSymbolCreateFromFile, (char_p, Ref{MX_handle}), filename, ref_hdr) - return Node(MX_SymbolHandle(ref_hdr[])) -end -function save(filename :: AbstractString, sym :: Node) - @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), sym, filename) -end - -#=doc -libmxnet APIs -------------- - -**autogen:EMBED:Node:EMBED:autogen** -=# -################################################################################ -# Atomic Node functions dynamically imported from libmxnet -################################################################################ -function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) - ref_name = Ref{char_p}(0) - ref_desc = Ref{char_p}(0) - ref_kv_nargs = Ref{char_p}(0) - ref_nargs = Ref{MX_uint}(0) - ref_arg_names = Ref{char_pp}(0) - ref_arg_types = Ref{char_pp}(0) - ref_arg_descs = Ref{char_pp}(0) - - @mxcall(:MXSymbolGetAtomicSymbolInfo, - (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, - Ref{char_pp}, Ref{char_p}), - hdr, ref_name, ref_desc, 
ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, ref_kv_nargs) - - func_name = symbol(bytestring(ref_name[])) - kv_nargs_s = bytestring(ref_kv_nargs[]) - kv_nargs = symbol(kv_nargs_s) - - if gen_docs - f_desc = bytestring(ref_desc[]) * "\n\n" - if !isempty(kv_nargs_s) - f_desc *= "This function support variable length positional :class:`Node` inputs.\n\n" - end - f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param Base.Symbol name: The name of the Node. (e.g. `:my_symbol`), optional.\n\n" - f_desc *= ":return: the constructed :class:`Node`.\n\n" - return (func_name, f_desc) - end - - # function $func_name(args...; kwargs...) - func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) - func_body = quote - idx = findfirst(x -> x[1] == :name, kwargs) - if idx > 0 - name = kwargs[idx][2] - else - name = "" - end - - param_keys = AbstractString[] - param_vals = AbstractString[] - symbol_kws = Dict{Base.Symbol, Node}() - - $(if kv_nargs != symbol("") - quote - if !in($kv_nargs_s, param_keys) - push!(param_keys, $kv_nargs_s) - push!(param_vals, string(length(args))) - end - end - end) - - for (k,v) in kwargs - if k == :name; continue; end - if isa(v, Node) - symbol_kws[k] = v - else - push!(param_keys, string(k)) - push!(param_vals, dump_mx_param(v)) - end - end - - if length(args) != 0 && length(symbol_kws) != 0 - @assert(false, "$func_name only accepts Symbols either as positional or keyword arguments, not both.") - end - $(if kv_nargs != symbol("") - quote - if length(symbol_kws) > 0 - @assert(false, "$func_name takes variable number of Node arguments, please pass input Symbols " * - "via positional arguments, instead of keyword arguments.") - end - end - end) - - # create the Node - ref_sym_hdr = Ref{MX_handle}() - @mxcall(:MXSymbolCreateAtomicSymbol, - (MX_handle, MX_uint, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}), - $hdr, length(param_keys), param_keys, param_vals, 
ref_sym_hdr) - sym_hdr = ref_sym_hdr[] - - sym = Node(MX_SymbolHandle(sym_hdr)) - hint = lowercase(string($func_name)) - name = get!(DEFAULT_NAME_MANAGER, name, hint) - - if length(args) != 0 - _compose!(sym, name, args...) - else - _compose!(sym; name=name, symbol_kws...) - end - - return sym - end - - func_def = Expr(:function, func_head, Expr(:block, func_body)) - eval(func_def) -end - -function _import_atomic_symbol_creators(;gen_docs=false) - n_ref = Ref{MX_uint}(0) - h_ref = Ref{Ptr{MX_handle}}(0) - @mxcall(:MXSymbolListAtomicSymbolCreators, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) - - n_creators = n_ref[] - h_creators = pointer_to_array(h_ref[], n_creators) - - if gen_docs - docs = Dict{Base.Symbol, AbstractString}() - end - - for i = 1:n_creators - creator_hdr = h_creators[i] - ret = _define_atomic_symbol_creator(creator_hdr, gen_docs=gen_docs) - if gen_docs - docs[ret[1]] = ret[2] - end - end - - if gen_docs - return docs - end -end - -################################################################################ -# Utility macros to chain up symbols -################################################################################ -macro chain(layers) - exprs = [] - last_layer = nothing - function _chain_layer(layer, last_layer) - if isa(last_layer, Void) - esc(layer) - else - @assert(isa(layer, Expr) && layer.head == :call, "Do not know how to chain up $layer") - return Expr(:call, esc(layer.args[1]), last_layer, map(esc, layer.args[2:end])...) - end - end - while true - if layers.head == :(=>) - new_layer = gensym() - push!(exprs, :($new_layer = $(_chain_layer(layers.args[1], last_layer)))) - last_layer = new_layer - layers = layers.args[2] - else - push!(exprs, _chain_layer(layers, last_layer)) - break - end - end - return Expr(:block, exprs...) 
-end - diff --git a/src/util.jl-e b/src/util.jl-e deleted file mode 100644 index 4ca613cbf7d1..000000000000 --- a/src/util.jl-e +++ /dev/null @@ -1,70 +0,0 @@ -################################################################################ -# Dataset related utilities -################################################################################ -function get_data_dir() - data_dir = joinpath(Pkg.dir("MXNet"), "data") - mkpath(data_dir) - data_dir -end - -function get_mnist_ubyte() - data_dir = get_data_dir() - mnist_dir = joinpath(data_dir, "mnist") - mkpath(mnist_dir) - filenames = Dict(:train_data => "train-images-idx3-ubyte", - :train_label => "train-labels-idx1-ubyte", - :test_data => "t10k-images-idx3-ubyte", - :test_label => "t10k-labels-idx1-ubyte") - filenames = [k => joinpath(mnist_dir, v) for (k,v) in filenames] - if !all(isfile, values(filenames)) - cd(mnist_dir) do - run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip`) - run(`unzip -u mnist.zip`) - end - end - return filenames -end - -function get_cifar10() - data_dir = get_data_dir() - cifar10_dir = joinpath(data_dir, "cifar10") - mkpath(cifar10_dir) - filenames = Dict(:train => "cifar/train.rec", :test => "cifar/test.rec") - filenames = [k => joinpath(cifar10_dir, v) for (k,v) in filenames] - if !all(isfile, values(filenames)) - cd(cifar10_dir) do - run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/cifar10.zip`) - run(`unzip -u cifar10.zip`) - end - end - - filenames[:mean] = joinpath(cifar10_dir, "cifar/cifar_mean.bin") - return filenames -end - - -################################################################################ -# Internal Utilities -################################################################################ -const DOC_EMBED_ANCHOR = "**autogen:EMBED:{1}:EMBED:autogen**" -function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{char_pp}, arg_descs::Ref{char_pp}, remove_dup::Bool=true) - param_keys = Set{AbstractString}() - - arg_names = 
pointer_to_array(arg_names[], narg) - arg_types = pointer_to_array(arg_types[], narg) - arg_descs = pointer_to_array(arg_descs[], narg) - docstrings = AbstractString[] - - for i = 1:narg - arg_name = bytestring(arg_names[i]) - if arg_name ∈ param_keys && remove_dup - continue - end - push!(param_keys, arg_name) - - arg_type = bytestring(arg_types[i]) - arg_desc = bytestring(arg_descs[i]) - push!(docstrings, ":param $arg_name: $arg_desc\n:type $arg_name: $arg_type\n\n") - end - return join(docstrings, "\n") -end From c13f88f7c04883e721c8d24c20ea2dc02d5765e2 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 15:49:45 -0500 Subject: [PATCH 187/630] add nn-factory --- README.md | 8 ++------ examples/mnist/mlp.jl | 17 ++++++++++------ src/MXNet.jl | 2 ++ src/nn-factory.jl | 46 +++++++++++++++++++++++++++++++++++++++++++ 4 files changed, 61 insertions(+), 12 deletions(-) create mode 100644 src/nn-factory.jl diff --git a/README.md b/README.md index 10862ff8a6a6..7dc99a24a7b4 100644 --- a/README.md +++ b/README.md @@ -15,12 +15,8 @@ Here is an exmple of how training a simple 3-layer MLP on MNIST looks like: ```julia using MXNet -mlp = @mx.chain mx.Variable(:data) => - mx.FullyConnected(name=:fc1, num_hidden=128) => - mx.Activation(name=:relu1, act_type=:relu) => - mx.FullyConnected(name=:fc2, num_hidden=64) => - mx.Activation(name=:relu2, act_type=:relu) => - mx.FullyConnected(name=:fc3, num_hidden=10) => +mlp = @mx.chain mx.Variable(:data) => + mx.MLP([128, 64, 10]) => mx.SoftmaxOutput(name=:softmax) # data provider diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index f6fbbd5c0870..cdb0064da8e5 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -14,12 +14,17 @@ using MXNet # mlp = mx.SoftmaxOutput(data = fc3, name=:softmax) #-- Option 2: using the mx.chain macro -mlp = @mx.chain mx.Variable(:data) => - mx.FullyConnected(name=:fc1, num_hidden=128) => - mx.Activation(name=:relu1, act_type=:relu) => - mx.FullyConnected(name=:fc2, 
num_hidden=64) => - mx.Activation(name=:relu2, act_type=:relu) => - mx.FullyConnected(name=:fc3, num_hidden=10) => +# mlp = @mx.chain mx.Variable(:data) => +# mx.FullyConnected(name=:fc1, num_hidden=128) => +# mx.Activation(name=:relu1, act_type=:relu) => +# mx.FullyConnected(name=:fc2, num_hidden=64) => +# mx.Activation(name=:relu2, act_type=:relu) => +# mx.FullyConnected(name=:fc3, num_hidden=10) => +# mx.SoftmaxOutput(name=:softmax) + +#-- Option 3: using nn-factory +mlp = @mx.chain mx.Variable(:data) => + mx.MLP([128, 64, 10]) => mx.SoftmaxOutput(name=:softmax) # data provider diff --git a/src/MXNet.jl b/src/MXNet.jl index f9f9e8664c4f..a3e280d26a11 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -30,6 +30,8 @@ include("model.jl") include("util.jl") +include("nn-factory.jl") + end # mx end # module MXNet diff --git a/src/nn-factory.jl b/src/nn-factory.jl new file mode 100644 index 000000000000..79aec78a1746 --- /dev/null +++ b/src/nn-factory.jl @@ -0,0 +1,46 @@ +#=doc +Neural Networks Factory +======================= + +Neural network factory provide convenient helper functions to define +common neural networks. +=# + +#=doc +.. function:: MLP(input, spec) + + Construct a multi-layer perceptron. + + :param SymbolicNode input: the input to the mlp. + :param spec: the mlp specification, a list of hidden dimensions. For example, + ``[128, (512, :sigmoid), 10]``. The number in the list indicate the + number of hidden units in each layer. A tuple could be used to specify + the activation of each layer. Otherwise, the default activation will + be used (except for the last layer). + :param Base.Symbol hidden_activation: keyword argument, default ``:relu``, indicating + the default activation for hidden layers. The specification here could be overwritten + by layer-wise specification in the ``spec`` argument. Also activation is not + applied to the last, i.e. the prediction layer. 
+ :param prefix: keyword argument, default ``gensym()``, used as the prefix to + name the constructed layers. +=# +function MLP(input, spec; hidden_activation::Base.Symbol=:relu, prefix=gensym()) + spec = convert(Vector{Union{Int,Tuple}}, spec) + + n_layer = length(spec) + for (i, s) in enumerate(spec) + if isa(s, Tuple) + n_unit, act_type = s + else + n_unit = s + act_type = hidden_activation + end + input = FullyConnected(input, name=symbol(prefix, "fc$i"), num_hidden=n_unit) + if i < n_layer || isa(s, Tuple) + # will not add activation unless the user explicitly specified + input = Activation(input, name=symbol(prefix, "$act_type$i"), act_type=act_type) + end + end + + return input +end From 3bc475a2e16391e7faffe2fd4e809d6f20751c9b Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 15:50:45 -0500 Subject: [PATCH 188/630] add doc for nn factory --- docs/api/nn-factory.rst | 29 +++++++++++++++++++++++++++++ docs/build-api.jl | 2 ++ docs/index.rst | 1 + 3 files changed, 32 insertions(+) create mode 100644 docs/api/nn-factory.rst diff --git a/docs/api/nn-factory.rst b/docs/api/nn-factory.rst new file mode 100644 index 000000000000..02e3d2ca73f1 --- /dev/null +++ b/docs/api/nn-factory.rst @@ -0,0 +1,29 @@ + +Neural Networks Factory +======================= + +Neural network factory provide convenient helper functions to define +common neural networks. + + + + +.. function:: MLP(input, spec) + + Construct a multi-layer perceptron. + + :param SymbolicNode input: the input to the mlp. + :param spec: the mlp specification, a list of hidden dimensions. For example, + ``[128, (512, :sigmoid), 10]``. The number in the list indicate the + number of hidden units in each layer. A tuple could be used to specify + the activation of each layer. Otherwise, the default activation will + be used (except for the last layer). + :param Base.Symbol hidden_activation: keyword argument, default ``:relu``, indicating + the default activation for hidden layers. 
The specification here could be overwritten + by layer-wise specification in the ``spec`` argument. Also activation is not + applied to the last, i.e. the prediction layer. + :param prefix: keyword argument, default ``gensym()``, used as the prefix to + name the constructed layers. + + + diff --git a/docs/build-api.jl b/docs/build-api.jl index 510426ee2004..d49996a24cb3 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -92,3 +92,5 @@ extract_doc("optimizer.rst", "optimizer.jl") extract_doc("io.rst", "io.jl") embed_mxnet_api("io.rst", "io", mx._import_io_iterators) + +extract_doc("nn-factory.rst", "nn-factory.jl") diff --git a/docs/index.rst b/docs/index.rst index 6203ad3a1af4..c10f44780a2b 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -39,6 +39,7 @@ For more details, see documentation below. Please also checkout the `examples api/io api/ndarray api/symbolic-node + api/nn-factory api/executor Indices and tables From 41c20ae0ca7fff41bbc85aa93841b86f231f2dbb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 15:53:13 -0500 Subject: [PATCH 189/630] fix travis CI build error due to refactoring --- examples/mnist/mlp-test.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index 04d917c6543d..feabd1140a89 100644 --- a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -38,9 +38,9 @@ function mnist_fit_and_predict(optimizer, initializer, n_epoch) for i_epoch = 0:n_epoch @test isfile(mx.format("{1}-{2:04d}.params", cp_prefix, i_epoch)) end - mlp_load = mx.load("$cp_prefix-symbol.json", mx.Symbol) + mlp_load = mx.load("$cp_prefix-symbol.json", mx.SymbolicNode) @test mx.to_json(mlp_load) == mx.to_json(mlp) - mlp_load = mx.from_json(readall("$cp_prefix-symbol.json"), mx.Symbol) + mlp_load = mx.from_json(readall("$cp_prefix-symbol.json"), mx.SymbolicNode) @test mx.to_json(mlp_load) == mx.to_json(mlp) 
#-------------------------------------------------------------------------------- From 3e8627d59142e05692c401e06e2b165b2e926832 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 15:57:51 -0500 Subject: [PATCH 190/630] document clean up --- docs/api/nn-factory.rst | 8 ++++++-- docs/api/symbolic-node.rst | 6 ------ src/nn-factory.jl | 8 ++++++-- src/symbolic-node.jl | 6 ------ 4 files changed, 12 insertions(+), 16 deletions(-) diff --git a/docs/api/nn-factory.rst b/docs/api/nn-factory.rst index 02e3d2ca73f1..44569c640da9 100644 --- a/docs/api/nn-factory.rst +++ b/docs/api/nn-factory.rst @@ -10,7 +10,8 @@ common neural networks. .. function:: MLP(input, spec) - Construct a multi-layer perceptron. + Construct a multi-layer perceptron. A MLP is a multi-layer neural network with + fully connected layers. :param SymbolicNode input: the input to the mlp. :param spec: the mlp specification, a list of hidden dimensions. For example, @@ -21,9 +22,12 @@ common neural networks. :param Base.Symbol hidden_activation: keyword argument, default ``:relu``, indicating the default activation for hidden layers. The specification here could be overwritten by layer-wise specification in the ``spec`` argument. Also activation is not - applied to the last, i.e. the prediction layer. + applied to the last, i.e. the prediction layer. See :func:`Activation` for a + list of supported activation types. :param prefix: keyword argument, default ``gensym()``, used as the prefix to name the constructed layers. + :return: the constructed MLP. + diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 9386c10a8614..bead11843799 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -9,12 +9,6 @@ Symbolic API SymbolicNode is the basic building block of the symbolic graph in MXNet.jl. - .. note:: - - Throughout this documentation, ``SymbolicNode`` always refer to this :class:`SymbolicNode` type. 
- When we refer to the Julia's build-in SymbolicNode type (e.g. ``typeof(:foo)``), we always - say ``Base.Symbol``. - diff --git a/src/nn-factory.jl b/src/nn-factory.jl index 79aec78a1746..984f50a5f782 100644 --- a/src/nn-factory.jl +++ b/src/nn-factory.jl @@ -9,7 +9,8 @@ common neural networks. #=doc .. function:: MLP(input, spec) - Construct a multi-layer perceptron. + Construct a multi-layer perceptron. A MLP is a multi-layer neural network with + fully connected layers. :param SymbolicNode input: the input to the mlp. :param spec: the mlp specification, a list of hidden dimensions. For example, @@ -20,9 +21,12 @@ common neural networks. :param Base.Symbol hidden_activation: keyword argument, default ``:relu``, indicating the default activation for hidden layers. The specification here could be overwritten by layer-wise specification in the ``spec`` argument. Also activation is not - applied to the last, i.e. the prediction layer. + applied to the last, i.e. the prediction layer. See :func:`Activation` for a + list of supported activation types. :param prefix: keyword argument, default ``gensym()``, used as the prefix to name the constructed layers. + + :return: the constructed MLP. =# function MLP(input, spec; hidden_activation::Base.Symbol=:relu, prefix=gensym()) spec = convert(Vector{Union{Int,Tuple}}, spec) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index b33c89c18616..6258810b0a34 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -7,12 +7,6 @@ Symbolic API .. class:: SymbolicNode SymbolicNode is the basic building block of the symbolic graph in MXNet.jl. - - .. note:: - - Throughout this documentation, ``SymbolicNode`` always refer to this :class:`SymbolicNode` type. - When we refer to the Julia's build-in SymbolicNode type (e.g. ``typeof(:foo)``), we always - say ``Base.Symbol``. 
=# type SymbolicNode handle :: MX_SymbolHandle From be8cbdace438a9faf7b5a617bba1799574477b1d Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 16:13:19 -0500 Subject: [PATCH 191/630] more test for IO --- test/unittest/io.jl | 2 ++ 1 file changed, 2 insertions(+) diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 8ef3b57d948c..39e37f1bfe9a 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -51,9 +51,11 @@ function test_arrays_impl(data::Vector, label::Vector, provider::mx.ArrayDataPro for (d1, (_, d2)) in zip(data, mx.provide_data(provider)) @test size(d1)[1:end-1] == d2[1:end-1] + @test batch_size == d2[end] end for (d1, (_, d2)) in zip(label, mx.provide_label(provider)) @test size(d1)[1:end-1] == d2[1:end-1] + @test batch_size == d2[end] end info("IO::Array::#data=$(length(data)),#label=$(length(label)),batch_size=$batch_size") From b49dc626b0bd60953b4cc1c0a78129e6d0b0c342 Mon Sep 17 00:00:00 2001 From: = <=> Date: Mon, 9 Nov 2015 19:32:40 -0500 Subject: [PATCH 192/630] update doc (Symbol -> SymbolicNode) --- docs/api/io.rst | 4 +- docs/api/symbolic-node.rst | 112 ++++++++++++++++++------------------- src/symbolic-node.jl | 2 +- src/util.jl | 5 +- 4 files changed, 63 insertions(+), 60 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index e9d9c04e9f3c..6c9d71836108 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -317,7 +317,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -460,7 +460,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :return: the constructed :class:`MXDataProvider`. 
diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index bead11843799..f811d41aaad5 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -36,13 +36,13 @@ Public APIs Apply activation function to input. :param data: Input data to activation function. - :type data: Symbol + :type data: SymbolicNode :param act_type: Activation function to be applied. :type act_type: {'relu', 'sigmoid', 'tanh'}, required - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -55,7 +55,7 @@ Public APIs Apply batch normalization to input. :param data: Input data to batch normalization - :type data: Symbol + :type data: SymbolicNode :param eps: Epsilon to prevent div 0 @@ -65,7 +65,7 @@ Public APIs :param momentum: Momentum for moving average :type momentum: float, optional, default=0.1 - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -78,9 +78,9 @@ Public APIs Get output from a symbol and pass 0 gradient back :param data: Input data. - :type data: Symbol + :type data: SymbolicNode - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -97,7 +97,7 @@ Public APIs :param num_args: Number of inputs to be concated. :type num_args: int, required - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. 
@@ -110,15 +110,15 @@ Public APIs Apply convolution to input then add a bias. :param data: Input data to the ConvolutionOp. - :type data: Symbol + :type data: SymbolicNode :param weight: Weight matrix. - :type weight: Symbol + :type weight: SymbolicNode :param bias: Bias parameter. - :type bias: Symbol + :type bias: SymbolicNode :param kernel: convolution kernel size: (y, x) @@ -148,7 +148,7 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=False - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -161,15 +161,15 @@ Public APIs Apply deconvolution to input then add a bias. :param data: Input data to the DeconvolutionOp. - :type data: Symbol + :type data: SymbolicNode :param weight: Weight matrix. - :type weight: Symbol + :type weight: SymbolicNode :param bias: Bias parameter. - :type bias: Symbol + :type bias: SymbolicNode :param kernel: deconvolution kernel size: (y, x) @@ -199,7 +199,7 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=True - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -212,13 +212,13 @@ Public APIs Apply dropout to input :param data: Input data to dropout. - :type data: Symbol + :type data: SymbolicNode :param p: Fraction of the input that gets dropped out at training time :type p: float, optional, default=0.5 - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. 
@@ -235,7 +235,7 @@ Public APIs :param num_args: Number of inputs to be sumed. :type num_args: int, required - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -248,9 +248,9 @@ Public APIs Flatten input :param data: Input data to flatten. - :type data: Symbol + :type data: SymbolicNode - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -263,15 +263,15 @@ Public APIs Apply matrix multiplication to input then add a bias. :param data: Input data to the FullyConnectedOp. - :type data: Symbol + :type data: SymbolicNode :param weight: Weight matrix. - :type weight: Symbol + :type weight: SymbolicNode :param bias: Bias parameter. - :type bias: Symbol + :type bias: SymbolicNode :param num_hidden: Number of hidden nodes of the output. @@ -281,7 +281,7 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=False - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -294,7 +294,7 @@ Public APIs Apply convolution to input then add a bias. :param data: Input data to the ConvolutionOp. - :type data: Symbol + :type data: SymbolicNode :param alpha: value of the alpha variance scaling parameter in the normalization formula @@ -312,7 +312,7 @@ Public APIs :param nsize: normalization window width in elements. :type nsize: int (non-negative), required - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. 
+ :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -325,7 +325,7 @@ Public APIs Apply activation function to input. :param data: Input data to activation function. - :type data: Symbol + :type data: SymbolicNode :param act_type: Activation function to be applied. @@ -343,7 +343,7 @@ Public APIs :param upper_bound: Upper bound of random slope. (For rrelu only) :type upper_bound: float, optional, default=0.334 - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -356,13 +356,13 @@ Public APIs Use linear regression for final output, this is used on final output of a net. :param data: Input data to function. - :type data: Symbol + :type data: SymbolicNode :param label: Input label to function. - :type label: Symbol + :type label: SymbolicNode - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -376,13 +376,13 @@ Public APIs Logistic regression is suitable for binary classification or probability prediction tasks. :param data: Input data to function. - :type data: Symbol + :type data: SymbolicNode :param label: Input label to function. - :type label: Symbol + :type label: SymbolicNode - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -395,7 +395,7 @@ Public APIs Perform spatial pooling on inputs. :param data: Input data to the pooling operator. 
- :type data: Symbol + :type data: SymbolicNode :param kernel: pooling kernel size: (y, x) @@ -413,7 +413,7 @@ Public APIs :param pad: pad for pooling: (y, x) :type pad: Shape(tuple), optional, default=(0, 0) - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -426,13 +426,13 @@ Public APIs Reshape input to target shape :param data: Input data to reshape. - :type data: Symbol + :type data: SymbolicNode :param target_shape: Target new shape :type target_shape: Shape(tuple), required - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -447,7 +447,7 @@ Public APIs :param num_outputs: Number of outputs to be sliced. :type num_outputs: int, required - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -460,7 +460,7 @@ Public APIs DEPRECATED: Perform a softmax transformation on input. Please use SoftmaxOutput :param data: Input data to softmax. - :type data: Symbol + :type data: SymbolicNode :param grad_scale: Scale the gradient by a float factor @@ -470,7 +470,7 @@ Public APIs :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. 
@@ -483,7 +483,7 @@ Public APIs Perform a softmax transformation on input, backprop with logloss. :param data: Input data to softmax. - :type data: Symbol + :type data: SymbolicNode :param grad_scale: Scale the gradient by a float factor @@ -493,7 +493,7 @@ Public APIs :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -506,9 +506,9 @@ Public APIs Take exp of the src :param src: Source symbolic input to the function - :type src: Symbol + :type src: SymbolicNode - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -521,9 +521,9 @@ Public APIs Take log of the src :param src: Source symbolic input to the function - :type src: Symbol + :type src: SymbolicNode - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -536,9 +536,9 @@ Public APIs Take sqrt of the src :param src: Source symbolic input to the function - :type src: Symbol + :type src: SymbolicNode - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. 
@@ -551,9 +551,9 @@ Public APIs Take square of the src :param src: Source symbolic input to the function - :type src: Symbol + :type src: SymbolicNode - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -571,7 +571,7 @@ Internal APIs Perform an elementwise div. - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -583,7 +583,7 @@ Internal APIs Perform an elementwise minus. - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -595,7 +595,7 @@ Internal APIs Perform an elementwise mul. - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -614,7 +614,7 @@ Internal APIs :param need_top_grad: Whether this layer needs out grad for backward. Should be false for loss layers. :type need_top_grad: boolean, optional, default=True - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -626,7 +626,7 @@ Internal APIs Perform an elementwise plus. - :param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional. + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. 
diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 6258810b0a34..7f993c7491b5 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -302,7 +302,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) f_desc *= "This function support variable length positional :class:`SymbolicNode` inputs.\n\n" end f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param Base.Symbol name: The name of the SymbolicNode. (e.g. `:my_symbol`), optional.\n\n" + f_desc *= ":param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional.\n\n" f_desc *= ":return: the constructed :class:`SymbolicNode`.\n\n" return (func_name, f_desc) end diff --git a/src/util.jl b/src/util.jl index 4ca613cbf7d1..be27d1e2310c 100644 --- a/src/util.jl +++ b/src/util.jl @@ -47,6 +47,9 @@ end # Internal Utilities ################################################################################ const DOC_EMBED_ANCHOR = "**autogen:EMBED:{1}:EMBED:autogen**" +function _format_typestring(typestr :: AbstractString) + replace(typestr, r"\bSymbol\b", "SymbolicNode") +end function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{char_pp}, arg_descs::Ref{char_pp}, remove_dup::Bool=true) param_keys = Set{AbstractString}() @@ -62,7 +65,7 @@ function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{ch end push!(param_keys, arg_name) - arg_type = bytestring(arg_types[i]) + arg_type = _format_typestring(bytestring(arg_types[i])) arg_desc = bytestring(arg_descs[i]) push!(docstrings, ":param $arg_name: $arg_desc\n:type $arg_name: $arg_type\n\n") end From 591871cd0cbf0e411a7d16f5a05b80f34e92bc7b Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 9 Nov 2015 23:59:20 -0500 Subject: [PATCH 193/630] add doc for metrics --- docs/api/io.rst | 4 ++-- docs/api/metric.rst | 46 +++++++++++++++++++++++++++++++++++++++++++++ docs/build-api.jl | 1 + docs/index.rst | 1 + 
src/metric.jl | 43 ++++++++++++++++++++++++++++++++++++++++++ 5 files changed, 93 insertions(+), 2 deletions(-) create mode 100644 docs/api/metric.rst diff --git a/docs/api/io.rst b/docs/api/io.rst index 6c9d71836108..e9d9c04e9f3c 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -317,7 +317,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -460,7 +460,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :return: the constructed :class:`MXDataProvider`. diff --git a/docs/api/metric.rst b/docs/api/metric.rst new file mode 100644 index 000000000000..db18ae731a59 --- /dev/null +++ b/docs/api/metric.rst @@ -0,0 +1,46 @@ + +Evaluation Metrics +================== + +Evaluation metrics provide a way to evaluate the performance of a learned model. +This is typically used during training to monitor performance on the validation +set. + + + + +.. class:: AbstractEvalMetric + + The base class for all evaluation metrics. The sub-types should implement the following + interfaces. + + .. function:: update!(metric, labels, preds) + + Update and accumulate metrics. + + :param AbstractEvalMetric metric: the metric object. + :param labels: the labels from the data provider. + :type labels: Vector{NDArray} + :param preds: the outputs (predictions) of the network. + :type preds: Vector{NDArray} + + .. function:: reset!(metric) + + Reset the accumulation counter. + + .. function:: get(metric) + + Get the accumulated metrics. + + :return: ``Vector{Tuple{Base.Symbol, Real}}``, a list of name-value pairs. For + example, ``[(:accuracy, 0.9)]``. + + + + +.. 
class:: Accuracy + + Multiclass classification accuracy. + + + diff --git a/docs/build-api.jl b/docs/build-api.jl index d49996a24cb3..99ae5ad1c709 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -89,6 +89,7 @@ extract_doc("callback.rst", "callback.jl") extract_doc("model.rst", "model.jl") extract_doc("optimizer.rst", "optimizer.jl") +extract_doc("metric.rst", "metric.jl") extract_doc("io.rst", "io.jl") embed_mxnet_api("io.rst", "io", mx._import_io_iterators) diff --git a/docs/index.rst b/docs/index.rst index c10f44780a2b..da28e3080440 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -36,6 +36,7 @@ For more details, see documentation below. Please also checkout the `examples api/initializer api/optimizer api/callback + api/metric api/io api/ndarray api/symbolic-node diff --git a/src/metric.jl b/src/metric.jl index c88239ab8cc8..73e4b9a30a7b 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -1,5 +1,46 @@ +#=doc +Evaluation Metrics +================== + +Evaluation metrics provide a way to evaluate the performance of a learned model. +This is typically used during training to monitor performance on the validation +set. +=# + +#=doc +.. class:: AbstractEvalMetric + + The base class for all evaluation metrics. The sub-types should implement the following + interfaces. + + .. function:: update!(metric, labels, preds) + + Update and accumulate metrics. + + :param AbstractEvalMetric metric: the metric object. + :param labels: the labels from the data provider. + :type labels: Vector{NDArray} + :param preds: the outputs (predictions) of the network. + :type preds: Vector{NDArray} + + .. function:: reset!(metric) + + Reset the accumulation counter. + + .. function:: get(metric) + + Get the accumulated metrics. + + :return: ``Vector{Tuple{Base.Symbol, Real}}``, a list of name-value pairs. For + example, ``[(:accuracy, 0.9)]``. +=# abstract AbstractEvalMetric +#=doc +.. class:: Accuracy + + Multiclass classification accuracy. 
+=# type Accuracy <: AbstractEvalMetric acc_sum :: Float64 n_sample :: Int @@ -35,3 +76,5 @@ function reset!(metric :: Accuracy) metric.acc_sum = 0.0 metric.n_sample = 0 end + + From 2b85c9caf5ee5621308fb8c57976fb26baa35418 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 10 Nov 2015 00:29:20 -0500 Subject: [PATCH 194/630] share NDArray data with Julia Array. --- src/ndarray.jl | 53 +++++++++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 52 insertions(+), 1 deletion(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 82293d2fdbe9..eceabb3eb5be 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -368,13 +368,64 @@ end #=doc .. function:: convert(::Type{Array{T}}, arr :: NDArray) - Convert an :class:`NDArray` into a Julia ``Array`` of specific type. + Convert an :class:`NDArray` into a Julia ``Array`` of specific type. Data will be copied. =# # Convert copy: NDArray -> Julia Array function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) convert(t, copy(arr)) end +# NOTE: internal use only. Accessing pointers on a different device (e.g. accessing GPU +# pointers from CPU) leads to undefined behavior. +import Base.pointer +function pointer(arr :: NDArray) + pdata = Ref{Ptr{MX_float}}(0) + @mxcall(:MXNDArrayGetData, (MX_handle, Ref{Ptr{MX_float}}), arr, pdata) + return pdata[] +end +#=doc +.. function:: try_get_shared(arr) + + Try to create a Julia array by sharing the data with the underlying :class:`NDArray`. + + :param NDArray arr: the array to be shared. + + .. warning:: + + The returned array does not guarantee to share data with the underlying :class:`NDArray`. + In particular, data sharing is possible only when the :class:`NDArray` lives on CPU. +=# +function try_get_shared(arr :: NDArray) + if context(arr).device_type == CPU + # try to do data sharing + vec = pointer_to_array(pointer(arr), length(arr)) + return reshape(vec, size(arr)) + else + # impossible to share, just copying + return copy(arr) + end +end + +#=doc +.. 
function:: is_shared(j_arr, arr) + + Test whether ``j_arr`` is sharing data with ``arr``. + + :param Array j_arr: the Julia Array. + :param NDArray arr: the :class:`NDArray`. +=# +function is_shared{T}(j_arr :: Array{T}, arr :: NDArray) + false +end +function is_shared(j_arr :: Array{MX_float}, arr :: NDArray) + if length(j_arr) != length(arr) + return false + end + if context(arr).device_type != CPU + return false + end + return pointer(j_arr) == pointer(arr) +end #=doc Basic arithmetics From 2055727383eb3d135b2619eab719687c4afd83a0 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 10 Nov 2015 01:41:10 -0500 Subject: [PATCH 195/630] nd_as_jl macro --- src/ndarray.jl | 212 +++++++++++++++++++++++++++++++++++++------------ 1 file changed, 160 insertions(+), 52 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index eceabb3eb5be..9fc86002fcad 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -375,58 +375,6 @@ function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) convert(t, copy(arr)) end -# NOTE: internal use only. Accessing pointers on a different device (e.g. accessing GPU -# pointers from CPU) leads to undefined behavior. -import Base.pointer -function pointer(arr :: NDArray) - pdata = Ref{Ptr{MX_float}}(0) - @mxcall(:MXNDArrayGetData, (MX_handle, Ref{Ptr{MX_float}}), arr, pdata) - return pdata[] -end -#=doc -.. function:: try_get_shared(arr) - - Try to create a Julia array by sharing the data with the underlying :class:`NDArray`. - - :param NDArray arr: the array to be shared. - - .. warning:: - - The returned array does not guarantee to share data with the underlying :class:`NDArray`. - In particular, data sharing is possible only when the :class:`NDArray` lives on CPU. 
-=# -function try_get_shared(arr :: NDArray) - if context(arr).device_type == CPU - # try to do data sharing - vec = pointer_to_array(pointer(arr), length(arr)) - return reshape(vec, size(arr)) - else - # impossible to share, just copying - return copy(arr) - end -end - -#=doc -.. function:: is_shared(j_arr, arr) - - Test whether ``j_arr`` is sharing data with ``arr``. - - :param Array j_arr: the Julia Array. - :param NDArray arr: the :class:`NDArray`. -=# -function is_shared{T}(j_arr :: Array{T}, arr :: NDArray) - false -end -function is_shared(j_arr :: Array{MX_float}, arr :: NDArray) - if length(j_arr) != length(arr) - return false - end - if context(arr).device_type != CPU - return false - end - return pointer(j_arr) == pointer(arr) -end - #=doc Basic arithmetics ----------------- @@ -634,6 +582,166 @@ function /(arg0 :: NDArray, arg :: Real) ./(arg0, arg) end + +#=doc +Manipulating as Julia Arrays +---------------------------- + +.. function:: @nd_as_jl(captures..., statement) + + A convenient macro that allows to operate :class:`NDArray` as Julia Arrays. For example, + + .. code-block:: julia + + x = mx.zeros(3,4) + y = mx.ones(3,4) + z = mx.zeros((3,4), mx.gpu()) + + @mx.nd_as_jl ro=(x,y) rw=z begin + # now x, y, z are just ordinary Julia Arrays + z[:,1] = y[:,2] + z[:,2] = 5 + end + + Under the hood, the macro convert all the declared captures from :class:`NDArray` into Julia + Arrays, by using :func:`try_get_shared`. And automatically commit the modifications back into + the :class:`NDArray` that is declared as ``rw``. This is useful for fast prototyping and when + implement non-critical computations, such as :class:`AbstractEvalMetric`. + + .. note:: + + - Multiple ``rw`` and / or ``ro`` capture declaration could be made. + - The macro does **not** check to make sure that ``ro`` captures are not modified. 
If the + original :class:`NDArray` lives in CPU memory, then it is very likely the corresponding + Julia Array shares data with the :class:`NDArray`, so modifying the Julia Array will also + modify the underlying :class:`NDArray`. + - When an :class:`NDArray` is declared to be captured as ``rw``, its contents is always sync + back in the end. + - The execution results of the expanded macro is always ``nothing``. + - The statements are wrapped in a ``let``, thus locally introduced new variables will not be + available after the statements. So you will need to declare the variables before calling the + macro if needed. +=# +macro nd_as_jl(m_args...) + @assert(length(m_args) > 0) + stmts = m_args[end] + @assert(isa(stmts, Expr) && stmts.head == :block, + "The last argument should be a statement block (begin-end); but get $stmts") + stmts = esc(stmts) + + dclrs = m_args[1:end-1] + nd_ro = [] + nd_rw = [] + nd_all = [] + for declr in dclrs + @assert(isa(declr, Expr) && declr.head == :(=) && length(declr.args)==2 && declr.args[1] ∈ (:ro,:rw), + "Invalid declaration, should be rw=(x,y) or ro=z; but get $declr") + + declr_vars = declr.args[2] + if isa(declr_vars, Symbol) + declr_vars = (declr_vars,) + elseif isa(declr_vars, Expr) + @assert(declr_vars.head ∈ (:tuple, :vect), + "Capture declaration should be a variable or a tuple of variables; but got $declr_vars") + declr_vars = declr_vars.args + else + @assert(false, "Capture declaration should be a variable or a tuple of variables; but got $declr_vars") + end + for declr_var in declr_vars + @assert(isa(declr_var, Symbol), + "Captured ndarrays in ro/rw declaration should be variables, but get $(declr_var)") + end + append!(nd_all, [declr_vars...]) + if declr.args[1] == :ro + append!(nd_ro, [declr_vars...]) + else + append!(nd_rw, [declr_vars...]) + end + end + + nd_ro = map(esc, nd_ro) + nd_rw = map(esc, nd_rw) + nd_all = map(esc, nd_all) + rw_origs = [gensym() for _ in nd_rw] + + save_statements = Expr(:block, [:($v_orig 
= $v) for (v_orig, v) in zip(rw_origs, nd_rw)]...) + clear_statements = Expr(:block, [:($v_orig = nothing) for v_orig in rw_origs]...) + let_assignments = [:($v = try_get_shared($v)) for v in nd_all] + sync_statements = map(rw_origs, nd_rw) do v_orig, v + quote + if !is_shared($v, $v_orig) + # copy data back if not or no longer sharing data + copy!($v_orig, $v) + end + end + end + sync_statements = Expr(:block, sync_statements...) + + let_statement = Expr(:let, quote + $sync_statements + end, let_assignments...) + m_body = quote + $save_statements + $let_statement + $clear_statements + nothing # the final results is always nothing + end + + m_body +end + +# NOTE: internal use only. Accessing pointers on a different device (e.g. accessing GPU +# pointers from CPU) leads to undefined behavior. +import Base.pointer +function pointer(arr :: NDArray) + pdata = Ref{Ptr{MX_float}}(0) + @mxcall(:MXNDArrayGetData, (MX_handle, Ref{Ptr{MX_float}}), arr, pdata) + return pdata[] +end +#=doc +.. function:: try_get_shared(arr) + + Try to create a Julia array by sharing the data with the underlying :class:`NDArray`. + + :param NDArray arr: the array to be shared. + + .. warning:: + + The returned array does not guarantee to share data with the underlying :class:`NDArray`. + In particular, data sharing is possible only when the :class:`NDArray` lives on CPU. +=# +function try_get_shared(arr :: NDArray) + if context(arr).device_type == CPU + # try to do data sharing + vec = pointer_to_array(pointer(arr), length(arr)) + return reshape(vec, size(arr)) + else + # impossible to share, just copying + return copy(arr) + end +end + +#=doc +.. function:: is_shared(j_arr, arr) + + Test whether ``j_arr`` is sharing data with ``arr``. + + :param Array j_arr: the Julia Array. + :param NDArray arr: the :class:`NDArray`. 
+=# +function is_shared{T}(j_arr :: Array{T}, arr :: NDArray) + false +end +function is_shared(j_arr :: Array{MX_float}, arr :: NDArray) + if length(j_arr) != length(arr) + return false + end + if context(arr).device_type != CPU + return false + end + return pointer(j_arr) == pointer(arr) +end + #=doc IO -- From ea90b55aef0385134018634473c63434fdffffdb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 10 Nov 2015 02:24:50 -0500 Subject: [PATCH 196/630] use nd_as_jl to re-write accuracy --- docs/api/ndarray.rst | 71 +++++++++++++++++++++++++++++++++++++++++++- src/metric.jl | 15 +++++----- src/ndarray.jl | 15 ++++++++++ 3 files changed, 92 insertions(+), 9 deletions(-) diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index 05a3dccba7dc..270d85bab837 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -178,7 +178,7 @@ Copying functions .. function:: convert(::Type{Array{T}}, arr :: NDArray) - Convert an :class:`NDArray` into a Julia ``Array`` of specific type. + Convert an :class:`NDArray` into a Julia ``Array`` of specific type. Data will be copied. @@ -296,6 +296,75 @@ Basic arithmetics +Manipulating as Julia Arrays +---------------------------- + +.. function:: @nd_as_jl(captures..., statement) + + A convenient macro that allows to operate :class:`NDArray` as Julia Arrays. For example, + + .. code-block:: julia + + x = mx.zeros(3,4) + y = mx.ones(3,4) + z = mx.zeros((3,4), mx.gpu()) + + @mx.nd_as_jl ro=(x,y) rw=z begin + # now x, y, z are just ordinary Julia Arrays + z[:,1] = y[:,2] + z[:,2] = 5 + end + + Under the hood, the macro convert all the declared captures from :class:`NDArray` into Julia + Arrays, by using :func:`try_get_shared`. And automatically commit the modifications back into + the :class:`NDArray` that is declared as ``rw``. This is useful for fast prototyping and when + implement non-critical computations, such as :class:`AbstractEvalMetric`. + + .. 
note:: + + - Multiple ``rw`` and / or ``ro`` capture declaration could be made. + - The macro does **not** check to make sure that ``ro`` captures are not modified. If the + original :class:`NDArray` lives in CPU memory, then it is very likely the corresponding + Julia Array shares data with the :class:`NDArray`, so modifying the Julia Array will also + modify the underlying :class:`NDArray`. + - More importantly, since the :class:`NDArray` is + asynchronized, we will wait for *writing* for ``rw`` variables but wait only for *reading* + in ``ro`` variables. If we write into those ``ro`` variables, **and** if the memory is + shared, racing condition might happen, and the behavior is undefined. + - When an :class:`NDArray` is declared to be captured as ``rw``, its contents is always sync + back in the end. + - The execution results of the expanded macro is always ``nothing``. + - The statements are wrapped in a ``let``, thus locally introduced new variables will not be + available after the statements. So you will need to declare the variables before calling the + macro if needed. + + + + +.. function:: try_get_shared(arr) + + Try to create a Julia array by sharing the data with the underlying :class:`NDArray`. + + :param NDArray arr: the array to be shared. + + .. warning:: + + The returned array does not guarantee to share data with the underlying :class:`NDArray`. + In particular, data sharing is possible only when the :class:`NDArray` lives on CPU. + + + + +.. function:: is_shared(j_arr, arr) + + Test whether ``j_arr`` is sharing data with ``arr``. + + :param Array j_arr: the Julia Array. + :param NDArray arr: the :class:`NDArray`. 
+ + + + IO -- diff --git a/src/metric.jl b/src/metric.jl index 73e4b9a30a7b..297aee384079 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -49,14 +49,13 @@ type Accuracy <: AbstractEvalMetric end function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) - label = copy(label) - pred = copy(pred) - - n_sample = size(pred)[end] - metric.n_sample += n_sample - for i = 1:n_sample - klass = indmax(pred[:,i]) - metric.acc_sum += (klass-1) == label[i] + @nd_as_jl ro=(label,pred) begin + n_sample = size(pred)[end] + metric.n_sample += n_sample + for i = 1:n_sample + klass = indmax(pred[:,i]) + metric.acc_sum += (klass-1) == label[i] + end end end diff --git a/src/ndarray.jl b/src/ndarray.jl index 9fc86002fcad..e477bf6fd2f4 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -615,6 +615,10 @@ Manipulating as Julia Arrays original :class:`NDArray` lives in CPU memory, then it is very likely the corresponding Julia Array shares data with the :class:`NDArray`, so modifying the Julia Array will also modify the underlying :class:`NDArray`. + - More importantly, since the :class:`NDArray` is + asynchronized, we will wait for *writing* for ``rw`` variables but wait only for *reading* + in ``ro`` variables. If we write into those ``ro`` variables, **and** if the memory is + shared, racing condition might happen, and the behavior is undefined. - When an :class:`NDArray` is declared to be captured as ``rw``, its contents is always sync back in the end. - The execution results of the expanded macro is always ``nothing``. @@ -665,6 +669,8 @@ macro nd_as_jl(m_args...) rw_origs = [gensym() for _ in nd_rw] save_statements = Expr(:block, [:($v_orig = $v) for (v_orig, v) in zip(rw_origs, nd_rw)]...) + wait_statements = Expr(:block, [:(_wait_to_read($v)) for v in nd_ro]..., + [:(_wait_to_write($v)) for v in nd_rw]...) clear_statements = Expr(:block, [:($v_orig = nothing) for v_orig in rw_origs]...) 
let_assignments = [:($v = try_get_shared($v)) for v in nd_all] sync_statements = map(rw_origs, nd_rw) do v_orig, v @@ -678,9 +684,11 @@ macro nd_as_jl(m_args...) sync_statements = Expr(:block, sync_statements...) let_statement = Expr(:let, quote + $stmts $sync_statements end, let_assignments...) m_body = quote + $wait_statements $save_statements $let_statement $clear_statements @@ -698,6 +706,13 @@ function pointer(arr :: NDArray) @mxcall(:MXNDArrayGetData, (MX_handle, Ref{Ptr{MX_float}}), arr, pdata) return pdata[] end +function _wait_to_read(arr :: NDArray) + @mxcall(:MXNDArrayWaitToRead, (MX_handle,), arr) +end +function _wait_to_write(arr :: NDArray) + @mxcall(:MXNDArrayWaitToWrite, (MX_handle,), arr) +end + #=doc .. function:: try_get_shared(arr) From b5c0d96af18c9ea341ade0b714a1965c6776fa42 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 11 Nov 2015 13:00:37 +0900 Subject: [PATCH 197/630] reformultate accuracy with multi_output in mind --- src/metric.jl | 26 +++++++++++++++++++++----- 1 file changed, 21 insertions(+), 5 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 297aee384079..12860a5ae0d9 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -50,11 +50,27 @@ end function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) @nd_as_jl ro=(label,pred) begin - n_sample = size(pred)[end] - metric.n_sample += n_sample - for i = 1:n_sample - klass = indmax(pred[:,i]) - metric.acc_sum += (klass-1) == label[i] + if ndims(label) > 1 # Multidimensional case + # Construct cartesian index + initial = tuple([1 for _ in 1:ndims(label)-1]...) + final = tuple([size(label, i) for i in 1:ndims(label)-1]...) 
+ crange = CartesianRange(CartesianIndex(initial), CartesianIndex(final)) + + for sample in 1:size(label, ndims(label)) + for i in crange + ps = sub(pred, i.I..., :, sample) + klass = indmax(ps) + metric.acc_sum += (klass-1) == label[i.I..., sample] + metric.n_sample += 1 + end + end + else # 1-dimensional case + for sample in 1:size(label, 1) + ps = sub(pred, :, sample) + klass = indmax(ps) + metric.acc_sum += (klass-1) == label[sample] + metric.n_sample += 1 + end end end end From 8322b6337f32dbcfe597f6ba95e0d369490eeb3d Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 11 Nov 2015 14:19:13 +0900 Subject: [PATCH 198/630] Calculate accuracy based on size of pred. The label array is reshaped and misses the information about the size of the first few dimensions. --- src/metric.jl | 11 ++++++----- 1 file changed, 6 insertions(+), 5 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 12860a5ae0d9..aed5ca0fede6 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -50,17 +50,18 @@ end function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) @nd_as_jl ro=(label,pred) begin - if ndims(label) > 1 # Multidimensional case + if ndims(pred) > 2 # Multidimensional case # Construct cartesian index - initial = tuple([1 for _ in 1:ndims(label)-1]...) - final = tuple([size(label, i) for i in 1:ndims(label)-1]...) - crange = CartesianRange(CartesianIndex(initial), CartesianIndex(final)) + initial = tuple(fill(1, ndims(pred)-2)...) + dims = size(pred, (1:ndims(pred)-2)...) + crange = CartesianRange(CartesianIndex(initial), CartesianIndex(dims)) for sample in 1:size(label, ndims(label)) for i in crange + l_i = sub2ind(dims, i.I...) 
ps = sub(pred, i.I..., :, sample) klass = indmax(ps) - metric.acc_sum += (klass-1) == label[i.I..., sample] + metric.acc_sum += (klass-1) == label[l_i, sample] metric.n_sample += 1 end end From c30097172a54fffa8d21185bd2c7b7d3ce8bf477 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 11 Nov 2015 14:37:02 +0900 Subject: [PATCH 199/630] remove sub from accuracy --- src/metric.jl | 29 +++++++++++++++++++++++------ 1 file changed, 23 insertions(+), 6 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index aed5ca0fede6..8d5838aff4ba 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -48,27 +48,44 @@ type Accuracy <: AbstractEvalMetric Accuracy() = new(0.0, 0) end +""" +Implementation taken from findmax in Julia base. +Searches for the maximum value in p_dim of a. +I and n are values for the other dimensions. +""" +function _indmax(a, I, p_dim, n) + m = a[I..., 1, n] + mi = 1 + for i in 2:size(a, p_dim) + ai = a[I..., i, n] + if ai > m || m!=m + m = ai + mi = i + end + end + return mi +end + function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) @nd_as_jl ro=(label,pred) begin if ndims(pred) > 2 # Multidimensional case # Construct cartesian index - initial = tuple(fill(1, ndims(pred)-2)...) - dims = size(pred, (1:ndims(pred)-2)...) + p_dim = ndims(pred)-1 + initial = tuple(fill(1,p_dim-1)...) + dims = size(pred, (1:p_dim-1)...) crange = CartesianRange(CartesianIndex(initial), CartesianIndex(dims)) for sample in 1:size(label, ndims(label)) for i in crange l_i = sub2ind(dims, i.I...) 
- ps = sub(pred, i.I..., :, sample) - klass = indmax(ps) + klass = _indmax(pred, i.I, p_dim, sample) metric.acc_sum += (klass-1) == label[l_i, sample] metric.n_sample += 1 end end else # 1-dimensional case for sample in 1:size(label, 1) - ps = sub(pred, :, sample) - klass = indmax(ps) + klass = indmax(pred[:, sample]) metric.acc_sum += (klass-1) == label[sample] metric.n_sample += 1 end From d51d2af73a23ebbed7488a479a9be44261e31972 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 11 Nov 2015 14:44:23 +0900 Subject: [PATCH 200/630] add comments for accuracy and rebuild docs --- docs/api/io.rst | 4 ++-- docs/api/metric.rst | 3 +++ docs/api/symbolic-node.rst | 23 +++++++++++++++++++++++ src/metric.jl | 3 +++ 4 files changed, 31 insertions(+), 2 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index e9d9c04e9f3c..6c9d71836108 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -317,7 +317,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -460,7 +460,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :return: the constructed :class:`MXDataProvider`. diff --git a/docs/api/metric.rst b/docs/api/metric.rst index db18ae731a59..5f13bd7006c3 100644 --- a/docs/api/metric.rst +++ b/docs/api/metric.rst @@ -42,5 +42,8 @@ set. Multiclass classification accuracy. + Calculates the mean accuracy per sample for softmax in one dimension. + For a multi-dimensional softmax the mean accuracy over all dimensions is calculated. 
+ diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index f811d41aaad5..6106b54e6a8f 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -501,6 +501,29 @@ Public APIs +.. function:: SwapAxis(...) + + Apply swapaxis to input. + + :param data: Input data to the SwapAxisOp. + :type data: SymbolicNode + + + :param dim1: the first axis to be swapped. + :type dim1: int (non-negative), optional, default=0 + + + :param dim2: the second axis to be swapped. + :type dim2: int (non-negative), optional, default=0 + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: exp(...) Take exp of the src diff --git a/src/metric.jl b/src/metric.jl index 8d5838aff4ba..3f35e7455ac5 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -40,6 +40,9 @@ abstract AbstractEvalMetric .. class:: Accuracy Multiclass classification accuracy. + + Calculates the mean accuracy per sample for softmax in one dimension. + For a multi-dimensional softmax the mean accuracy over all dimensions is calculated. 
=# type Accuracy <: AbstractEvalMetric acc_sum :: Float64 From 4362525754175dc095a1f6ac9e42a4a4276dee08 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 11 Nov 2015 09:03:36 -0500 Subject: [PATCH 201/630] add nd_as_jl unit test --- test/unittest/ndarray.jl | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index cfab1dea0d86..b7208f532222 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -239,6 +239,27 @@ function test_sqrt() @test reldiff(copy(sqrt_ed), sqrt(j_array)) < 1e-6 end +function test_nd_as_jl() + dims = (2,3) + info("NDArray::nd_as_jl::dims = $dims") + + x = mx.zeros(dims) + 5 + y = mx.ones(dims) + z = mx.zeros(dims) + @mx.nd_as_jl ro=x rw=(y,z) begin + for i = 1:length(z) + z[i] = x[i] + end + + z[:,1] = y[:,1] + y[:] = 0 + end + + @test reldiff(copy(y), 0) < 1e-6 + @test reldiff(copy(z)[:,1], 1) < 1e-6 + @test reldiff(copy(z)[:,2:end], copy(x)[:,2:end]) < 1e-6 +end + ################################################################################ # Run tests @@ -254,5 +275,6 @@ test_gd() test_saveload() test_clip() test_sqrt() +test_nd_as_jl() end From e8846927c3fb0b6585dcd777e5cc0f2b2ae448ad Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 11 Nov 2015 09:50:05 -0500 Subject: [PATCH 202/630] update ipython notebook BGR -> RGB --- .../Prediction with Pre-trained Model.ipynb | 40 +++++++++++++------ .../ijulia-pretrained-predict/imagehelper.py | 4 +- 2 files changed, 31 insertions(+), 13 deletions(-) diff --git a/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb b/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb index 9f4f2b8cb1d3..2d5d0ee7dd97 100644 --- a/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb +++ b/examples/imagenet/ijulia-pretrained-predict/Prediction with Pre-trained Model.ipynb @@ -32,7 +32,7 @@ "image/png": "", "text/plain": [ 
"RGB4 Images.Image with:\n", - " data: 256x256 Array{ColorTypes.RGB4{FixedPointNumbers.UfixedBase{UInt8,8}},2}\n", + " data: 256x256 Array{ColorTypes.RGB4{FixedPointNumbers.UFixed{UInt8,8}},2}\n", " properties:\n", " imagedescription: \n", " spatialorder: x y\n", @@ -45,8 +45,8 @@ } ], "source": [ - "using Images, Colors\n", - "img = imread(\"cat.png\")" + "using Images, Colors, ImageMagick\n", + "img = load(\"cat.png\")" ] }, { @@ -127,11 +127,18 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 7, "metadata": { "collapsed": false }, "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "[09:48:53] src/operator/./softmax_output-inl.h:187: Softmax symbol is renamed to SoftmaxOutput. This API will be deprecated in Dec, 2015\n" + ] + }, { "name": "stdout", "output_type": "stream", @@ -156,7 +163,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 8, "metadata": { "collapsed": false }, @@ -165,7 +172,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "lynx, catamount\n" + "tiger cat\n" ] } ], @@ -186,7 +193,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 9, "metadata": { "collapsed": false }, @@ -195,11 +202,11 @@ "name": "stdout", "output_type": "stream", "text": [ - " lynx, catamount w.p. 0.552236\n", - " tabby, tabby cat w.p. 0.118180\n", - " Persian cat w.p. 0.114004\n", - " Egyptian cat w.p. 0.090389\n", - " tiger cat w.p. 0.086328\n" + " tiger cat w.p. 0.415807\n", + " tabby, tabby cat w.p. 0.235859\n", + " Egyptian cat w.p. 0.161553\n", + " lynx, catamount w.p. 0.136078\n", + " Persian cat w.p. 0.007109\n" ] } ], @@ -213,6 +220,15 @@ " println(mx.format(\"{1:>18} w.p. 
{2:4f}\", l, p))\n", "end" ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [] } ], "metadata": { diff --git a/examples/imagenet/ijulia-pretrained-predict/imagehelper.py b/examples/imagenet/ijulia-pretrained-predict/imagehelper.py index bdaade19ff28..7584b45d9313 100644 --- a/examples/imagenet/ijulia-pretrained-predict/imagehelper.py +++ b/examples/imagenet/ijulia-pretrained-predict/imagehelper.py @@ -20,7 +20,9 @@ def PreprocessImage(img): # WRONG channel will lead to WRONG result #------------------------------------------------------------------- # swap channel from RGB to BGR - sample = sample[:, :, [2,1,0]] + # sample = sample[:, :, [2,1,0]] + sample = sample[:, :, [0,1,2]] # actually, in this pre-trained model RGB is used + # swap axes to make image from (224, 224, 4) to (3, 224, 224) sample = np.swapaxes(sample, 0, 2) sample = np.swapaxes(sample, 1, 2) From 32267131f83095a34676102ebd1fcf58b73d6d02 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 00:10:09 -0500 Subject: [PATCH 203/630] complete doc for symbolic-node --- docs/api/io.rst | 4 +- docs/api/symbolic-node.rst | 123 +++++++++++++++++++++++++++++++ src/symbolic-node.jl | 146 ++++++++++++++++++++++++++++++------- 3 files changed, 243 insertions(+), 30 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index 6c9d71836108..e9d9c04e9f3c 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -317,7 +317,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -460,7 +460,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, 
default=4 :return: the constructed :class:`MXDataProvider`. diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 6106b54e6a8f..2868bf27681e 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -26,6 +26,129 @@ Symbolic API +.. function:: + call(self :: SymbolicNode, args :: SymbolicNode...) + call(self :: SymbolicNode; kwargs...) + + Make a new node by composing ``self`` with ``args``. Or the arguments + can be specified using keyword arguments. + + + + +.. function:: list_arguments(self :: SymbolicNode) + + List all the arguments of this node. The argument for a node contains both + the inputs and parameters. For example, a :class:`FullyConnected` node will + have both data and weights in its arguments. A composed node (e.g. a MLP) will + list all the arguments for intermediate nodes. + + :return: A list of symbols indicating the names of the arguments. + + + + +.. function:: list_outputs(self :: SymbolicNode) + + List all the outputs of this node. + + :return: A list of symbols indicating the names of the outputs. + + + + +.. function:: list_auxiliary_states(self :: SymbolicNode) + + + List all auxiliary states in the symbool. + + Auxiliary states are special states of symbols that do not corresponds to an argument, + and do not have gradient. But still be useful for the specific operations. + A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. + Most operators do not have Auxiliary states. + + :return: A list of symbols indicating the names of the auxiliary states. + + + + +.. function:: get_internals(self :: SymbolicNode) + + Get a new grouped :class:`SymbolicNode` whose output contains all the internal outputs of + this :class:`SymbolicNode`. + + + + +.. function:: Variable(name :: Union{Base.Symbol, AbstractString}) + + Create a symbolic variable with the given name. This is typically used as a placeholder. 
+ For example, the data node, acting as the starting point of a network architecture. + + + + +.. function:: Group(nodes :: SymbolicNode...) + + Create a :class:`SymbolicNode` by grouping nodes together. + + + + +.. function:: + infer_shape(self :: SymbolicNode; args...) + infer_shape(self :: SymbolicNode; kwargs...) + + Do shape inference according to the input shapes. The input shapes could be provided + as a list of shapes, which should specify the shapes of inputs in the same order as + the arguments returned by :func:`list_arguments`. Alternatively, the shape information + could be specified via keyword arguments. + + :return: A 3-tuple containing shapes of all the arguments, shapes of all the outputs and + shapes of all the auxiliary variables. If shape inference failed due to incomplete + or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. + + + + +.. function:: + getindex(self :: SymbolicNode, idx :: Union{Int, Base.Symbol, AbstractString}) + + Get a node representing the specified output of this node. The index could be + a symbol or string indicating the name of the output, or a 1-based integer + indicating the index, as in the list of :func:`list_outputs`. + + + + +.. function:: to_json(self :: SymbolicNode) + + Convert a :class:`SymbolicNode` into a JSON string. + + + + +.. function:: from_json(repr :: AbstractString, ::Type{SymbolicNode}) + + Load a :class:`SymbolicNode` from a JSON string representation. + + + + +.. function:: load(filename :: AbstractString, ::Type{SymbolicNode}) + + Load a :class:`SymbolicNode` from a JSON file. + + + + +.. function:: save(filename :: AbstractString, node :: SymbolicNode) + + Save a :class:`SymbolicNode` to a JSON file. 
+ + + + libmxnet APIs ------------- diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 7f993c7491b5..8b0a5b4fad5f 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -37,6 +37,14 @@ function Base.copy(self :: SymbolicNode) Base.deepcopy(self) end +#=doc +.. function:: + call(self :: SymbolicNode, args :: SymbolicNode...) + call(self :: SymbolicNode; kwargs...) + + Make a new node by composing ``self`` with ``args``. Or the arguments + can be specified using keyword arguments. +=# function Base.call(self :: SymbolicNode, args :: SymbolicNode...) s = deepcopy(self) _compose!(s, args...) @@ -58,40 +66,81 @@ macro _list_symbol_info(self, func_name) return names end end + +#=doc +.. function:: list_arguments(self :: SymbolicNode) + + List all the arguments of this node. The argument for a node contains both + the inputs and parameters. For example, a :class:`FullyConnected` node will + have both data and weights in its arguments. A composed node (e.g. a MLP) will + list all the arguments for intermediate nodes. + + :return: A list of symbols indicating the names of the arguments. +=# function list_arguments(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListArguments) end + +#=doc +.. function:: list_outputs(self :: SymbolicNode) + + List all the outputs of this node. + + :return: A list of symbols indicating the names of the outputs. +=# function list_outputs(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListOutputs) end -"""List all auxiliary states in the symbool. -Auxiliary states are special states of symbols that do not corresponds to an argument, -and do not have gradient. But still be useful for the specific operations. -A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. -Most operators do not have Auxiliary states. -""" + +#=doc +.. function:: list_auxiliary_states(self :: SymbolicNode) + + + List all auxiliary states in the symbool. 
+ + Auxiliary states are special states of symbols that do not corresponds to an argument, + and do not have gradient. But still be useful for the specific operations. + A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. + Most operators do not have Auxiliary states. + + :return: A list of symbols indicating the names of the auxiliary states. +=# function list_auxiliary_states(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListAuxiliaryStates) end -"Get a new grouped SymbolicNode whose output contains all the internal outputs of this SymbolicNode." +#=doc +.. function:: get_internals(self :: SymbolicNode) + + Get a new grouped :class:`SymbolicNode` whose output contains all the internal outputs of + this :class:`SymbolicNode`. +=# function get_internals(self :: SymbolicNode) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolGetInternals, (MX_handle, Ref{MX_handle}), self, ref_hdr) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -"Create a symbolic variable with the given name" +#=doc +.. function:: Variable(name :: Union{Base.Symbol, AbstractString}) + + Create a symbolic variable with the given name. This is typically used as a placeholder. + For example, the data node, acting as the starting point of a network architecture. +=# function Variable(name :: Union{Base.Symbol, AbstractString}) hdr_ref = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) SymbolicNode(MX_SymbolHandle(hdr_ref[])) end -"Create a SymbolicNode that groups symbols together" -function Group(symbols :: SymbolicNode...) - handles = MX_handle[symbols...] +#=doc +.. function:: Group(nodes :: SymbolicNode...) + + Create a :class:`SymbolicNode` by grouping nodes together. +=# +function Group(nodes :: SymbolicNode...) + handles = MX_handle[nodes...] 
ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateGroup, (MX_uint, Ptr{MX_handle}, Ref{MX_handle}), length(handles), handles, ref_hdr) @@ -141,6 +190,21 @@ macro _infer_shape(self, keys, indptr, sdata) end end end + +#=doc +.. function:: + infer_shape(self :: SymbolicNode; args...) + infer_shape(self :: SymbolicNode; kwargs...) + + Do shape inference according to the input shapes. The input shapes could be provided + as a list of shapes, which should specify the shapes of inputs in the same order as + the arguments returned by :func:`list_arguments`. Alternatively, the shape information + could be specified via keyword arguments. + + :return: A 3-tuple containing shapes of all the arguments, shapes of all the outputs and + shapes of all the auxiliary variables. If shape inference failed due to incomplete + or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. +=# function infer_shape(self :: SymbolicNode; kwargs...) sdata = MX_uint[] indptr = MX_uint[0] @@ -163,6 +227,14 @@ function infer_shape(self :: SymbolicNode, args :: Union{Tuple, Void}...) @_infer_shape(self, keys, indptr, sdata) end +#=doc +.. function:: + getindex(self :: SymbolicNode, idx :: Union{Int, Base.Symbol, AbstractString}) + + Get a node representing the specified output of this node. The index could be + a symbol or string indicating the name of the output, or a 1-based integer + indicating the index, as in the list of :func:`list_outputs`. +=# function Base.getindex(self :: SymbolicNode, idx :: Union{Base.Symbol, AbstractString}) idx = symbol(idx) i_idx = find(idx .== list_outputs(self)) @@ -211,7 +283,7 @@ function ./(self :: SymbolicNode, arg :: SymbolicNode) _Div(self, arg) end -function _compose!(sym :: SymbolicNode; kwargs...) +function _compose!(node :: SymbolicNode; kwargs...) name = char_p(0) arg_keys = AbstractString[] arg_vals = MX_handle[] @@ -228,45 +300,63 @@ function _compose!(sym :: SymbolicNode; kwargs...) 
@mxcall(:MXSymbolCompose, (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}), - sym, name, length(arg_keys), arg_keys, arg_vals) - return sym + node, name, length(arg_keys), arg_keys, arg_vals) + return node end -function _compose!(sym :: SymbolicNode, args::SymbolicNode...) - _compose!(sym, char_p(0), args...) +function _compose!(node :: SymbolicNode, args::SymbolicNode...) + _compose!(node, char_p(0), args...) end -function _compose!(sym :: SymbolicNode, name :: Union{Base.Symbol, char_p}, args::SymbolicNode...) +function _compose!(node :: SymbolicNode, name :: Union{Base.Symbol, char_p}, args::SymbolicNode...) if isa(name, Base.Symbol); name = string(name); end arg_keys = Ptr{char_p}(0) arg_vals = MX_handle[args...] @mxcall(:MXSymbolCompose, (MX_handle, char_p, MX_uint, Ptr{char_p}, Ptr{MX_handle}), - sym, name, length(arg_vals), arg_keys, arg_vals) - return sym + node, name, length(arg_vals), arg_keys, arg_vals) + return node end -"""Save SymbolicNode into a JSON string""" +#=doc +.. function:: to_json(self :: SymbolicNode) + + Convert a :class:`SymbolicNode` into a JSON string. +=# function to_json(self :: SymbolicNode) ref_json = Ref{char_p}(0) @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json) return bytestring(ref_json[]) end -"""Load SymbolicNode from a JSON string representation.""" +#=doc +.. function:: from_json(repr :: AbstractString, ::Type{SymbolicNode}) + + Load a :class:`SymbolicNode` from a JSON string representation. +=# function from_json(repr :: AbstractString, ::Type{SymbolicNode}) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateFromJSON, (char_p, Ref{MX_handle}), repr, ref_hdr) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -"""Load SymbolicNode from a JSON file.""" +#=doc +.. function:: load(filename :: AbstractString, ::Type{SymbolicNode}) + + Load a :class:`SymbolicNode` from a JSON file. 
+=# function load(filename :: AbstractString, ::Type{SymbolicNode}) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateFromFile, (char_p, Ref{MX_handle}), filename, ref_hdr) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -function save(filename :: AbstractString, sym :: SymbolicNode) - @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), sym, filename) + +#=doc +.. function:: save(filename :: AbstractString, node :: SymbolicNode) + + Save a :class:`SymbolicNode` to a JSON file. +=# +function save(filename :: AbstractString, node :: SymbolicNode) + @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), node, filename) end #=doc @@ -359,17 +449,17 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) $hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr) sym_hdr = ref_sym_hdr[] - sym = SymbolicNode(MX_SymbolHandle(sym_hdr)) + node = SymbolicNode(MX_SymbolHandle(sym_hdr)) hint = lowercase(string($func_name)) name = get!(DEFAULT_NAME_MANAGER, name, hint) if length(args) != 0 - _compose!(sym, name, args...) + _compose!(node, name, args...) else - _compose!(sym; name=name, symbol_kws...) + _compose!(node; name=name, symbol_kws...) end - return sym + return node end func_def = Expr(:function, func_head, Expr(:block, func_body)) From f5f27779649779b8c49e36c3d160186dfc85e003 Mon Sep 17 00:00:00 2001 From: Andre Pemmelaar Date: Thu, 12 Nov 2015 19:28:18 +0900 Subject: [PATCH 204/630] Adds Mean Squared Error evaluation metric --- src/metric.jl | 41 +++++++++++++++++++++++++++++++++++++++++ 1 file changed, 41 insertions(+) diff --git a/src/metric.jl b/src/metric.jl index 3f35e7455ac5..a9e4db2dea4e 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -113,4 +113,45 @@ function reset!(metric :: Accuracy) metric.n_sample = 0 end +#=doc +.. class:: MSE + + Mean Squared Error. + + Calculates the mean squared error regression loss in one dimension. 
+=# + +type MSE <: AbstractEvalMetric + mse_sum :: Float64 + n_sample :: Int + MSE() = new(0.0, 0) +end + +function _update_single_output(metric :: MSE, label :: NDArray, pred :: NDArray) + label = copy(label) + pred = copy(pred) + + n_sample = size(pred)[end] + metric.n_sample += n_sample + + for i = 1:n_sample + metric.mse_sum += (label[i] - pred[i])^2 + end +end + +function update!(metric :: MSE, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + @assert length(labels) == length(preds) + for i = 1:length(labels) + _update_single_output(metric, labels[i], preds[i]) + end +end + +function get(metric :: MSE) + return [(:MSE, metric.mse_sum / metric.n_sample)] +end + +function reset!(metric :: MSE) + metric.mse_sum = 0.0 + metric.n_sample = 0 +end From 0b538d1400bbbebb49b6e52810687726b4ae1672 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 12:37:55 -0500 Subject: [PATCH 205/630] make notes on MSE metrics --- docs/api/metric.rst | 9 +++++++++ src/metric.jl | 2 +- 2 files changed, 10 insertions(+), 1 deletion(-) diff --git a/docs/api/metric.rst b/docs/api/metric.rst index 5f13bd7006c3..614058d18294 100644 --- a/docs/api/metric.rst +++ b/docs/api/metric.rst @@ -47,3 +47,12 @@ set. + +.. class:: MSE + + Mean Squared Error. Todo: add support for multi-dimensional outputs. + + Calculates the mean squared error regression loss in one dimension. + + + diff --git a/src/metric.jl b/src/metric.jl index a9e4db2dea4e..5bf14e52a840 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -116,7 +116,7 @@ end #=doc .. class:: MSE - Mean Squared Error. + Mean Squared Error. TODO: add support for multi-dimensional outputs. Calculates the mean squared error regression loss in one dimension. 
=# From 645091c2a9a2a039f779cc55179745048241ee69 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 16:26:20 -0500 Subject: [PATCH 206/630] char-ltsm temp commit --- examples/char-lstm/.gitignore | 1 + examples/char-lstm/lstm.jl | 98 ++++++++++++++++++++++++++++++++++ examples/char-lstm/seq-data.jl | 37 +++++++++++++ 3 files changed, 136 insertions(+) create mode 100644 examples/char-lstm/.gitignore create mode 100644 examples/char-lstm/lstm.jl create mode 100644 examples/char-lstm/seq-data.jl diff --git a/examples/char-lstm/.gitignore b/examples/char-lstm/.gitignore new file mode 100644 index 000000000000..06c798bc3232 --- /dev/null +++ b/examples/char-lstm/.gitignore @@ -0,0 +1 @@ +input.txt diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl new file mode 100644 index 000000000000..f429313dc723 --- /dev/null +++ b/examples/char-lstm/lstm.jl @@ -0,0 +1,98 @@ +# An explicitly unrolled LSTM with fixed sequence length. +using MXNet + +immutable LSTMState + c :: mx.SymbolicNode + h :: mx.SymbolicNode +end + +immutable LSTMParam + i2h_W :: mx.SymbolicNode + h2h_W :: mx.SymbolicNode + i2h_b :: mx.SymbolicNode + h2h_b :: mx.SymbolicNode +end + +function ltsm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMParam; + num_hidden::Int=512, dropout::Real=0, name::Symbol=gensym()) + + if dropout > 0 + data = mx.Dropout(data, p=dropout) + end + + i2h = mx.FullyConnected(data, weight=param.i2h_W, bias=param.i2h_b, + num_hidden=4num_hidden, name=symbol(name, "_i2h")) + h2h = mx.FullyConnected(prev_state.h, weight=param.h2h_W, bias=param.h2h_b, + num_hidden=4num_hidden, name=symbol(name, "_h2h")) + + gates = mx.SliceChannel(i2h + h2h, num_outputs=4, name=symbol(name, "_gates")) + + in_gate = mx.Activation(gates[1], act_type=:sigmoid) + in_trans = mx.Activation(gates[2], act_type=:tanh) + forget_gate = mx.Activation(gates[3], act_type=:sigmoid) + out_gate = mx.Activation(gates[4], act_type=:sigmoid) + + next_c = (forget_gate .* 
prev_state.c) + (in_gate .* in_trans) + next_h = out_gate .* mx.Activation(next_c, act_type=:tanh) + + return LTSMState(next_c, next_h) +end + +function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_class::Int; + dropout::Real=0, name::Symbol=gensym()) + + # placeholder nodes for all parameters + embed_W = mx.Variable(symbol(name, "_embed_weight")) + pred_W = mx.Variable(symbol(name, "_pred_weight")) + pred_b = mx.Variable(symbol(name, "_pred_bias")) + + layer_param_states = map(1:n_layer) do i + param = LSTMParam(mx.Variable(symbol(name, "_l$(i)_i2h_weight")), + mx.Variable(symbol(name, "_l$(i)_h2h_weight")), + mx.Variable(symbol(name, "_l$(i)_i2h_bias")), + mx.Variable(symbol(name, "_l$(i)_h2h_bias"))) + state = LTSMState(mx.Variable(symbol(name, "_l$(i)_init_c")), + mx.Variable(symbol(name, "_l$(i)_init_h"))) + (param, state) + end + + # now unroll over time + outputs = mx.SymbolicNode[] + for t = 1:seq_len + data = mx.Variable(symbol(name, "_data_$t")) + label = mx.Variable(symbol(name, "_label_$t")) + hidden = mx.FullyConnected(data, weight=embed_W, num_hidden=dim_embed, + no_bias=true, name=symbol(name, "_embed_$t")) + + + # stack LTSM cells + for i = 1:n_layer + l_param, l_state = layer_param_states[i] + dp = i == 1 ? 
0 : dropout # don't do dropout for data + next_state = ltsm_cell(hidden, l_state, l_param, num_hidden=dim_hidden, dropout=dp, + name=symbol(name, "_lstm_$t")) + hidden = next_state.h + layer_param_states[i] = (l_param, next_state) + end + + # prediction / decoder + if dropout > 0 + hidden = mx.Dropout(hidden, p=dropout) + end + pred = mx.FullyConnected(hidden, weight=pred_W, bias=pred_b, num_hidden=n_class, + name=symbol(name, "_pred_$t")) + smax = mx.SoftmaxOutput(pred, label, name=symbol(name, "_softmax_$t")) + push!(outputs, smax) + end + + # append block-gradient nodes to the final states + for i = 1:n_layer + l_param, l_state = layer_param_states[i] + final_state = LTSMState(mx.BlockGrad(l_state.c, name=symbol(name, "_l$(i)_last_c")), + mx.BlockGrad(l_state.h, name=symbol(name, "_l$(i)_last_h"))) + layer_param_states[i] = (l_param, final_state) + end + + # now group all outputs together + return mx.Group(outputs...) +end diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl new file mode 100644 index 000000000000..ea6c390581bb --- /dev/null +++ b/examples/char-lstm/seq-data.jl @@ -0,0 +1,37 @@ +# Simple data provider that load text +using MXNet + +const UNKNOWN_CHAR = Char(0) + +function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; max_vocab=10000) + if isfile(vocab_fn) + info("Vocabulary already exists, reusing $vocab_fn...") + vocab = open(corpus_fn) do io + Dict([w[1] => i for (i,w) in enumerate(eachline(io))]) + end + else + # count symbol frequency + dict = Dict{Char,Int}() + open(corpus_fn) do io + for line in eachline(io) + for c in line + dict[c] = get(dict, c, 0) + 1 + end + end + end + + vocab = sort(collect(dict), by=x->-x.second) + vocab = vocab[1:min(max_vocab,length(vocab))] + open(vocab_fn, "w") do io + for x in vocab + println(io, x.first) + end + end + + vocab = Dict([x.first => i for (i,x) in enumerate(vocab)]) + end + vocab[UNKNOWN_CHAR] = 0 + return vocab +end + +build_vocabulary("input.txt", 
"vocab.txt") From 703d78fd97df64373729d6b182a181d1f2874892 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 19:08:23 -0500 Subject: [PATCH 207/630] char-ltsm example, not tested --- examples/char-lstm/.gitignore | 1 + examples/char-lstm/config.jl | 19 ++++++++ examples/char-lstm/seq-data.jl | 87 ++++++++++++++++++++++++++++++---- examples/char-lstm/train.jl | 34 +++++++++++++ plugins/io/svmlight.jl | 1 + 5 files changed, 134 insertions(+), 8 deletions(-) create mode 100644 examples/char-lstm/config.jl create mode 100644 examples/char-lstm/train.jl diff --git a/examples/char-lstm/.gitignore b/examples/char-lstm/.gitignore index 06c798bc3232..4b87bf4070f6 100644 --- a/examples/char-lstm/.gitignore +++ b/examples/char-lstm/.gitignore @@ -1 +1,2 @@ input.txt +vocab.dat diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl new file mode 100644 index 000000000000..d94d6e995cbf --- /dev/null +++ b/examples/char-lstm/config.jl @@ -0,0 +1,19 @@ +const DROPOUT = 0 +const BATCH_SIZE = 32 +const SEQ_LENGTH = 32 +const DIM_HIDDEN = 256 +const DIM_EMBED = 256 +const LTSM_N_LAYER = 2 +const N_EPOCH = 21 +const LEARNING_RATE = 1 +const WEIGHT_DECAY = 0.00001 +const MOMENTUM = 0.0 +const CLIP_GRADIENT = 1 +const NAME = :ptb +const N_GPU = 4 +const USE_GPU = true +const DATA_TR_RATIO = 0.9 + +const UNKNOWN_CHAR = Char(0) +const INPUT_FILE = joinpath(dirname(@__FILE__), "input.txt") +const VOCAB_FILE = joinpath(dirname(@__FILE__), "vocab.dat") diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index ea6c390581bb..acf5f9394a5b 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -1,14 +1,11 @@ # Simple data provider that load text +using Iterators using MXNet -const UNKNOWN_CHAR = Char(0) - function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; max_vocab=10000) if isfile(vocab_fn) info("Vocabulary already exists, reusing $vocab_fn...") - vocab = open(corpus_fn) do io 
- Dict([w[1] => i for (i,w) in enumerate(eachline(io))]) - end + vocab = Dict{Char,Int}([w => i for (i,w) in enumerate(readall(vocab_fn))]) else # count symbol frequency dict = Dict{Char,Int}() @@ -24,14 +21,88 @@ function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; m vocab = vocab[1:min(max_vocab,length(vocab))] open(vocab_fn, "w") do io for x in vocab - println(io, x.first) + print(io, x.first) end end vocab = Dict([x.first => i for (i,x) in enumerate(vocab)]) end - vocab[UNKNOWN_CHAR] = 0 + vocab[UNKNOWN_CHAR] = length(vocab) return vocab end -build_vocabulary("input.txt", "vocab.txt") +function char_idx(vocab :: Dict{Char,Int}, c :: Char) + if haskey(vocab, c) + vocab[c] + else + vocab[UNKNOWN_CHAR] + end +end + +type CharSeqProvider <: mx.AbstractDataProvider + text :: AbstractString + batch_size :: Int + seq_len :: Int + vocab :: Dict{Char,Int} + + prefix :: Symbol + n_layer :: Int + dim_hidden :: Int +end + +function mx.get_batch_size(p :: CharSeqProvider) + p.batch_size +end +function mx.provide_data(p :: CharSeqProvider) + [(symbol(p.prefix, "_data_$t"), (length(p.vocab), p.batch_size)) for t = 1:p.seq_len] ∪ + [(symbol(p.prefix, "_l$(l)_init_c"), (p.dim_hidden, p.batch_size)) for l=1:p.n_layer] ∪ + [(symbol(p.prefix, "_l$(l)_init_h"), (p.dim_hidden, p.batch_size)) for l=1:p.n_layer] +end +function mx.provide_label(p :: CharSeqProvider) + [(symbol(p.prefix, "_label_$t"), (p.batch_size),) for t = 1:p.seq_len] +end + +function mx.eachbatch(p :: CharSeqProvider) + data_all = [mx.zeros(shape) for (name, shape) in mx.provide_data(p)] + label_all = [mx.zeros(shape) for (name, shape) in mx.provide_label(p)] + + data_jl = [copy(x) for x in data_all] + label_jl= [copy(x) for x in label_all] + + batch = mx.DataBatch(data_all, label_all, p.batch_size) + + function _text_iter() + text = p.text + + n_batch = floor(Int, length(text) / p.batch_size / p.seq_len) + text = text[1:n_batch*p.batch_size*p.seq_len] # discard tailing + idx_all = 
1:length(text) + + for idx_batch in partition(idx_all, p.batch_size*p.seq_len) + for i = 1:p.seq_len + data_jl[i][:] = 0 + label_jl[i][:] = 0 + end + + for (i, idx_seq) in enumerate(partition(idx_batch, p.seq_len)) + println("i = $i, idx_seq = $idx_seq") + for (j, idx) in enumerate(idx_seq) + c_this = text[idx] + c_next = idx == length(text) ? UNKNOWN_CHAR : text[idx+1] + data_jl[j][char_idx(vocab,c_this),i] = 1 + label_jl[j][i] = char_idx(vocab,c_next)-1 + end + end + + for i = 1:p.seq_len + copy!(data_all[i], data_jl[i]) + copy!(label_all[i], label_jl[i]) + end + + produce(batch) + end + end + + return Task(_text_iter) +end + diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl new file mode 100644 index 000000000000..1d391255a8ab --- /dev/null +++ b/examples/char-lstm/train.jl @@ -0,0 +1,34 @@ +include(joinpath(dirname(@__FILE__), "config.jl")) +include(joinpath(dirname(@__FILE__), "lstm.jl")) +include(joinpath(dirname(@__FILE__), "seq-data.jl")) + +# build vocabulary +vocab = build_vocabulary(INPUT_FILE, VOCAB_FILE) +n_class = length(vocab) + +# define LTSM +ltsm = LTSM(LTSM_N_LAYER, SEQ_LENGTH, DIM_HIDDEN, DIM_EMBED, n_class, dropout=DROPOUT, name=NAME) + +# load data +text_all = readall(INPUT_FILE) +len_train = round(Int, length(text_all)*DATA_TR_RATIO) +text_tr = text_all[1:len_train] +text_val = text_all[len_train+1:end] + +data_tr = CharSeqProvider(text_tr, BATCH_SIZE, SEQ_LENGTH, vocab, NAME, + LSTM_N_LAYER, DIM_HIDDEN) +data_val = CharSeqProvider(text_val, BATCH_SIZE, SEQ_LENGTH, vocab, NAME, + LSTM_N_LAYER, DIM_HIDDEN) + +# set up training +if USE_GPU + context = [mx.gpu(i) for i = 0:N_GPU-1] +else + context = [mx.cpu()] +end + +model = mx.FeedForward(lstm, context=context) +optimizer = mx.SGD(lr=LEARNING_RATE, momentum=MOMENTUM, + weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) + +mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH) diff --git a/plugins/io/svmlight.jl b/plugins/io/svmlight.jl index 
94563357ee6e..500c040394ee 100644 --- a/plugins/io/svmlight.jl +++ b/plugins/io/svmlight.jl @@ -44,6 +44,7 @@ function mx.eachbatch(provider :: SVMLightProvider) function _svmlight_iter() f = SVMLightFile(provider.filename) while true + error("This is actually buggy and needs fixing") raw = collect(take(f, provider.batch_size)) cnt = length(raw) if cnt == 0 From eea7d2c1c2739f5592a82726b753511f82af0576 Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 12 Nov 2015 19:24:09 -0500 Subject: [PATCH 208/630] typo ltsm -> lstm --- examples/char-lstm/config.jl | 2 +- examples/char-lstm/lstm.jl | 12 ++++++------ examples/char-lstm/train.jl | 4 ++-- 3 files changed, 9 insertions(+), 9 deletions(-) diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index d94d6e995cbf..b6de43c440d8 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -3,7 +3,7 @@ const BATCH_SIZE = 32 const SEQ_LENGTH = 32 const DIM_HIDDEN = 256 const DIM_EMBED = 256 -const LTSM_N_LAYER = 2 +const LSTM_N_LAYER = 2 const N_EPOCH = 21 const LEARNING_RATE = 1 const WEIGHT_DECAY = 0.00001 diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index f429313dc723..81805b95da95 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -13,7 +13,7 @@ immutable LSTMParam h2h_b :: mx.SymbolicNode end -function ltsm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMParam; +function lstm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMParam; num_hidden::Int=512, dropout::Real=0, name::Symbol=gensym()) if dropout > 0 @@ -35,7 +35,7 @@ function ltsm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMPara next_c = (forget_gate .* prev_state.c) + (in_gate .* in_trans) next_h = out_gate .* mx.Activation(next_c, act_type=:tanh) - return LTSMState(next_c, next_h) + return LSTMState(next_c, next_h) end function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_class::Int; @@ -51,7 +51,7 @@ 
function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla mx.Variable(symbol(name, "_l$(i)_h2h_weight")), mx.Variable(symbol(name, "_l$(i)_i2h_bias")), mx.Variable(symbol(name, "_l$(i)_h2h_bias"))) - state = LTSMState(mx.Variable(symbol(name, "_l$(i)_init_c")), + state = LSTMState(mx.Variable(symbol(name, "_l$(i)_init_c")), mx.Variable(symbol(name, "_l$(i)_init_h"))) (param, state) end @@ -65,11 +65,11 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla no_bias=true, name=symbol(name, "_embed_$t")) - # stack LTSM cells + # stack LSTM cells for i = 1:n_layer l_param, l_state = layer_param_states[i] dp = i == 1 ? 0 : dropout # don't do dropout for data - next_state = ltsm_cell(hidden, l_state, l_param, num_hidden=dim_hidden, dropout=dp, + next_state = lstm_cell(hidden, l_state, l_param, num_hidden=dim_hidden, dropout=dp, name=symbol(name, "_lstm_$t")) hidden = next_state.h layer_param_states[i] = (l_param, next_state) @@ -88,7 +88,7 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla # append block-gradient nodes to the final states for i = 1:n_layer l_param, l_state = layer_param_states[i] - final_state = LTSMState(mx.BlockGrad(l_state.c, name=symbol(name, "_l$(i)_last_c")), + final_state = LSTMState(mx.BlockGrad(l_state.c, name=symbol(name, "_l$(i)_last_c")), mx.BlockGrad(l_state.h, name=symbol(name, "_l$(i)_last_h"))) layer_param_states[i] = (l_param, final_state) end diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index 1d391255a8ab..03631c2672bf 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -6,8 +6,8 @@ include(joinpath(dirname(@__FILE__), "seq-data.jl")) vocab = build_vocabulary(INPUT_FILE, VOCAB_FILE) n_class = length(vocab) -# define LTSM -ltsm = LTSM(LTSM_N_LAYER, SEQ_LENGTH, DIM_HIDDEN, DIM_EMBED, n_class, dropout=DROPOUT, name=NAME) +# define LSTM +lstm = LSTM(LSTM_N_LAYER, SEQ_LENGTH, DIM_HIDDEN, DIM_EMBED, n_class, 
dropout=DROPOUT, name=NAME) # load data text_all = readall(INPUT_FILE) From e35b92941c262f976774367f9f8e5a03aa4e822e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 19:25:22 -0500 Subject: [PATCH 209/630] fix macro error reporting --- src/symbolic-node.jl | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 8b0a5b4fad5f..0b7385ffa1a7 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -382,7 +382,8 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) Ref{char_pp}, Ref{char_p}), hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, ref_kv_nargs) - func_name = symbol(bytestring(ref_name[])) + func_name_s= bytestring(ref_name[]) + func_name = symbol(func_name_s) kv_nargs_s = bytestring(ref_kv_nargs[]) kv_nargs = symbol(kv_nargs_s) @@ -431,12 +432,12 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) end if length(args) != 0 && length(symbol_kws) != 0 - @assert(false, "$func_name only accepts Symbols either as positional or keyword arguments, not both.") + @assert(false, $func_name_s * " only accepts Symbols either as positional or keyword arguments, not both.") end $(if kv_nargs != symbol("") quote if length(symbol_kws) > 0 - @assert(false, "$func_name takes variable number of SymbolicNode arguments, please pass input Symbols " * + @assert(false, $func_name * " takes variable number of SymbolicNode arguments, please pass input Symbols " * "via positional arguments, instead of keyword arguments.") end end @@ -450,7 +451,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) sym_hdr = ref_sym_hdr[] node = SymbolicNode(MX_SymbolHandle(sym_hdr)) - hint = lowercase(string($func_name)) + hint = lowercase($func_name_s) name = get!(DEFAULT_NAME_MANAGER, name, hint) if length(args) != 0 From 5a9d56af303e38298edbfb1c809f41a22bc87aae Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang 
Date: Thu, 12 Nov 2015 19:29:42 -0500 Subject: [PATCH 210/630] fix some errors --- examples/char-lstm/lstm.jl | 8 ++++---- examples/char-lstm/seq-data.jl | 2 +- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index 81805b95da95..aca4d7660e1b 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -20,9 +20,9 @@ function lstm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMPara data = mx.Dropout(data, p=dropout) end - i2h = mx.FullyConnected(data, weight=param.i2h_W, bias=param.i2h_b, + i2h = mx.FullyConnected(data=data, weight=param.i2h_W, bias=param.i2h_b, num_hidden=4num_hidden, name=symbol(name, "_i2h")) - h2h = mx.FullyConnected(prev_state.h, weight=param.h2h_W, bias=param.h2h_b, + h2h = mx.FullyConnected(data=prev_state.h, weight=param.h2h_W, bias=param.h2h_b, num_hidden=4num_hidden, name=symbol(name, "_h2h")) gates = mx.SliceChannel(i2h + h2h, num_outputs=4, name=symbol(name, "_gates")) @@ -61,7 +61,7 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla for t = 1:seq_len data = mx.Variable(symbol(name, "_data_$t")) label = mx.Variable(symbol(name, "_label_$t")) - hidden = mx.FullyConnected(data, weight=embed_W, num_hidden=dim_embed, + hidden = mx.FullyConnected(data=data, weight=embed_W, num_hidden=dim_embed, no_bias=true, name=symbol(name, "_embed_$t")) @@ -79,7 +79,7 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla if dropout > 0 hidden = mx.Dropout(hidden, p=dropout) end - pred = mx.FullyConnected(hidden, weight=pred_W, bias=pred_b, num_hidden=n_class, + pred = mx.FullyConnected(data=hidden, weight=pred_W, bias=pred_b, num_hidden=n_class, name=symbol(name, "_pred_$t")) smax = mx.SoftmaxOutput(pred, label, name=symbol(name, "_softmax_$t")) push!(outputs, smax) diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index acf5f9394a5b..bd7c04576d90 100644 --- 
a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -59,7 +59,7 @@ function mx.provide_data(p :: CharSeqProvider) [(symbol(p.prefix, "_l$(l)_init_h"), (p.dim_hidden, p.batch_size)) for l=1:p.n_layer] end function mx.provide_label(p :: CharSeqProvider) - [(symbol(p.prefix, "_label_$t"), (p.batch_size),) for t = 1:p.seq_len] + [(symbol(p.prefix, "_label_$t"), (p.batch_size,)) for t = 1:p.seq_len] end function mx.eachbatch(p :: CharSeqProvider) From 487d5e85300125799fb6bad3fcf421668d80578d Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 12 Nov 2015 19:36:48 -0500 Subject: [PATCH 211/630] fix kvstore refactoring bug --- examples/char-lstm/seq-data.jl | 1 - src/kvstore.jl | 2 +- 2 files changed, 1 insertion(+), 2 deletions(-) diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index bd7c04576d90..3f545671facd 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -85,7 +85,6 @@ function mx.eachbatch(p :: CharSeqProvider) end for (i, idx_seq) in enumerate(partition(idx_batch, p.seq_len)) - println("i = $i, idx_seq = $idx_seq") for (j, idx) in enumerate(idx_seq) c_this = text[idx] c_next = idx == length(text) ? 
UNKNOWN_CHAR : text[idx+1] diff --git a/src/kvstore.jl b/src/kvstore.jl index 1d8c98935768..d52433f567b2 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -121,7 +121,7 @@ end function set_optimizer(self :: KVStore, optimizer :: AbstractOptimizer) ref_is_worker = Ref{Cint}(0) - @mxcall(:MXKVStoreIsWorkerSymbolicNode, (Ref{Cint},), ref_is_worker) + @mxcall(:MXKVStoreIsWorkerNode, (Ref{Cint},), ref_is_worker) is_worker = ref_is_worker[] if ismatch(r"dist", string(get_type(self))) && is_worker From e4b6306e3e1e0807e3a21eb6175b33230f917632 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 19:44:31 -0500 Subject: [PATCH 212/630] fix databatch --- src/io.jl | 4 ++-- src/model.jl | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/src/io.jl b/src/io.jl index 71bbc38a7f50..1b3ee3b091a9 100644 --- a/src/io.jl +++ b/src/io.jl @@ -204,8 +204,8 @@ type DataBatch <: AbstractDataBatch count :: Int end count_samples(batch :: DataBatch) = batch.count -get_data(batch :: DataBatch) = batch.data -get_label(batch :: DataBatch) = batch.label +get_data{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batch.data +get_label{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batch.label #=doc .. class:: SlicedNDArray diff --git a/src/model.jl b/src/model.jl index 1a9d11facbe2..6d77306597dc 100644 --- a/src/model.jl +++ b/src/model.jl @@ -391,7 +391,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # invoke callbacks on epoch 0 _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) - # now start training... 
+ info("Start training...") for i_epoch = 1:opts.n_epoch time_start = time() reset!(opts.eval_metric) From 6ddbecdd3e72b7ca8051ce9bbfe3eea12e50f745 Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 12 Nov 2015 20:11:22 -0500 Subject: [PATCH 213/630] add speedometer --- examples/char-lstm/train.jl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index 03631c2672bf..de81e3691739 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -31,4 +31,5 @@ model = mx.FeedForward(lstm, context=context) optimizer = mx.SGD(lr=LEARNING_RATE, momentum=MOMENTUM, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) -mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH) +mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, + callbacks=[mx.speedometer()]) From 00c7bff664e8cee9cece4cc2464223e69b1fe711 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 20:12:14 -0500 Subject: [PATCH 214/630] neg-log-likilihood eval metric --- examples/char-lstm/lstm.jl | 29 +++++++++++++++++++++++++++++ examples/char-lstm/train.jl | 4 ++-- 2 files changed, 31 insertions(+), 2 deletions(-) diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index aca4d7660e1b..05be419596c0 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -96,3 +96,32 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla # now group all outputs together return mx.Group(outputs...) 
end + + +# Negative Log-likelihood +type NLL <: mx.AbstractEvalMetric + nll_sum :: Float64 + n_sample :: Int + + NLL() = new(0.0, 0) +end + +function mx.update!(metric :: NLL, labels :: Vector{mx.NDArray}, preds :: Vector{NDArray}) + @assert length(labels) == length(preds) + nll = 0.0 + for (label, pred) in zip(labels, preds) + @nd_as_jl ro=(label, pred) begin + nll -= sum(log(broadcast_getindex(pred, label+1, 1:length(label)))) + end + end + + nll = nll / length(labels) + metric.nll_sum += nll + metric.n_sample += length(labels[1]) +end + +function mx.get(metric :: NLL) + nll = metric.nll / metric.n_sample + perp = exp(nll) + return [(symbol("neg-log-likelihood"), nll), (:perplexity, perp)] +end diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index de81e3691739..d66b2b4a88eb 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -31,5 +31,5 @@ model = mx.FeedForward(lstm, context=context) optimizer = mx.SGD(lr=LEARNING_RATE, momentum=MOMENTUM, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) -mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, - callbacks=[mx.speedometer()]) +mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, + callbacks=[mx.speedometer()], eval_metric=NLL()) From d685f77b4e936cd247f50c5dbc075127555c5620 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 20:15:17 -0500 Subject: [PATCH 215/630] tweak training log formatting --- examples/char-lstm/lstm.jl | 2 +- src/model.jl | 6 +++--- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index 05be419596c0..9305b119ee06 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -123,5 +123,5 @@ end function mx.get(metric :: NLL) nll = metric.nll / metric.n_sample perp = exp(nll) - return [(symbol("neg-log-likelihood"), nll), (:perplexity, perp)] + return [(:NLL, nll), (:perplexity, perp)] end diff --git 
a/src/model.jl b/src/model.jl index 6d77306597dc..015d9c09af05 100644 --- a/src/model.jl +++ b/src/model.jl @@ -461,9 +461,9 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra info(format("== Epoch {1:0>3d} ==========", i_epoch)) info("## Training summary") for (name, value) in get(opts.eval_metric) - info(format("{1:>15s} = {2:.4f}", name, value)) + info(format("{1:>18s} = {2:.4f}", string(name), value)) end - info(format("{1:>15s} = {2:.4f} seconds", "time", time_stop-time_start)) + info(format("{1:>18s} = {2:.4f} seconds", "time", time_stop-time_start)) # evaluation on validation set if !isa(opts.eval_data, Void) @@ -491,7 +491,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra info("## Validation summary") for (name, value) in get(opts.eval_metric) - info(format("{1:>15s} = {2:.4f}", name, value)) + info(format("{1:>18s} = {2:.4f}", string(name), value)) end end From 69cc430743fb5c43aecf3804c058513072c1401c Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 12 Nov 2015 20:27:47 -0500 Subject: [PATCH 216/630] reset! 
for NLL calculation --- examples/char-lstm/lstm.jl | 13 +++++++++---- 1 file changed, 9 insertions(+), 4 deletions(-) diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index 9305b119ee06..538fe0497676 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -106,12 +106,12 @@ type NLL <: mx.AbstractEvalMetric NLL() = new(0.0, 0) end -function mx.update!(metric :: NLL, labels :: Vector{mx.NDArray}, preds :: Vector{NDArray}) +function mx.update!(metric :: NLL, labels :: Vector{mx.NDArray}, preds :: Vector{mx.NDArray}) @assert length(labels) == length(preds) nll = 0.0 for (label, pred) in zip(labels, preds) - @nd_as_jl ro=(label, pred) begin - nll -= sum(log(broadcast_getindex(pred, label+1, 1:length(label)))) + @mx.nd_as_jl ro=(label, pred) begin + nll -= sum(log(max(broadcast_getindex(pred, round(Int,label+1), 1:length(label)), 1e-20))) end end @@ -121,7 +121,12 @@ function mx.update!(metric :: NLL, labels :: Vector{mx.NDArray}, preds :: Vector end function mx.get(metric :: NLL) - nll = metric.nll / metric.n_sample + nll = metric.nll_sum / metric.n_sample perp = exp(nll) return [(:NLL, nll), (:perplexity, perp)] end + +function mx.reset!(metric :: NLL) + metric.nll_sum = 0.0 + metric.n_sample = 0 +end From c5c1e057c7f45de3e8c7e3f2922f7bff3eb4082b Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 22:03:59 -0500 Subject: [PATCH 217/630] basic network visualization --- REQUIRE | 1 + src/MXNet.jl | 1 + src/visualize.jl | 154 +++++++++++++++++++++++++++++++++++++++++++++++ 3 files changed, 156 insertions(+) create mode 100644 src/visualize.jl diff --git a/REQUIRE b/REQUIRE index a0f5c9865565..fea260919fbc 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,3 +1,4 @@ julia 0.4 Formatting BinDeps +JSON diff --git a/src/MXNet.jl b/src/MXNet.jl index a3e280d26a11..42c9e45f477e 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -29,6 +29,7 @@ include("callback.jl") include("model.jl") include("util.jl") +include("visualize.jl") 
include("nn-factory.jl") diff --git a/src/visualize.jl b/src/visualize.jl new file mode 100644 index 000000000000..982a155ad990 --- /dev/null +++ b/src/visualize.jl @@ -0,0 +1,154 @@ +import JSON + +#=doc +Network Visualization +===================== +=# + +#=doc +.. function:: to_graphviz(network) + + :param SymbolicNode network: the network to visualize. + :param AbstractString title: keyword argument, default "Network Visualization", + the title of the GraphViz graph. + :param input_shapes: keyword argument, default ``nothing``. If provided, + will run shape inference and plot with the shape information. Should + be either a dictionary of name-shape mapping or an array of shapes. + :return: the graph description in GraphViz ``dot`` language. +=# +function to_graphviz(network :: SymbolicNode; title="Network Visualization", input_shapes=nothing) + if !isa(input_shapes, Void) + internals = get_internals(network) + if isa(input_shapes, Dict) + _, out_shapes, _ = infer_shape(; input_shapes...) + else + _, out_shapes, _ = infer_shape(input_shapes...) 
+ end + @assert(!isa(out_shapes, Void), "Failed to do shape inference, input shapes are incomplete") + shapes = Dict(zip(list_outputs(internals), out_shapes)) + draw_shape = true + else + draw_shape = false + end + + conf = JSON.parse(to_json(network)) + nodes = conf["nodes"] + heads = unique(conf["heads"][1]+1) + node_attr = Dict(:shape => :box, :fixedsize => true, :width => 1.3, + :height => 0.8034, :style => :filled) + io = IOBuffer() + println(io, "digraph $(_simple_escape(title)) {") + println(io, "node [fontsize=10];") + + # color map + cm = ("#8dd3c7", "#fb8072", "#ffffb3", "#bebada", "#80b1d3", + "#fdb462", "#b3de69", "#fccde5") + + # make nodes + for i = 1:length(nodes) + node = nodes[i] + op = node["op"] + name = node["name"] + attr = deepcopy(node_attr) + label = op + + if op == "null" + if i ∈ heads + label = node["name"] + attr[:fillcolor] = cm[1] + else + continue + end + elseif op == "Convolution" + label = format("Convolution\nkernel={1},stride={2},n-filter={3}", + _extract_shape(node["param"]["kernel"]), + _extract_shape(node["param"]["stride"]), + node["param"]["num_filter"]) + attr[:fillcolor] = cm[2] + elseif op == "FullyConnected" + label = format("FullyConnected\nnum-hidden={1}", node["param"]["num_hidden"]) + attr[:fillcolor] = cm[2] + # TODO: add more + else + attr[:fillcolor] = cm[8] + end + + attr[:label] = label + _format_graphviz_node(io, name, attr) + end + + # add edges + for i = 1:length(nodes) + node = nodes[i] + op = node["op"] + name = node["name"] + if op == "null" + continue + end + inputs = node["inputs"] + for item in inputs + input_node = nodes[item[1]+1] + input_name = input_node["name"] + if input_node["op"] != "null" || (item[1]+1) ∈ heads + attr = Dict(:dir => :back, :arrowtail => :open) + if draw_shape + if input_node["op"] != "null" + key = symbol(input_name, "_output") + shape = shape_dict[key][1:end-1] + else + key = symbol(input_name) + shape = shape_dict[key][1:end-1] + end + label = "(" * join([string(x) for x in 
shape], ",") * ")" + attr[:label] = label + end + _format_graphviz_edge(io, input_name, name, attr) + end + end + end + println(io, "}") + + return takebuf_string(io) +end + +function _format_graphviz_attr(io::IOBuffer, attrs) + label = get(attrs, :label, nothing) + if isa(label, Void) + print(io, " [") + else + print(io, " [label=$(_simple_escape(label)),") + end + first_attr = true + for (k,v) in attrs + if k != :label + if !first_attr + print(io, ",") + end + first_attr = false + + if isa(v, AbstractString) && v[1] == '#' + # color + v = _simple_escape(v) + end + print(io, "$k=$v") + end + end + println(io, "];") +end +function _simple_escape(str :: AbstractString) + str = replace(str, r"\n", "\\n") + return "\"$str\"" +end +function _format_graphviz_node(io::IOBuffer, name::AbstractString, attrs) + print(io, "$(_simple_escape(name)) ") + _format_graphviz_attr(io, attrs) +end +function _format_graphviz_edge(io::IOBuffer, head, tail, attrs) + print(io, """$(_simple_escape(head)) -> $(_simple_escape(tail)) """) + _format_graphviz_attr(io, attrs) +end +function _extract_shape(str :: AbstractString) + shape = matchall(r"\d+", str) + shape = reverse(shape) # JSON in libmxnet has reversed shape (column vs row majoring) + return "(" * join(shape, ",") * ")" +end From e0857a2b53dd370e677644837503704a56bf67e6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 22:14:06 -0500 Subject: [PATCH 218/630] add visualization doc --- docs/api/metric.rst | 2 +- docs/api/symbolic-node.rst | 92 ++++++++++++++++++++++++++++++++++++++ docs/api/visualize.rst | 19 ++++++++ docs/build-api.jl | 1 + docs/index.rst | 1 + src/visualize.jl | 18 +++++++- 6 files changed, 130 insertions(+), 3 deletions(-) create mode 100644 docs/api/visualize.rst diff --git a/docs/api/metric.rst b/docs/api/metric.rst index 614058d18294..db503d5e6849 100644 --- a/docs/api/metric.rst +++ b/docs/api/metric.rst @@ -50,7 +50,7 @@ set. .. class:: MSE - Mean Squared Error. 
Todo: add support for multi-dimensional outputs. + Mean Squared Error. TODO: add support for multi-dimensional outputs. Calculates the mean squared error regression loss in one dimension. diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 2868bf27681e..78e359537ec3 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -725,6 +725,29 @@ Internal APIs +.. function:: _DivScalar(...) + + Perform an elementwise div. + + :param array: Input array operand to the operation. + :type array: SymbolicNode + + + :param scalar: scalar value. + :type scalar: float, required + + + :param scalar_on_right: scalar operand is on the right. + :type scalar_on_right: boolean, optional, default=False + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: _Minus(...) Perform an elementwise minus. @@ -737,6 +760,29 @@ Internal APIs +.. function:: _MinusScalar(...) + + Perform an elementwise minus. + + :param array: Input array operand to the operation. + :type array: SymbolicNode + + + :param scalar: scalar value. + :type scalar: float, required + + + :param scalar_on_right: scalar operand is on the right. + :type scalar_on_right: boolean, optional, default=False + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: _Mul(...) Perform an elementwise mul. @@ -749,6 +795,29 @@ Internal APIs +.. function:: _MulScalar(...) + + Perform an elementwise mul. + + :param array: Input array operand to the operation. + :type array: SymbolicNode + + + :param scalar: scalar value. + :type scalar: float, required + + + :param scalar_on_right: scalar operand is on the right. + :type scalar_on_right: boolean, optional, default=False + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. 
`:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: _Native(...) Stub for implementing an operator implemented in native frontend language. @@ -780,6 +849,29 @@ Internal APIs +.. function:: _PlusScalar(...) + + Perform an elementwise plus. + + :param array: Input array operand to the operation. + :type array: SymbolicNode + + + :param scalar: scalar value. + :type scalar: float, required + + + :param scalar_on_right: scalar operand is on the right. + :type scalar_on_right: boolean, optional, default=False + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + diff --git a/docs/api/visualize.rst b/docs/api/visualize.rst new file mode 100644 index 000000000000..42857c5f4ff0 --- /dev/null +++ b/docs/api/visualize.rst @@ -0,0 +1,19 @@ + +Network Visualization +===================== + + + + +.. function:: to_graphviz(network) + + :param SymbolicNode network: the network to visualize. + :param AbstractString title: keyword argument, default "Network Visualization", + the title of the GraphViz graph. + :param input_shapes: keyword argument, default ``nothing``. If provided, + will run shape inference and plot with the shape information. Should + be either a dictionary of name-shape mapping or an array of shapes. + :return: the graph description in GraphViz ``dot`` language. 
+ + + diff --git a/docs/build-api.jl b/docs/build-api.jl index 99ae5ad1c709..53ca9f6f7ca1 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -94,4 +94,5 @@ extract_doc("metric.rst", "metric.jl") extract_doc("io.rst", "io.jl") embed_mxnet_api("io.rst", "io", mx._import_io_iterators) +extract_doc("visualize.rst", "visualize.jl") extract_doc("nn-factory.rst", "nn-factory.jl") diff --git a/docs/index.rst b/docs/index.rst index da28e3080440..4f718e1861b9 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -42,6 +42,7 @@ For more details, see documentation below. Please also checkout the `examples api/symbolic-node api/nn-factory api/executor + api/visualize Indices and tables ================== diff --git a/src/visualize.jl b/src/visualize.jl index 982a155ad990..e668ba37ecd9 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -60,7 +60,7 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp continue end elseif op == "Convolution" - label = format("Convolution\nkernel={1},stride={2},n-filter={3}", + label = format("Convolution\nkernel={1}\nstride={2}\nn-filter={3}", _extract_shape(node["param"]["kernel"]), _extract_shape(node["param"]["stride"]), node["param"]["num_filter"]) @@ -68,7 +68,21 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp elseif op == "FullyConnected" label = format("FullyConnected\nnum-hidden={1}", node["param"]["num_hidden"]) attr[:fillcolor] = cm[2] - # TODO: add more + elseif op == "Activation" + label = format("Activation\nact-type={1}", node["param"]["act_type"]) + attr[:fillcolor] = cm[3] + elseif op == "BatchNorm" + attr[:fillcolor] = cm[4] + elseif op == "Pooling" + label = format("Pooling\ntype={1}\nkernel={2}\nstride={3}", + node["param"]["pool_type"], + _extract_shape(node["param"]["kernel"]), + _extract_shape(node["param"]["stride"])) + attr[:fillcolor] = cm[5] + elseif op ∈ ("Concat", "Flatten", "Reshape") + attr[:fillcolor] = cm[6] + elseif endswith(op, "Output") + 
attr[:fillcolor] = cm[7] else attr[:fillcolor] = cm[8] end From c4abb973bc4033d6a1c34246678bd2410b152435 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 22:17:11 -0500 Subject: [PATCH 219/630] fix visualization bugs --- src/visualize.jl | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/src/visualize.jl b/src/visualize.jl index e668ba37ecd9..e6ada19f179c 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -20,12 +20,12 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp if !isa(input_shapes, Void) internals = get_internals(network) if isa(input_shapes, Dict) - _, out_shapes, _ = infer_shape(; input_shapes...) + _, out_shapes, _ = infer_shape(internals; input_shapes...) else - _, out_shapes, _ = infer_shape(input_shapes...) + _, out_shapes, _ = infer_shape(internals, input_shapes...) end @assert(!isa(out_shapes, Void), "Failed to do shape inference, input shapes are incomplete") - shapes = Dict(zip(list_outputs(internals), out_shapes)) + shape_dict = Dict(zip(list_outputs(internals), out_shapes)) draw_shape = true else draw_shape = false @@ -149,8 +149,8 @@ function _format_graphviz_attr(io::IOBuffer, attrs) end println(io, "];") end -function _simple_escape(str :: AbstractString) - str = replace(str, r"\n", "\\n") +function _simple_escape(str) + str = replace(string(str), r"\n", "\\n") return "\"$str\"" end function _format_graphviz_node(io::IOBuffer, name::AbstractString, attrs) From 0e1515d3df7aa05debac9f478412a938146b2f55 Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 12 Nov 2015 22:18:20 -0500 Subject: [PATCH 220/630] fix lstm learning rate --- examples/char-lstm/config.jl | 2 +- examples/char-lstm/train.jl | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index b6de43c440d8..fb07d3368f4d 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -5,7 +5,7 @@ const DIM_HIDDEN = 256 
const DIM_EMBED = 256 const LSTM_N_LAYER = 2 const N_EPOCH = 21 -const LEARNING_RATE = 1 +const LEARNING_RATE = 0.1 const WEIGHT_DECAY = 0.00001 const MOMENTUM = 0.0 const CLIP_GRADIENT = 1 diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index d66b2b4a88eb..b23880f589ff 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -32,4 +32,5 @@ optimizer = mx.SGD(lr=LEARNING_RATE, momentum=MOMENTUM, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, + initializer=mx.UniformInitializer(0.1), callbacks=[mx.speedometer()], eval_metric=NLL()) From 6193ef4a3f6e6e71fbc66d9d859c63ecfada0cfc Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 12 Nov 2015 22:31:48 -0500 Subject: [PATCH 221/630] add lr decay to lstm training --- examples/char-lstm/config.jl | 3 ++- examples/char-lstm/train.jl | 7 ++++--- 2 files changed, 6 insertions(+), 4 deletions(-) diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index fb07d3368f4d..e4d4f0c180b8 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -5,7 +5,8 @@ const DIM_HIDDEN = 256 const DIM_EMBED = 256 const LSTM_N_LAYER = 2 const N_EPOCH = 21 -const LEARNING_RATE = 0.1 +const BASE_LR = 0.1 +const LR_DECAY = 0.7 const WEIGHT_DECAY = 0.00001 const MOMENTUM = 0.0 const CLIP_GRADIENT = 1 diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index b23880f589ff..997ba674f8c5 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -28,9 +28,10 @@ else end model = mx.FeedForward(lstm, context=context) -optimizer = mx.SGD(lr=LEARNING_RATE, momentum=MOMENTUM, - weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) +optimizer = mx.SGD(lr_scheduler=mx.LearningRate.Exp(BASE_LR, gamma=LR_DECAY), + momentum=MOMENTUM, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) +ckpoint_prefix = joinpath(dirname(@__FILE__), "checkpoints/$NAME") mx.fit(model, 
optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, initializer=mx.UniformInitializer(0.1), - callbacks=[mx.speedometer()], eval_metric=NLL()) + callbacks=[mx.speedometer(), mx.do_checkpoint(ckpoint_prefix)], eval_metric=NLL()) From b078fecd59fb0414a1825c643136d0705005a965 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 12 Nov 2015 23:22:17 -0500 Subject: [PATCH 222/630] lstm sampler (not tested) --- examples/char-lstm/config.jl | 15 +++++++++ examples/char-lstm/sampler.jl | 56 ++++++++++++++++++++++++++++++++++ examples/char-lstm/seq-data.jl | 8 ----- examples/char-lstm/train.jl | 3 +- src/io.jl | 3 ++ 5 files changed, 75 insertions(+), 10 deletions(-) create mode 100644 examples/char-lstm/sampler.jl diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index e4d4f0c180b8..ff982950132e 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -14,7 +14,22 @@ const NAME = :ptb const N_GPU = 4 const USE_GPU = true const DATA_TR_RATIO = 0.9 +const CKPOINT_PREFIX = joinpath(dirname(@__FILE__), "checkpoints/$NAME") + +const BATCH_SIZE_SMP= 10 +const SAMPLE_LENGTH = 100 +const SAMPLE_START = 'a' const UNKNOWN_CHAR = Char(0) const INPUT_FILE = joinpath(dirname(@__FILE__), "input.txt") const VOCAB_FILE = joinpath(dirname(@__FILE__), "vocab.dat") + +# helper function to convert a char into index in vocabulary +function char_idx(vocab :: Dict{Char,Int}, c :: Char) + if haskey(vocab, c) + vocab[c] + else + vocab[UNKNOWN_CHAR] + end +end + diff --git a/examples/char-lstm/sampler.jl b/examples/char-lstm/sampler.jl new file mode 100644 index 000000000000..c481da1d1950 --- /dev/null +++ b/examples/char-lstm/sampler.jl @@ -0,0 +1,56 @@ +include(joinpath(dirname(@__FILE__), "config.jl")) + +using StatsBase +using MXNet + +# load vocabulary +vocab = build_vocabulary(INPUT_FILE, VOCAB_FILE) + +# prepare data provider +jl_data = [(symbol(NAME, "_data_$t"), zeros(mx.MX_float, (length(vocab), BATCH_SIZE_SMP))) + for t = 
1:SEQ_LENGTH] +jl_c = [(symbol(NAME, "_l$(l)_init_c"), zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) + for l = 1:LSTM_N_LAYER] +jl_h = [(symbol(NAME, "_l$(l)_init_h"), zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) + for l = 1:LSTM_N_LAYER] + +# the first input in the sequence +jl_data_start = jl_data[1] +jl_data_start[char_idx(vocab, SAMPLE_START),:] = 1 + +data = mx.ArrayDataProvider(nd_data ∪ nd_c ∪ nd_h) + +# load model +model = mx.load_checkpoint(CKPOINT_PREFIX, N_EPOCH, mx.FeedForward) + +# prepare outputs +output_samples = zeros(Char, (SAMPLE_LENGTH, BATCH_SIZE_SMP)) +output_samples[1, :] = SAMPLE_START + +# build inverse vocabulary for convenience +inv_vocab = Dict([v => k for (k,v) in vocab]) + +# do prediction and sampling step by step +for t = 2:SAMPLE_LENGTH-1 + outputs = mx.predict(model, data) + + # we will only use the first output to do sampling + outputs = outputs[1] + + jl_data_start[:] = 0 + for i = 1:BATCH_SIZE_SMP + prob = WeightVec(outputs[:, i]) + k = sample(prob) + output_samples[t, k] = inv_vocab[k] + jl_data_start[k, i] = 1 + end +end + +output_texts = [join(output_samples[:,i]) for i = 1:BATCH_SIZE_SMP] +output_texts = [replace(x, UNKNOWN_CHAR, '?') for x in output_texts] + +for (i, text) in enumerate(output_texts) + println("## Sample $i") + println(text) + println() +end diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index 3f545671facd..8bbcfece56c1 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -31,14 +31,6 @@ function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; m return vocab end -function char_idx(vocab :: Dict{Char,Int}, c :: Char) - if haskey(vocab, c) - vocab[c] - else - vocab[UNKNOWN_CHAR] - end -end - type CharSeqProvider <: mx.AbstractDataProvider text :: AbstractString batch_size :: Int diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index 997ba674f8c5..ed4e4403c402 100644 --- a/examples/char-lstm/train.jl 
+++ b/examples/char-lstm/train.jl @@ -31,7 +31,6 @@ model = mx.FeedForward(lstm, context=context) optimizer = mx.SGD(lr_scheduler=mx.LearningRate.Exp(BASE_LR, gamma=LR_DECAY), momentum=MOMENTUM, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) -ckpoint_prefix = joinpath(dirname(@__FILE__), "checkpoints/$NAME") mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, initializer=mx.UniformInitializer(0.1), - callbacks=[mx.speedometer(), mx.do_checkpoint(ckpoint_prefix)], eval_metric=NLL()) + callbacks=[mx.speedometer(), mx.do_checkpoint(CKPOINT_PREFIX)], eval_metric=NLL()) diff --git a/src/io.jl b/src/io.jl index 1b3ee3b091a9..d6ba2fd3d8ce 100644 --- a/src/io.jl +++ b/src/io.jl @@ -307,6 +307,9 @@ end be less samples to include than a mini-batch. This value specify a scalar to pad the contents of all the missing data points. :param Real label_padding: the same as ``data_padding``, except for the labels. + + TODO: remove ``data_padding`` and ``label_padding``, and implement rollover that copies + the last or first several training samples to feed the padding. =# # Julia's type system is sometimes very frustrating. 
You cannot specify a function # with argument Vector{Pair} to expect to be matched when calling with the parameter From 0c3f32de0ad787086b5721b4963dd0d352918233 Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 12 Nov 2015 23:22:58 -0500 Subject: [PATCH 223/630] tweak learning rate --- examples/char-lstm/.gitignore | 1 + examples/char-lstm/config.jl | 2 +- 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/examples/char-lstm/.gitignore b/examples/char-lstm/.gitignore index 4b87bf4070f6..7588feca6bfe 100644 --- a/examples/char-lstm/.gitignore +++ b/examples/char-lstm/.gitignore @@ -1,2 +1,3 @@ input.txt vocab.dat +checkpoints diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index e4d4f0c180b8..79a2040aad8e 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -5,7 +5,7 @@ const DIM_HIDDEN = 256 const DIM_EMBED = 256 const LSTM_N_LAYER = 2 const N_EPOCH = 21 -const BASE_LR = 0.1 +const BASE_LR = 0.5 const LR_DECAY = 0.7 const WEIGHT_DECAY = 0.00001 const MOMENTUM = 0.0 From 0f1fbaa7b2148e40541144d740d5dfa7296b1e56 Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 12 Nov 2015 23:30:35 -0500 Subject: [PATCH 224/630] fix sampler --- examples/char-lstm/config.jl | 9 --------- examples/char-lstm/sampler.jl | 21 +++++++++++---------- examples/char-lstm/seq-data.jl | 9 +++++++++ 3 files changed, 20 insertions(+), 19 deletions(-) diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index e2abe8bb70b5..dbe972899666 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -24,12 +24,3 @@ const UNKNOWN_CHAR = Char(0) const INPUT_FILE = joinpath(dirname(@__FILE__), "input.txt") const VOCAB_FILE = joinpath(dirname(@__FILE__), "vocab.dat") -# helper function to convert a char into index in vocabulary -function char_idx(vocab :: Dict{Char,Int}, c :: Char) - if haskey(vocab, c) - vocab[c] - else - vocab[UNKNOWN_CHAR] - end -end - diff --git a/examples/char-lstm/sampler.jl 
b/examples/char-lstm/sampler.jl index c481da1d1950..2df8de8c0302 100644 --- a/examples/char-lstm/sampler.jl +++ b/examples/char-lstm/sampler.jl @@ -1,4 +1,5 @@ include(joinpath(dirname(@__FILE__), "config.jl")) +include(joinpath(dirname(@__FILE__), "seq-data.jl")) using StatsBase using MXNet @@ -7,23 +8,22 @@ using MXNet vocab = build_vocabulary(INPUT_FILE, VOCAB_FILE) # prepare data provider -jl_data = [(symbol(NAME, "_data_$t"), zeros(mx.MX_float, (length(vocab), BATCH_SIZE_SMP))) - for t = 1:SEQ_LENGTH] -jl_c = [(symbol(NAME, "_l$(l)_init_c"), zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) - for l = 1:LSTM_N_LAYER] -jl_h = [(symbol(NAME, "_l$(l)_init_h"), zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) - for l = 1:LSTM_N_LAYER] +jl_data = Pair[(symbol(NAME, "_data_$t") => zeros(mx.MX_float, (length(vocab), BATCH_SIZE_SMP))) + for t = 1:SEQ_LENGTH] +jl_c = Pair[(symbol(NAME, "_l$(l)_init_c") => zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) + for l = 1:LSTM_N_LAYER] +jl_h = Pair[(symbol(NAME, "_l$(l)_init_h") => zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) + for l = 1:LSTM_N_LAYER] # the first input in the sequence -jl_data_start = jl_data[1] +jl_data_start = jl_data[1].second jl_data_start[char_idx(vocab, SAMPLE_START),:] = 1 -data = mx.ArrayDataProvider(nd_data ∪ nd_c ∪ nd_h) - # load model model = mx.load_checkpoint(CKPOINT_PREFIX, N_EPOCH, mx.FeedForward) # prepare outputs +Base.zero(::Type{Char}) = Char(0) output_samples = zeros(Char, (SAMPLE_LENGTH, BATCH_SIZE_SMP)) output_samples[1, :] = SAMPLE_START @@ -32,6 +32,7 @@ inv_vocab = Dict([v => k for (k,v) in vocab]) # do prediction and sampling step by step for t = 2:SAMPLE_LENGTH-1 + data = mx.ArrayDataProvider(jl_data ∪ jl_c ∪ jl_h) outputs = mx.predict(model, data) # we will only use the first output to do sampling @@ -41,7 +42,7 @@ for t = 2:SAMPLE_LENGTH-1 for i = 1:BATCH_SIZE_SMP prob = WeightVec(outputs[:, i]) k = sample(prob) - output_samples[t, k] = inv_vocab[k] + output_samples[t, i] = 
inv_vocab[k] jl_data_start[k, i] = 1 end end diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index 8bbcfece56c1..2837ab7d8b55 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -97,3 +97,12 @@ function mx.eachbatch(p :: CharSeqProvider) return Task(_text_iter) end +# helper function to convert a char into index in vocabulary +function char_idx(vocab :: Dict{Char,Int}, c :: Char) + if haskey(vocab, c) + vocab[c] + else + vocab[UNKNOWN_CHAR] + end +end + From a6886c2280edccf41bcafb0aa4af39acc6b8b6f6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 13 Nov 2015 00:09:19 -0500 Subject: [PATCH 225/630] copy states over for sampler --- examples/char-lstm/lstm.jl | 5 ++++- examples/char-lstm/sampler.jl | 23 ++++++++++++++++++----- src/model.jl | 9 ++++++--- 3 files changed, 28 insertions(+), 9 deletions(-) diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index 538fe0497676..7ad9fa91b8d9 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -39,7 +39,7 @@ function lstm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMPara end function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_class::Int; - dropout::Real=0, name::Symbol=gensym()) + dropout::Real=0, name::Symbol=gensym(), output_states::Bool=false) # placeholder nodes for all parameters embed_W = mx.Variable(symbol(name, "_embed_weight")) @@ -94,6 +94,9 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla end # now group all outputs together + if output_states + outputs = outputs ∪ [x[2].c for x in layer_param_states] ∪ [x[2].h for x in layer_param_states] + end return mx.Group(outputs...) 
end diff --git a/examples/char-lstm/sampler.jl b/examples/char-lstm/sampler.jl index 2df8de8c0302..02b157b2f539 100644 --- a/examples/char-lstm/sampler.jl +++ b/examples/char-lstm/sampler.jl @@ -19,8 +19,14 @@ jl_h = Pair[(symbol(NAME, "_l$(l)_init_h") => zeros(mx.MX_float, (DIM_HIDDEN, jl_data_start = jl_data[1].second jl_data_start[char_idx(vocab, SAMPLE_START),:] = 1 -# load model -model = mx.load_checkpoint(CKPOINT_PREFIX, N_EPOCH, mx.FeedForward) +# define a LSTM with sequence length 1, also output states so that we could manually copy the states +# when sampling the next char +lstm = LSTM(LSTM_N_LAYER, 1, DIM_HIDDEN, DIM_EMBED, n_class, dropout=DROPOUT, name=NAME, output_states=true) +model = mx.FeedForward(lstm, context=cpu()) + +# load parameters from traind LSTM, though the sequence length is different, since the weights are shared +# over time, this should be compatible. +model = mx.load_checkpoint(model, CKPOINT_PREFIX, N_EPOCH, allow_different_arch=true) # prepare outputs Base.zero(::Type{Char}) = Char(0) @@ -33,11 +39,12 @@ inv_vocab = Dict([v => k for (k,v) in vocab]) # do prediction and sampling step by step for t = 2:SAMPLE_LENGTH-1 data = mx.ArrayDataProvider(jl_data ∪ jl_c ∪ jl_h) - outputs = mx.predict(model, data) + preds = mx.predict(model, data) - # we will only use the first output to do sampling - outputs = outputs[1] + # the first output is prediction + outputs = preds[1] + # do sampling and init the next inputs jl_data_start[:] = 0 for i = 1:BATCH_SIZE_SMP prob = WeightVec(outputs[:, i]) @@ -45,6 +52,12 @@ for t = 2:SAMPLE_LENGTH-1 output_samples[t, i] = inv_vocab[k] jl_data_start[k, i] = 1 end + + # copy the states over + for l = 1:LSTM_N_LAYER + copy!(jl_c[l][2], preds[1+l]) + copy!(jl_h[l][2], preds[1+LSTM_N_LAYER+l]) + end end output_texts = [join(output_samples[:,i]) for i = 1:BATCH_SIZE_SMP] diff --git a/src/model.jl b/src/model.jl index 015d9c09af05..b232ea28bd9d 100644 --- a/src/model.jl +++ b/src/model.jl @@ -550,15 +550,18 @@ 
function load_checkpoint(prefix :: AbstractString, epoch :: Int, ::Type{FeedForw return model end -function load_checkpoint(self :: FeedForward, prefix :: AbstractString, epoch :: Int; overwrite :: Bool = true) +function load_checkpoint(self :: FeedForward, prefix :: AbstractString, epoch :: Int; + overwrite :: Bool = true, allow_different_arch :: Bool = false) if isdefined(self, :arg_params) && isdefined(self, :aux_params) && !overwrite info("model weights already exists, skip loading... (call with overwrite=true if needed)") return self end arch, arg_params, aux_params = load_checkpoint(prefix, epoch) - # TODO: is there better way to compare two symbols - @assert(to_json(self.arch) == to_json(arch), "Cannot load from a checkpoint with different network architecture") + if !allow_different_arch + # TODO: is there better way to compare two symbols + @assert(to_json(self.arch) == to_json(arch), "Cannot load from a checkpoint with different network architecture") + end self.arg_params = arg_params self.aux_params = aux_params return self From f915865753002f88d4fe7f08b316ffd4e494c528 Mon Sep 17 00:00:00 2001 From: pluskid Date: Fri, 13 Nov 2015 00:10:04 -0500 Subject: [PATCH 226/630] use adam optimizer --- examples/char-lstm/config.jl | 4 +--- examples/char-lstm/train.jl | 3 +-- 2 files changed, 2 insertions(+), 5 deletions(-) diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index dbe972899666..b8aa6df49247 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -5,10 +5,8 @@ const DIM_HIDDEN = 256 const DIM_EMBED = 256 const LSTM_N_LAYER = 2 const N_EPOCH = 21 -const BASE_LR = 0.5 -const LR_DECAY = 0.7 +const BASE_LR = 0.05 const WEIGHT_DECAY = 0.00001 -const MOMENTUM = 0.0 const CLIP_GRADIENT = 1 const NAME = :ptb const N_GPU = 4 diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index ed4e4403c402..cb19891f03b1 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -28,8 
+28,7 @@ else end model = mx.FeedForward(lstm, context=context) -optimizer = mx.SGD(lr_scheduler=mx.LearningRate.Exp(BASE_LR, gamma=LR_DECAY), - momentum=MOMENTUM, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) +optimizer = mx.ADAM(lr=BASE_LR, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, initializer=mx.UniformInitializer(0.1), From db7ae38008c5ca294ec41c0262a82c35aec55430 Mon Sep 17 00:00:00 2001 From: pluskid Date: Fri, 13 Nov 2015 00:14:58 -0500 Subject: [PATCH 227/630] fix LSTM sampler --- examples/char-lstm/sampler.jl | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/examples/char-lstm/sampler.jl b/examples/char-lstm/sampler.jl index 02b157b2f539..a641ccb39d69 100644 --- a/examples/char-lstm/sampler.jl +++ b/examples/char-lstm/sampler.jl @@ -1,4 +1,5 @@ include(joinpath(dirname(@__FILE__), "config.jl")) +include(joinpath(dirname(@__FILE__), "lstm.jl")) include(joinpath(dirname(@__FILE__), "seq-data.jl")) using StatsBase @@ -6,10 +7,11 @@ using MXNet # load vocabulary vocab = build_vocabulary(INPUT_FILE, VOCAB_FILE) +n_class = length(vocab) # prepare data provider jl_data = Pair[(symbol(NAME, "_data_$t") => zeros(mx.MX_float, (length(vocab), BATCH_SIZE_SMP))) - for t = 1:SEQ_LENGTH] + for t = 1:1] jl_c = Pair[(symbol(NAME, "_l$(l)_init_c") => zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) for l = 1:LSTM_N_LAYER] jl_h = Pair[(symbol(NAME, "_l$(l)_init_h") => zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) @@ -22,7 +24,7 @@ jl_data_start[char_idx(vocab, SAMPLE_START),:] = 1 # define a LSTM with sequence length 1, also output states so that we could manually copy the states # when sampling the next char lstm = LSTM(LSTM_N_LAYER, 1, DIM_HIDDEN, DIM_EMBED, n_class, dropout=DROPOUT, name=NAME, output_states=true) -model = mx.FeedForward(lstm, context=cpu()) +model = mx.FeedForward(lstm, context=mx.cpu()) # load parameters from traind LSTM, though the sequence 
length is different, since the weights are shared # over time, this should be compatible. From 88299124eae5870282fecef3492ae96739fdb708 Mon Sep 17 00:00:00 2001 From: pluskid Date: Fri, 13 Nov 2015 00:26:59 -0500 Subject: [PATCH 228/630] add basic readme for lstm example --- examples/char-lstm/README.md | 80 ++++++++++++++++++++++++++++++++++++ 1 file changed, 80 insertions(+) create mode 100644 examples/char-lstm/README.md diff --git a/examples/char-lstm/README.md b/examples/char-lstm/README.md new file mode 100644 index 000000000000..6e122a96d945 --- /dev/null +++ b/examples/char-lstm/README.md @@ -0,0 +1,80 @@ +# LSTM char-rnn + +Because we explicitly unroll the LSTM/RNN over time for a fixed sequence length, +it is easy to fit this model into the existing FeedForward model and re-use everything. +To get a more flexible LSTM/RNN implementation that avoids explicit unrolling and +deals with variable-length sequences, we still need to implement another model +beside the existing FeedForward. + +To run this example, you will need to install two extra Julia packages: `Iterators.jl` +and `StatsBase.jl`. + +## Training + +This example is adapted from the +[example in Python binding](https://github.com/dmlc/mxnet/blob/master/example/rnn/char_lstm.ipynb) of +MXNet. The data `input.txt` can be downloaded [here](https://github.com/dmlc/web-data/tree/master/mxnet/tinyshakespeare). + +Modify parameters in [config.jl](config.jl) and then run [train.jl](train.jl). An example output +of training looks like this: +``` +... 
+INFO: Speed: 355.18 samples/sec +INFO: == Epoch 020 ========== +INFO: ## Training summary +INFO: NLL = 1.9670 +INFO: perplexity = 7.1494 +INFO: time = 88.0757 seconds +INFO: ## Validation summary +INFO: NLL = 2.0452 +INFO: perplexity = 7.7307 +INFO: Saved checkpoint to '/cbcl/cbcl01/chiyuan/mxnet/julia/examples/char-lstm/checkpoints/ptb-0020.params' +INFO: Speed: 366.23 samples/sec +INFO: Speed: 360.19 samples/sec +INFO: Speed: 355.77 samples/sec +INFO: Speed: 356.83 samples/sec +INFO: Speed: 354.80 samples/sec +INFO: Speed: 349.89 samples/sec +INFO: Speed: 352.00 samples/sec +INFO: Speed: 358.46 samples/sec +INFO: Speed: 356.58 samples/sec +INFO: Speed: 353.03 samples/sec +INFO: Speed: 351.98 samples/sec +INFO: Speed: 365.54 samples/sec +INFO: Speed: 359.14 samples/sec +INFO: Speed: 355.60 samples/sec +INFO: Speed: 362.44 samples/sec +INFO: Speed: 359.01 samples/sec +INFO: Speed: 357.99 samples/sec +INFO: Speed: 350.07 samples/sec +INFO: Speed: 358.03 samples/sec +INFO: == Epoch 021 ========== +INFO: ## Training summary +INFO: NLL = 1.9698 +INFO: perplexity = 7.1695 +INFO: time = 87.9392 seconds +INFO: ## Validation summary +INFO: NLL = 2.0458 +INFO: perplexity = 7.7353 +INFO: Saved checkpoint to '/cbcl/cbcl01/chiyuan/mxnet/julia/examples/char-lstm/checkpoints/ptb-0021.params' +``` + +## Sampling + +Run [sampler.jl](sampler.jl) to generate sample sentences from the trained model. Some example sentences are +``` +... +## Sample 8 +a, good. Baps, +To she tur in his God twerian: well Resice hestle, the a I here's a not as I lign? +H? + +## Sample 9 +ame. +What high sisiss itle by mard have of on sol I cound: +And pruch you betsts; you god eie hearry? + +## Sample 10 +and oar +Serens Iffall as a we of tere geling pover your nive relly lers; is here whill cheadaplee k? 
+``` From 5da45f39b38244d33316b8ef9e2d181d0942d8df Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 13 Nov 2015 00:51:43 -0500 Subject: [PATCH 229/630] use a more sensible default argument in favor of #24 --- src/model.jl | 17 ++++++++++++----- 1 file changed, 12 insertions(+), 5 deletions(-) diff --git a/src/model.jl b/src/model.jl index b232ea28bd9d..80f0a9644778 100644 --- a/src/model.jl +++ b/src/model.jl @@ -158,9 +158,9 @@ end :param Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory allocation of the :class:`Executor` depends on the mini-batch size of the test data provider. If you call predict twice with data provider of the same batch-size, - then the executor can be re-used. Otherwise, if ``overwrite`` is false (default), - an error will be raised; if ``overwrite`` is set to true, a new :class:`Executor` - will be created to replace the old one. + then the executor can be potentially be re-used. So, if ``overwrite`` is false, + we will try to re-use, and raise an error if batch-size changed. If ``overwrite`` + is true (the default), a new :class:`Executor` will be created to replace the old one. .. note:: @@ -172,12 +172,19 @@ end For the same reason, currently prediction will only use the first device even if multiple devices are provided to construct the model. + .. note:: + + If you perform further after prediction. The weights are not automatically synchronized if ``overwrite`` + is set to false and the old predictor is re-used. In this case + setting ``overwrite`` to true (the default) will re-initialize the predictor the next time you call + predict and synchronize the weights again. 
+ :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` =# -function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = false) +function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = true) predict(self, data; overwrite = overwrite, callback=callback) end -function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=false, callback::Union{Function,Void}=nothing) +function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=true, callback::Union{Function,Void}=nothing) data_shapes = provide_data(data) data_names = [x[1] for x in data_shapes] _setup_predictor(self, overwrite; data_shapes...) From 3bc4fb5c0f83d6b43654ed26063c70e1d246efa3 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 13 Nov 2015 00:55:29 -0500 Subject: [PATCH 230/630] fix path in char-lstm example outputs --- examples/char-lstm/README.md | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/examples/char-lstm/README.md b/examples/char-lstm/README.md index 6e122a96d945..7d625d090c72 100644 --- a/examples/char-lstm/README.md +++ b/examples/char-lstm/README.md @@ -11,8 +11,8 @@ and `StatsBase.jl`. ## Training -This example is adapted from the -[example in Python binding](https://github.com/dmlc/mxnet/blob/master/example/rnn/char_lstm.ipynb) of +This example is adapted from the +[example in Python binding](https://github.com/dmlc/mxnet/blob/master/example/rnn/char_lstm.ipynb) of MXNet. The data `input.txt` can be downloaded [here](https://github.com/dmlc/web-data/tree/master/mxnet/tinyshakespeare). Modify parameters in [config.jl](config.jl) and then run [train.jl](train.jl). 
An example output @@ -28,7 +28,7 @@ INFO: time = 88.0757 seconds INFO: ## Validation summary INFO: NLL = 2.0452 INFO: perplexity = 7.7307 -INFO: Saved checkpoint to '/cbcl/cbcl01/chiyuan/mxnet/julia/examples/char-lstm/checkpoints/ptb-0020.params' +INFO: Saved checkpoint to 'examples/char-lstm/checkpoints/ptb-0020.params' INFO: Speed: 366.23 samples/sec INFO: Speed: 360.19 samples/sec INFO: Speed: 355.77 samples/sec @@ -56,7 +56,7 @@ INFO: time = 87.9392 seconds INFO: ## Validation summary INFO: NLL = 2.0458 INFO: perplexity = 7.7353 -INFO: Saved checkpoint to '/cbcl/cbcl01/chiyuan/mxnet/julia/examples/char-lstm/checkpoints/ptb-0021.params' +INFO: Saved checkpoint to 'examples/char-lstm/checkpoints/ptb-0021.params' ``` ## Sampling From 0e6402df6c76abff674e417ee7c464394f6ff56e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 13 Nov 2015 01:03:52 -0500 Subject: [PATCH 231/630] add simple visualization example of char-lstm --- examples/char-lstm/.gitignore | 2 ++ examples/char-lstm/sampler.jl | 2 +- examples/char-lstm/visualize.jl | 15 +++++++++++++++ 3 files changed, 18 insertions(+), 1 deletion(-) create mode 100644 examples/char-lstm/visualize.jl diff --git a/examples/char-lstm/.gitignore b/examples/char-lstm/.gitignore index 7588feca6bfe..d8923cc201b1 100644 --- a/examples/char-lstm/.gitignore +++ b/examples/char-lstm/.gitignore @@ -1,3 +1,5 @@ input.txt vocab.dat checkpoints +visualize.dot +visualize.svg diff --git a/examples/char-lstm/sampler.jl b/examples/char-lstm/sampler.jl index a641ccb39d69..22166b7700c9 100644 --- a/examples/char-lstm/sampler.jl +++ b/examples/char-lstm/sampler.jl @@ -23,7 +23,7 @@ jl_data_start[char_idx(vocab, SAMPLE_START),:] = 1 # define a LSTM with sequence length 1, also output states so that we could manually copy the states # when sampling the next char -lstm = LSTM(LSTM_N_LAYER, 1, DIM_HIDDEN, DIM_EMBED, n_class, dropout=DROPOUT, name=NAME, output_states=true) +lstm = LSTM(LSTM_N_LAYER, 1, DIM_HIDDEN, DIM_EMBED, n_class, 
name=NAME, output_states=true) model = mx.FeedForward(lstm, context=mx.cpu()) # load parameters from traind LSTM, though the sequence length is different, since the weights are shared diff --git a/examples/char-lstm/visualize.jl b/examples/char-lstm/visualize.jl new file mode 100644 index 000000000000..336afea30705 --- /dev/null +++ b/examples/char-lstm/visualize.jl @@ -0,0 +1,15 @@ +include(joinpath(dirname(@__FILE__), "config.jl")) +include(joinpath(dirname(@__FILE__), "lstm.jl")) + +using MXNet + +vis_n_layer = 2 +vis_seq_len = 3 +vis_n_class = 128 + +lstm = LSTM(vis_n_layer, vis_seq_len, DIM_HIDDEN, DIM_EMBED, vis_n_class, name=NAME, output_states=true) + +open("visualize.dot", "w") do io + println(io, mx.to_graphviz(lstm)) +end +run(pipeline(`dot -Tsvg visualize.dot`, stdout="visualize.svg")) From a392e042216199b3923a9663ca81f632c7ae9ac7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 13 Nov 2015 01:31:00 -0500 Subject: [PATCH 232/630] tweak visualization --- src/visualize.jl | 12 +++++++++--- 1 file changed, 9 insertions(+), 3 deletions(-) diff --git a/src/visualize.jl b/src/visualize.jl index e6ada19f179c..0b5c0c3d8e90 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -33,12 +33,13 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp conf = JSON.parse(to_json(network)) nodes = conf["nodes"] - heads = unique(conf["heads"][1]+1) + heads = unique([x[1]+1 for x in conf["heads"]]) node_attr = Dict(:shape => :box, :fixedsize => true, :width => 1.3, :height => 0.8034, :style => :filled) io = IOBuffer() println(io, "digraph $(_simple_escape(title)) {") println(io, "node [fontsize=10];") + println(io, "edge [fontsize=10];") # color map cm = ("#8dd3c7", "#fb8072", "#ffffb3", "#bebada", "#80b1d3", @@ -54,9 +55,11 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp if op == "null" if i ∈ heads + # heads are output nodes label = node["name"] attr[:fillcolor] = cm[1] else + # otherwise, input 
nodes, might be data, label or parameters continue end elseif op == "Convolution" @@ -81,12 +84,15 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp attr[:fillcolor] = cm[5] elseif op ∈ ("Concat", "Flatten", "Reshape") attr[:fillcolor] = cm[6] - elseif endswith(op, "Output") + elseif endswith(op, "Output") || op == "BlockGrad" attr[:fillcolor] = cm[7] else attr[:fillcolor] = cm[8] end + if op != "null" + label = "$name\n$label" + end attr[:label] = label _format_graphviz_node(io, name, attr) end @@ -116,7 +122,7 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp label = "(" * join([string(x) for x in shape], ",") * ")" attr[:label] = label end - _format_graphviz_edge(io, input_name, name, attr) + _format_graphviz_edge(io, name, input_name, attr) end end end From 75c32cd7b14db86044b906ae8ce191a3d8385c90 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 13 Nov 2015 09:09:51 -0500 Subject: [PATCH 233/630] Add gitter link to dmlc/mxnet --- README.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/README.md b/README.md index 7dc99a24a7b4..a6ae2d5cebe8 100644 --- a/README.md +++ b/README.md @@ -4,6 +4,8 @@ [![codecov.io](https://codecov.io/github/dmlc/MXNet.jl/coverage.svg?branch=master)](https://codecov.io/github/dmlc/MXNet.jl?branch=master) [![Documentation Status](https://readthedocs.org/projects/mxnetjl/badge/?version=latest)](http://mxnetjl.readthedocs.org/en/latest/?badge=latest) [![License](http://dmlc.github.io/img/apache2.svg)](LICENSE.md) +[![Join the chat at https://gitter.im/dmlc/mxnet](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/dmlc/mxnet?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge) + MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. 
Some highlight of features include: From 5b9df89d68ae1847b0cc1e47d20f21e3b0196883 Mon Sep 17 00:00:00 2001 From: pluskid Date: Fri, 13 Nov 2015 09:58:35 -0500 Subject: [PATCH 234/630] update README for LSTM example. --- examples/char-lstm/README.md | 124 +++++++++++++++++++++++------------ examples/char-lstm/config.jl | 2 +- 2 files changed, 84 insertions(+), 42 deletions(-) diff --git a/examples/char-lstm/README.md b/examples/char-lstm/README.md index 6e122a96d945..6e250ba5788c 100644 --- a/examples/char-lstm/README.md +++ b/examples/char-lstm/README.md @@ -19,62 +19,104 @@ Modify parameters in [config.jl](config.jl) and then run [train.jl](train.jl). A of training looks like this: ``` ... -INFO: Speed: 355.18 samples/sec +INFO: Speed: 356.66 samples/sec +INFO: Speed: 357.72 samples/sec INFO: == Epoch 020 ========== INFO: ## Training summary -INFO: NLL = 1.9670 -INFO: perplexity = 7.1494 -INFO: time = 88.0757 seconds +INFO: NLL = 1.4672 +INFO: perplexity = 4.3373 +INFO: time = 87.2631 seconds INFO: ## Validation summary -INFO: NLL = 2.0452 -INFO: perplexity = 7.7307 -INFO: Saved checkpoint to '/cbcl/cbcl01/chiyuan/mxnet/julia/examples/char-lstm/checkpoints/ptb-0020.params' -INFO: Speed: 366.23 samples/sec -INFO: Speed: 360.19 samples/sec -INFO: Speed: 355.77 samples/sec -INFO: Speed: 356.83 samples/sec -INFO: Speed: 354.80 samples/sec -INFO: Speed: 349.89 samples/sec -INFO: Speed: 352.00 samples/sec -INFO: Speed: 358.46 samples/sec -INFO: Speed: 356.58 samples/sec -INFO: Speed: 353.03 samples/sec -INFO: Speed: 351.98 samples/sec -INFO: Speed: 365.54 samples/sec -INFO: Speed: 359.14 samples/sec -INFO: Speed: 355.60 samples/sec -INFO: Speed: 362.44 samples/sec -INFO: Speed: 359.01 samples/sec -INFO: Speed: 357.99 samples/sec -INFO: Speed: 350.07 samples/sec -INFO: Speed: 358.03 samples/sec +INFO: NLL = 1.6374 +INFO: perplexity = 5.1418 +INFO: Saved checkpoint to 'examples/char-lstm/checkpoints/ptb-0020.params' +INFO: Speed: 368.74 samples/sec +INFO: Speed: 361.04 
samples/sec +INFO: Speed: 360.02 samples/sec +INFO: Speed: 362.34 samples/sec +INFO: Speed: 360.80 samples/sec +INFO: Speed: 362.77 samples/sec +INFO: Speed: 357.18 samples/sec +INFO: Speed: 355.30 samples/sec +INFO: Speed: 362.33 samples/sec +INFO: Speed: 359.23 samples/sec +INFO: Speed: 358.09 samples/sec +INFO: Speed: 356.89 samples/sec +INFO: Speed: 371.91 samples/sec +INFO: Speed: 372.24 samples/sec +INFO: Speed: 356.59 samples/sec +INFO: Speed: 356.64 samples/sec +INFO: Speed: 360.24 samples/sec +INFO: Speed: 360.32 samples/sec +INFO: Speed: 362.38 samples/sec INFO: == Epoch 021 ========== INFO: ## Training summary -INFO: NLL = 1.9698 -INFO: perplexity = 7.1695 -INFO: time = 87.9392 seconds +INFO: NLL = 1.4655 +INFO: perplexity = 4.3297 +INFO: time = 86.9243 seconds INFO: ## Validation summary -INFO: NLL = 2.0458 -INFO: perplexity = 7.7353 -INFO: Saved checkpoint to '/cbcl/cbcl01/chiyuan/mxnet/julia/examples/char-lstm/checkpoints/ptb-0021.params' +INFO: NLL = 1.6366 +INFO: perplexity = 5.1378 +INFO: Saved checkpoint to 'examples/char-lstm/checkpoints/ptb-0021.params' ``` ## Sampling Run [sampler.jl](sampler.jl) to generate sample sentences from the trained model. Some example sentences are ``` -... +## Sample 1 +all have sir, +Away will fill'd in His time, I'll keep her, do not madam, if they here? Some more ha? + +## Sample 2 +am. + +CLAUDIO: +Hone here, let her, the remedge, and I know not slept a likely, thou some soully free? + +## Sample 3 +arrel which noble thing +The exchnachsureding worns: I ne'er drunken Biancas, fairer, than the lawfu? + +## Sample 4 +augh assalu, you'ld tell me corn; +Farew. First, for me of a loved. Has thereat I knock you presents? + +## Sample 5 +ame the first answer. + +MARIZARINIO: +Door of Angelo as her lord, shrield liken Here fellow the fool ? + +## Sample 6 +ad well. + +CLAUDIO: +Soon him a fellows here; for her fine edge in a bogms' lord's wife. + +LUCENTIO: +I? + +## Sample 7 +adrezilian measure. 
+ +LUCENTIO: +So, help'd you hath nes have a than dream's corn, beautio, I perchas? + ## Sample 8 -a, good. Baps, -To she tur in his God twerian: well Resice hestle, the a I here's a not as I lign? -H? +as eatter me; +The girlly: and no other conciolation! + +BISTRUMIO: +I have be rest girl. O, that I a h? ## Sample 9 -ame. -What high sisiss itle by mard have of on sol I cound: -And pruch you betsts; you god eie hearry? +and is intend you sort: +What held her all 'clama's for maffice. Some servant.' what I say me the cu? ## Sample 10 -and oar -Serens Iffall as a we of tere geling pover your nive relly lers; is here whill cheadaplee k? +an thoughts will said in our pleasue, +Not scanin on him that you live; believaries she. + +ISABELLLLL? ``` diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index b8aa6df49247..974989167ad1 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -5,7 +5,7 @@ const DIM_HIDDEN = 256 const DIM_EMBED = 256 const LSTM_N_LAYER = 2 const N_EPOCH = 21 -const BASE_LR = 0.05 +const BASE_LR = 0.01 const WEIGHT_DECAY = 0.00001 const CLIP_GRADIENT = 1 const NAME = :ptb From 379de2bf669f3de4fda05dfae52861a1b9ebb376 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 14 Nov 2015 21:09:56 -0500 Subject: [PATCH 235/630] part of LSTM tutorial --- docs/index.rst | 1 + docs/tutorial/char-lstm.rst | 75 +++++++++++++++++++++++++++++++++++++ examples/char-lstm/lstm.jl | 10 ++++- 3 files changed, 85 insertions(+), 1 deletion(-) create mode 100644 docs/tutorial/char-lstm.rst diff --git a/docs/index.rst b/docs/index.rst index 4f718e1861b9..05077bed6904 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -19,6 +19,7 @@ For more details, see documentation below. Please also checkout the `examples :caption: Tutorials tutorial/mnist + tutorial/char-lstm .. 
toctree:: :maxdepth: 2 diff --git a/docs/tutorial/char-lstm.rst b/docs/tutorial/char-lstm.rst new file mode 100644 index 000000000000..4cb9c1c814ae --- /dev/null +++ b/docs/tutorial/char-lstm.rst @@ -0,0 +1,75 @@ +Generating Random Sentence with LSTM RNN +======================================== + +This tutorial shows how to train a LSTM (Long short-term memory) RNN (recurrent +neural network) to perform character-level sequence training and prediction. The +original model, usually called ``char-rnn`` is described in `Andrej Karpathy's +blog `_, with +a reference implementation in Torch available `here +`_. + +Because MXNet.jl does not have a specialized model for recurrent neural networks +yet, the example shown here is an implementation of LSTM by using the default +:class:`FeedForward` model via explicitly unfolding over time. We will be using +fixed-length input sequence for training. The code is adapted from the `char-rnn +example for MXNet's Python binding +`_, which +demonstrates how to use low-level :doc:`symbolic APIs ` to +build customized neural network models directly. + +LSTM Cells +---------- + +Christopher Olah has a `great blog post about LSTM +`_ with beautiful and +clear illustrations. So we will not repeat the definition and explanation of +what an LSTM cell is here. Basically, an LSTM cell takes input ``x``, as well as +previous states (including ``c`` and ``h``), and produce the next states. +We define a helper type to bundle the two state variables together: + +.. literalinclude:: ../../examples/char-lstm/lstm.jl + :language: julia + :start-after: #--LSTMState + :end-before: #--/LSTMState + +Because LSTM weights are shared at every time when we do explicit unfolding, so +we also define a helper type to hold all the weights (and bias) for an LSTM cell +for convenience. + +.. 
literalinclude:: ../../examples/char-lstm/lstm.jl + :language: julia + :start-after: #--LSTMParam + :end-before: #--/LSTMParam + +Note all the variables are of type :class:`SymbolicNode`. We will construct the +LSTM network as a symbolic computation graph, which is then instantiated with +:class:`NDArray` for actual computation. + +.. literalinclude:: ../../examples/char-lstm/lstm.jl + :language: julia + :start-after: #--lstm_cell + :end-before: #--/lstm_cell + +The following figure is stolen from +`Christopher Olah's blog +`_, which illustrate +exactly what the code snippet above is doing. + +.. image:: http://colah.github.io/posts/2015-08-Understanding-LSTMs/img/LSTM3-chain.png + +In particular, instead of defining the four gates independently, we do the +computation together and then use :class:`SliceChannel` to split them into four +outputs. The computation of gates are all done with the symbolic API. The return +value is a LSTM state containing the output of a LSTM cell. + +Unfolding LSTM +-------------- +Using the LSTM cell defined above, we are now ready to define a function to +unfold a LSTM network with L layers and T time steps. The first part of the +function is just defining all the symbolic variables for the shared weights and +states. + +.. literalinclude:: ../../examples/char-lstm/lstm.jl + :language: julia + :start-after: #--LSTM-part1 + :end-before: #--/LSTM-part1 diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index 7ad9fa91b8d9..ab0c678f581d 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -1,18 +1,23 @@ # An explicitly unrolled LSTM with fixed sequence length. 
using MXNet +#--LSTMState immutable LSTMState c :: mx.SymbolicNode h :: mx.SymbolicNode end +#--/LSTMState +#--LSTMParam immutable LSTMParam i2h_W :: mx.SymbolicNode h2h_W :: mx.SymbolicNode i2h_b :: mx.SymbolicNode h2h_b :: mx.SymbolicNode end +#--/LSTMParam +#--lstm_cell function lstm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMParam; num_hidden::Int=512, dropout::Real=0, name::Symbol=gensym()) @@ -37,7 +42,9 @@ function lstm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMPara return LSTMState(next_c, next_h) end +#--/lstm_cell +#--LSTM-part1 function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_class::Int; dropout::Real=0, name::Symbol=gensym(), output_states::Bool=false) @@ -55,6 +62,8 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla mx.Variable(symbol(name, "_l$(i)_init_h"))) (param, state) end + #... + #--/LSTM-part1 # now unroll over time outputs = mx.SymbolicNode[] @@ -64,7 +73,6 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla hidden = mx.FullyConnected(data=data, weight=embed_W, num_hidden=dim_embed, no_bias=true, name=symbol(name, "_embed_$t")) - # stack LSTM cells for i = 1:n_layer l_param, l_state = layer_param_states[i] From c804be9df6168edae462ba5d6b5424c020ca4d16 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 14 Nov 2015 23:36:46 -0500 Subject: [PATCH 236/630] char-LSTM tutorial --- docs/api/io.rst | 87 ++--- docs/api/model.rst | 13 +- docs/tutorial/char-lstm.rst | 297 ++++++++++++++++- docs/tutorial/images/LSTM3-chain.png | Bin 0 -> 229688 bytes docs/tutorial/images/char-lstm-vis.svg | 435 +++++++++++++++++++++++++ examples/char-lstm/lstm.jl | 8 +- examples/char-lstm/seq-data.jl | 11 + examples/char-lstm/train.jl | 9 +- src/io.jl | 84 ++--- 9 files changed, 857 insertions(+), 87 deletions(-) create mode 100644 docs/tutorial/images/LSTM3-chain.png create mode 100644 docs/tutorial/images/char-lstm-vis.svg diff --git 
a/docs/api/io.rst b/docs/api/io.rst index e9d9c04e9f3c..f1ab959be6f2 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -59,62 +59,66 @@ and split it into mini-batches so that the model can consume the data in a unifo By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface is implemented on the provider type itself. But the extra layer of abstraction allows us to - implement a data provider easily via a Julia ``Task`` coroutine. - The detailed interface function is listed below: + implement a data provider easily via a Julia ``Task`` coroutine. See the + data provider defined in :doc:`the char-lstm example + ` for an example of using coroutine to define data + providers. - .. function:: Base.eltype(provider) -> AbstractDataBatch +The detailed interface functions for the iterator API is listed below: - :param AbstractDataProvider provider: the data provider. - :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. +.. function:: Base.eltype(provider) -> AbstractDataBatch - .. function:: Base.start(provider) -> AbstractDataProviderState + :param AbstractDataProvider provider: the data provider. + :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. - :param AbstractDataProvider provider: the data provider. +.. function:: Base.start(provider) -> AbstractDataProviderState - This function is always called before iterating into the dataset. It should initialize - the iterator, reset the index, and do data shuffling if needed. + :param AbstractDataProvider provider: the data provider. - .. function:: Base.done(provider, state) -> Bool + This function is always called before iterating into the dataset. It should initialize + the iterator, reset the index, and do data shuffling if needed. - :param AbstractDataProvider provider: the data provider. - :param AbstractDataProviderState state: the state returned by :func:`Base.start` :func:`Base.next`. 
- :return: true if there is no more data to iterate in this dataset. +.. function:: Base.done(provider, state) -> Bool - .. function:: Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) + :param AbstractDataProvider provider: the data provider. + :param AbstractDataProviderState state: the state returned by :func:`Base.start` :func:`Base.next`. + :return: true if there is no more data to iterate in this dataset. - :param AbstractDataProvider provider: the data provider. - :return: the current data batch, and the state for the next iteration. +.. function:: Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) - Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that - is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this - case, you can safely assume that + :param AbstractDataProvider provider: the data provider. + :return: the current data batch, and the state for the next iteration. - * :func:`Base.start` will always be called, and called only once before the iteration starts. - * :func:`Base.done` will always be called at the beginning of every iteration and always be called once. - * If :func:`Base.done` return true, the iteration will stop, until the next round, again, starting with - a call to :func:`Base.start`. - * :func:`Base.next` will always be called only once in each iteration. It will always be called after - one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will - not be called. +Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that +is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this +case, you can safely assume that - With those assumptions, it will be relatively easy to adapt any existing iterator. 
See the implementation - of the built-in :class:`MXDataProvider` for example. +* :func:`Base.start` will always be called, and called only once before the iteration starts. +* :func:`Base.done` will always be called at the beginning of every iteration and always be called once. +* If :func:`Base.done` return true, the iteration will stop, until the next round, again, starting with + a call to :func:`Base.start`. +* :func:`Base.next` will always be called only once in each iteration. It will always be called after + one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will + not be called. - .. caution:: +With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation +of the built-in :class:`MXDataProvider` for example. - Please do not use the one data provider simultaneously in two different places, either in parallel, - or in a nested loop. For example, the behavior for the following code is undefined +.. caution:: - .. code-block:: julia + Please do not use the one data provider simultaneously in two different places, either in parallel, + or in a nested loop. For example, the behavior for the following code is undefined - for batch in data - # updating the parameters + .. code-block:: julia + + for batch in data + # updating the parameters - # now let's test the performance on the training set - for b2 in data - # ... - end - end + # now let's test the performance on the training set + for b2 in data + # ... + end + end @@ -163,7 +167,7 @@ and split it into mini-batches so that the model can consume the data in a unifo :param AbstractDataBatch batch: the data batch object. :param Base.Symbol name: the name of the data to get, should be one of the names provided in either :func:`provide_data() ` - or :func:`provide_label() `. + or :func:`provide_label() `. :return: the corresponding data array corresponding to that name. .. 
function:: load_data!(provider, batch, targets) @@ -243,6 +247,9 @@ Built-in data providers contents of all the missing data points. :param Real label_padding: the same as ``data_padding``, except for the labels. + TODO: remove ``data_padding`` and ``label_padding``, and implement rollover that copies + the last or first several training samples to feed the padding. + diff --git a/docs/api/model.rst b/docs/api/model.rst index d5245614061b..764d3e9329a8 100644 --- a/docs/api/model.rst +++ b/docs/api/model.rst @@ -71,9 +71,9 @@ a network described using the symbolic API. :param Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory allocation of the :class:`Executor` depends on the mini-batch size of the test data provider. If you call predict twice with data provider of the same batch-size, - then the executor can be re-used. Otherwise, if ``overwrite`` is false (default), - an error will be raised; if ``overwrite`` is set to true, a new :class:`Executor` - will be created to replace the old one. + then the executor can potentially be re-used. So, if ``overwrite`` is false, + we will try to re-use, and raise an error if batch-size changed. If ``overwrite`` + is true (the default), a new :class:`Executor` will be created to replace the old one. .. note:: @@ -85,6 +85,13 @@ a network described using the symbolic API. For the same reason, currently prediction will only use the first device even if multiple devices are provided to construct the model. + .. note:: + + If you perform further training after prediction, the weights are not automatically synchronized if ``overwrite`` + is set to false and the old predictor is re-used. In this case + setting ``overwrite`` to true (the default) will re-initialize the predictor the next time you call + predict and synchronize the weights again. 
+ :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` diff --git a/docs/tutorial/char-lstm.rst b/docs/tutorial/char-lstm.rst index 4cb9c1c814ae..5b1c348e5568 100644 --- a/docs/tutorial/char-lstm.rst +++ b/docs/tutorial/char-lstm.rst @@ -17,6 +17,13 @@ example for MXNet's Python binding demonstrates how to use low-level :doc:`symbolic APIs ` to build customized neural network models directly. +The most important code snippets of this example are shown and explained here. +To see and run the complete code, please refer to the `examples/char-lstm +`_ directory. +You will need to install `Iterators.jl +`_ and `StatsBase.jl +`_ to run this example. + LSTM Cells ---------- @@ -50,12 +57,12 @@ LSTM network as a symbolic computation graph, which is then instantiated with :start-after: #--lstm_cell :end-before: #--/lstm_cell -The following figure is stolen from +The following figure is stolen (permission requested) from `Christopher Olah's blog `_, which illustrate exactly what the code snippet above is doing. -.. image:: http://colah.github.io/posts/2015-08-Understanding-LSTMs/img/LSTM3-chain.png +.. image:: images/LSTM3-chain.png In particular, instead of defining the four gates independently, we do the computation together and then use :class:`SliceChannel` to split them into four @@ -69,7 +76,293 @@ unfold a LSTM network with L layers and T time steps. The first part of the function is just defining all the symbolic variables for the shared weights and states. +The ``embed_W`` are the weights used for character embedding --- i.e. mapping the +one-hot encoded characters into real vectors. The ``pred_W`` and ``pred_b`` are +weights and bias for the final prediction at each time step. + +Then we define the weights for each LSTM cell. Note there is one cell for each +layer, and it will be replicated (unrolled) over time. The states are, however, +*not* shared over time. 
Instead, we define the initial states here at the +beginning of a sequence, and we will update them with the output states at each +time step as we explicitly unroll the LSTM. + .. literalinclude:: ../../examples/char-lstm/lstm.jl :language: julia :start-after: #--LSTM-part1 :end-before: #--/LSTM-part1 + +Unrolling over time is a straightforward procedure of stacking the embedding +layer, and then LSTM cells, on top of which sits the prediction layer. During +unrolling, we update the states and collect all the outputs. Note each time step +takes data and label as inputs. If the LSTM is named as ``:ptb``, the data and +label at step ``t`` will be named ``:ptb_data_$t`` and ``:ptb_label_$t``. Later +on when we prepare the data, we will define the data provider to match those +names. + +.. literalinclude:: ../../examples/char-lstm/lstm.jl + :language: julia + :start-after: #--LSTM-part2 + :end-before: #--/LSTM-part2 + +Note at each time step, the prediction is connected to a :class:`SoftmaxOutput` +operator, which could back propagate when corresponding labels are provided. The +states are then connected to the next time step, which allows back propagation +through time. However, at the end of the sequence, the final states are not +connected to anything. These dangling outputs are problematic, so we explicitly +connect each of them to a :class:`BlockGrad` operator, which simply back +propagates 0-gradient and closes the computation graph. + +In the end, we just group all the prediction outputs at each time step as +a single :class:`SymbolicNode` and return. Optionally we will also group the +final states, this is used when we use the trained LSTM to sample sentences. + +.. 
literalinclude:: ../../examples/char-lstm/lstm.jl + :language: julia + :start-after: #--LSTM-part3 + :end-before: #--/LSTM-part3 + +Data Provider for Text Sequences +-------------------------------- + +Now we need to construct a data provider that takes a text file, divides the text +into mini-batches of fixed-length character-sequences, and provides them as +one-hot encoded vectors. + +Note there is no fancy feature extraction at all. Each character is simply encoded +as a one-hot vector: a 0-1 vector of the size given by the vocabulary. Here we +just construct the vocabulary by collecting all the unique characters in the +training text -- there are not too many of them (including punctuations and +whitespace) for English text. Each input character is then encoded as a vector +of 0s on all coordinates, and 1 on the coordinate corresponding to that +character. The character-to-coordinate mapping is given by the vocabulary. + +The text sequence data provider implements the :doc:`data provider API +`. We define the ``CharSeqProvider`` as below: + +.. literalinclude:: ../../examples/char-lstm/seq-data.jl + :language: julia + :start-after: #--CharSeqProvider + :end-before: #--/CharSeqProvider + +The provided data and labels follow the naming convention of inputs used when +unrolling the LSTM. Note in the code below, apart from ``$name_data_$t`` and +``$name_label_$t``, we also provide the initial ``c`` and ``h`` states for each +layer. This is because we are using the high-level :class:`FeedForward` API, +which has no idea about time and states. So we will feed the initial states for +each sequence from the data provider. Since the initial states are always zero, +we just need to always provide constant zero blobs. + +.. literalinclude:: ../../examples/char-lstm/seq-data.jl + :language: julia + :start-after: #--provide + :end-before: #--/provide + +Next we implement the :func:`AbstractDataProvider.eachbatch` interface for the provider. 
+We start by defining the data and label arrays, and the ``DataBatch`` object we +will provide in each iteration. + +.. literalinclude:: ../../examples/char-lstm/seq-data.jl + :language: julia + :start-after: #--eachbatch-part1 + :end-before: #--/eachbatch-part1 + +The actual data providing iteration is implemented as a Julia **coroutine**. In this +way, we can write the data loading logic as a simple coherent ``for`` loop, and +do not need to implement the interface functions like :func:`Base.start`, +:func:`Base.next`, etc. + +Basically, we partition the text into +batches, each batch containing several contiguous text sequences. Note at each +time step, the LSTM is trained to predict the next character, so the label is +the same as the data, but shifted ahead by one index. + +.. literalinclude:: ../../examples/char-lstm/seq-data.jl + :language: julia + :start-after: #--eachbatch-part2 + :end-before: #--/eachbatch-part2 + + +Training the LSTM +----------------- + +Now we have implemented all the supporting infrastructure for our char-lstm. +To train the model, we just follow the standard high-level API. Firstly, we +construct a LSTM symbolic architecture: + +.. literalinclude:: ../../examples/char-lstm/train.jl + :language: julia + :start-after: #--LSTM + :end-before: #--/LSTM + +Note all the parameters are defined in `examples/char-lstm/config.jl +`_. +Now we load the text file and define the data provider. The data ``input.txt`` +we used in this example is `a tiny Shakespeare dataset +`_. But you +can try with other text files. + +.. literalinclude:: ../../examples/char-lstm/train.jl + :language: julia + :start-after: #--data + :end-before: #--/data + +The last step is to construct a model, an optimizer and fit the model to the +data. We are using the :class:`ADAM` optimizer [Adam]_ in this example. + +.. 
literalinclude:: ../../examples/char-lstm/train.jl + :language: julia + :start-after: #--train + :end-before: #--/train + +Note we are also using a customized ``NLL`` evaluation metric, which calculate +the negative log-likelihood during training. Here is an output sample at the end of +the training process. + +.. code-block:: text + + ... + INFO: Speed: 357.72 samples/sec + INFO: == Epoch 020 ========== + INFO: ## Training summary + INFO: NLL = 1.4672 + INFO: perplexity = 4.3373 + INFO: time = 87.2631 seconds + INFO: ## Validation summary + INFO: NLL = 1.6374 + INFO: perplexity = 5.1418 + INFO: Saved checkpoint to 'char-lstm/checkpoints/ptb-0020.params' + INFO: Speed: 368.74 samples/sec + INFO: Speed: 361.04 samples/sec + INFO: Speed: 360.02 samples/sec + INFO: Speed: 362.34 samples/sec + INFO: Speed: 360.80 samples/sec + INFO: Speed: 362.77 samples/sec + INFO: Speed: 357.18 samples/sec + INFO: Speed: 355.30 samples/sec + INFO: Speed: 362.33 samples/sec + INFO: Speed: 359.23 samples/sec + INFO: Speed: 358.09 samples/sec + INFO: Speed: 356.89 samples/sec + INFO: Speed: 371.91 samples/sec + INFO: Speed: 372.24 samples/sec + INFO: Speed: 356.59 samples/sec + INFO: Speed: 356.64 samples/sec + INFO: Speed: 360.24 samples/sec + INFO: Speed: 360.32 samples/sec + INFO: Speed: 362.38 samples/sec + INFO: == Epoch 021 ========== + INFO: ## Training summary + INFO: NLL = 1.4655 + INFO: perplexity = 4.3297 + INFO: time = 86.9243 seconds + INFO: ## Validation summary + INFO: NLL = 1.6366 + INFO: perplexity = 5.1378 + INFO: Saved checkpoint to 'examples/char-lstm/checkpoints/ptb-0021.params' + + +.. [Adam] Diederik Kingma and Jimmy Ba: *Adam: A Method for Stochastic + Optimization*. `arXiv:1412.6980 `_ + [cs.LG]. + + +Sampling Random Sentences +------------------------- + +After training the LSTM, we can now sample random sentences from the trained +model. 
The sampler works in the following way: + +- Starting from some fixed character, take ``a`` for example, and feed it as input to the LSTM. +- The LSTM will produce an output distribution over the vocabulary and a state + in the first time step. We sample a character from the output distribution, + fix it as the second character. +- In the next time step, we feed the previously sampled character as input and + continue running the LSTM by also taking the previous states (instead of the + 0 initial states). +- Continue running until we sampled enough characters. + +Note we are running with mini-batches, so several sentences could be sampled +simultaneously. Here are some sampled outputs from a network I trained for +around half an hour on the Shakespeare dataset. Note all the line-breaks, +punctuations and upper-lower case letters are produced by the sampler itself. +I did not do any post-processing. + +.. code-block:: text + + ## Sample 1 + all have sir, + Away will fill'd in His time, I'll keep her, do not madam, if they here? Some more ha? + + ## Sample 2 + am. + + CLAUDIO: + Hone here, let her, the remedge, and I know not slept a likely, thou some soully free? + + ## Sample 3 + arrel which noble thing + The exchnachsureding worns: I ne'er drunken Biancas, fairer, than the lawfu? + + ## Sample 4 + augh assalu, you'ld tell me corn; + Farew. First, for me of a loved. Has thereat I knock you presents? + + ## Sample 5 + ame the first answer. + + MARIZARINIO: + Door of Angelo as her lord, shrield liken Here fellow the fool ? + + ## Sample 6 + ad well. + + CLAUDIO: + Soon him a fellows here; for her fine edge in a bogms' lord's wife. + + LUCENTIO: + I? + + ## Sample 7 + adrezilian measure. + + LUCENTIO: + So, help'd you hath nes have a than dream's corn, beautio, I perchas? + + ## Sample 8 + as eatter me; + The girlly: and no other conciolation! + + BISTRUMIO: + I have be rest girl. O, that I a h? 
+ + ## Sample 9 + and is intend you sort: + What held her all 'clama's for maffice. Some servant.' what I say me the cu? + + ## Sample 10 + an thoughts will said in our pleasue, + Not scanin on him that you live; believaries she. + + ISABELLLLL? + +See `Andrej Karpathy's blog post +`_ on more examples and +links including Linux source codes, Algebraic Geometry Theorems, and even +cooking recipes. The code for sampling can be found in +`examples/char-lstm/sampler.jl +`_. + +Visualizing the LSTM +-------------------- + +Finally, you could visualize the LSTM by calling :func:`to_graphviz` on the +constructed LSTM symbolic architecture. We only show an example of 1-layer and +2-time-step LSTM below. The automatic layout produced by GraphViz is definitely +much less clear than `Christopher Olah's illustrations +`_, but could +otherwise be very useful for debugging. As we can see, the LSTM unfolded over +time is just a (very) deep neural network. The complete code for producing this +visualization can be found in `examples/char-lstm/visualize.jl +`_. + +.. 
image:: images/char-lstm-vis.svg diff --git a/docs/tutorial/images/LSTM3-chain.png b/docs/tutorial/images/LSTM3-chain.png new file mode 100644 index 0000000000000000000000000000000000000000..e962a3c720781e37949a0d654e11dffff1b6803a GIT binary patch literal 229688 zcmYg&1yq#V_x8}25L8r=R6t4^X@gF|p-X|GTL$UwZif7y z7yNzeo3&W?Ixz1!XZL>gb0+A8((@}sR75Zs?24?6qzVl7Uj+BnsZV?I@+`sA_BG=wgI0g}J!6uvyx` z9gL0aOxbJ^=85aVR4~{bn5^VeHP@uoF>}Y815~K3bEUiAvHCo0Rir*KsjS_@zV&?( z8T=NnnuzFuGj5}P(U-W4udi*h93}D6Wo`S?C9XefYptb!`(JC))yOCT#%|mE$0l_i zW^~uZR=M2F!+)UfK`%G+kRaSQ*n3KcIYf;(_ROA5*ev4rKH05yOB(VO&Ho*IW0;TR z?H%)Z9|&GDn*yb`3OifjTMtjF@XyT^>2PS~CU_3T461yQCItl6QZTrJ?G$#Z6%@6Rcgne->LcRq+L64YFSJY`{T=~V6Z~V z5+^DeHjI<(8zz4L&hO?p3~@a132w(vw9Wn&MoJRA-iC2zF!cEO3{IO*k08tOcyUVn zKARLYl^t!KKy=G{5G2;Fnq`%pS%n`Lq(I)m}+}NyP9ylu!#>QhOO!=@QP3EVgoP^ zR3ny%Z-EJKY4m{v32`3G42wQuX!k3R$A799rwF7##Xk|ZofJ%apE{FdLCtYH-Xj0B zf5Hgbzocg;r7G#7#JqO(XXv-Y96=q(!#6$w(4MZ@kNnX1pii=k$Hu%fkmhGX{Fy9R z=?9u^$AxlBgr@@1f{9UxC5f=yJoeaN;oWUyQ+*VAcT`hK-k95 zCgjVrY&o?;&EUu;IdTeGWnD)ad(JJ%=S`83&e8Ag2gnLX0vlrXGUuS|?sGiFW zzl@9|2Tv1!jld3wBrP@_WGY=9PMSa-(mWZQuABY$G`|)~axxNZe4M5ohk};Cduk6= z-@pFR6d24Vt*anx-@DZ)-5jwl%giY-b?7d#C4+rTwqbhUr+1i^X~ek6u^FUqdgJ8J zEVQ%tDV!Pn95>1d0=w4ir;Mh!^M<0)pWZrfPgTtQ zu$HB>r;wW8G-$2YY5Rzx$YP+IA(J6>Jv#%7Obb4k>ii$1?g*H1NDz}lvgo`1(TXNY ziM6&p3;jACj?Q~tS8m&#~6dEjXZhz>lQ{gK@ z;F5}V3&YS-0!0h56UZCBxG=#R+Nk(@^~v>ihzgm)7nRp3epZL@hK}^-7zs@qf4r$F z8qS=YzT&g6Fjw+<@0cVuPcM2zqTjE~F9JQRhj;4*bTEeS5Kbw-DqjLWE`)by(`Lrf9(D;JTUaP#^4yXq7WE$S>a5a*uqwO>P~!}6)yq#erneg zv9A$&SPL&oi6}Bb7i{Hw4=0K;jqmfwmqGr4lk!DZHk65c#bssP5u{qYCH0cakIsxBIREjc(`*t zl>8QU%o<9Oo`MTFqN!Y=v>s)1^Pg}HxjDMDJ-!?E2SKNpP32_5F2|yL%7$Ks4YUo; z7CVb9x!Wi&t7RK}+Ct23edn?rdR&`uK*;5N`mu5L-6-7=4u@_b-4(WrU=#7IiBc8s z@T!GZPQ{$utI2hJiHfhMJd#rL?hB3@C)J*$#>`@E#d|)pW=Cw3?(nq`>@dcQjmL0i z;D3g1-O5bRDKNoXU)sAPBDjC=o^bJG!(1dX7O&lm%Vv3|LNC~s;An~PC1g~DCa8Gn zdIE8O-HtivoY^BVs=+s}Hm8(S<+O>oD7>0;>BZV}I@=vQ{(96Wzj;AM`frmBl>PYe 
zq|xn``nrz7WqaiT)K%lMz4xTX2;&IQ+O-%AS4#3WzmBuD;D93;$6xK^uf)BOrAR8h z4zVQjB$+KYck@)>v{~^c<8!RJKRGyUzNl6 z)PW)cqe`9ZukALB{uGX9P5RIEi^2CPL|s2B3L%hOM^DlMkj}srndI}$q`X+^|ost#ucrmf3$hqd2Pf#XNka96g_OK7s%xH zorwa{gC#J!Clt%)okpZ_rE6W2;|K6DLfJJll68@{4vEf=j2chn6y=S!T{bp{n`e{;(o(R5NrX)Y z6s~=`42V#^B#Fn?owrunIm&lk{E%s(BD6V9o1o!AdeTWuFWgBWcEX-%ndobS9=^%e zbR8Tm;#ni5D)!;k^7@ga*ehLgU#L^kj5;&c@g5oaY)rJ4XDe^FcCZL2>O7y<_C(76 zfD|AZ#)bL`6UEALO;oKyh~V$hq2A|LR#J2@f}pB!xUD{ZbYcp!0XWueyBg$vk$f*h z+`lchQmPUk(pXGdckRWEqa@DV-fnLGcks4iF&EQ+`>4$~DTP51cBBojv*V0~MEH*1 zSV3=+IIW;epv;lF<#aHVq2pZzMTbTV*ZJwY;|EtEA zbW3zt!{giB?EDrO@?ct@L+lVfD2*Rdo5G{>YM$HrN>77!Ra?4dB=M!gd@>HPR5oLF zXUTMzbY-}2ODj>hQ|Q7MPoMX<{GCwBQe1zPG?y>P6`X9S3$a}_4OznW#ErJgp$H0@ z4m#`Z{nmh7$KUa1gj3irEPAgBl#h(uxOA=H3#om-D!Bi!H_lh6x-;lw$m`jBG5Fd7TT`U!W&D44!&pJpQ1t4G8oO2=cj4$c9c!1> zj17m_u!9{Rjc>k+HutQ#z1x5Ik5`V^{t9xKNZMsARd+4xD9e zxXd4%rTJs1JR-q47rD<`_5|_^nJMECw=0Vq`T9Q`P4(R-eYkVnVuQ1>o2v|JQCUIZ zlUv_C5+g}F62hvq4(|ty})783#p)DqF(xwPz$G!JJ!r*qj#!ezNGVqiUO+Era+YLLBL?+D@S zHCdmWE|-!Ybk^A3O=f@jGjIl<{XGhbtvefH@8gbtc=$TxA$=-nOqyI4pv+(25F+;57jZ>l9{QF{$wW?Z1qFGJGB_`%xKW=@d2pQ(}>mi)BSbRbQ zM+Y>GAbxP7>}d@aJ1{fP@k1)YKnzH3gSY5@r$-1}m_06wafjNZcII%+plFM4?z)S> z%gKbT6%7*i^;;@^DoJhfexL}JWoy1PMw1ZBD<`;;=J`_3n>hB@2g{2F=GF;_?JSqF zh4=Tbj;C&=l(7W+k!qJ6E63O2K#nyV$2o6P&0VhBKPR}p!u9M58?(hk9&tB`=YUQH z-KHO>bpA0UAcPz$-pJL`Zpov!^Nn5W^xN3Dtv|`^?vMEJ&dhhGE(+;w;ML@ZGy(W= zn?-i|G$&zHy4Aq#e$SMNJ?~cXs#dflRp3Nr4gOZ%4F&NuBF!wM0!F!@2Ddk(rmL~e zYY%$ckZxVYwYf}C9m9^j8%hpECYsyE?yzv7fnjc&?!d$pXMvY?i_YT%qv%sQ+qsl_ znS(y)95Pv)s3a`UE7A5jWOYlHg1mJ-V=taAwgQi=>~$M&8}nVz4Y|+Uv+@zBj=|!# z@iMFqW^R(N4hm1@6ifuDi>v4#%V@$YR)(k#ZKf#3Ge%$MdyRA|K&QV>6T+$JizjY{ z)<$mgU|j!@d~7z=$!O=i&Fg>m?dXZamWz@p@oq6%$>E>k1Rx9aNb^@cMHRSg_FPe} zq<$Dkt0dUS)4=u`R43r^@O-adoeEzsQ;P~J-gQzV%^R)ls769Bx8PXKPC~YMlb9l*gkEcRHbq4)$wW`Ukgd$k7S;pbv}Xr zD%M)ZBS9#xaGS4=&207g>tA>6nv;2-a2Yx&MV`*H-Dj@&Y3+iq>r_WSjayf;f}GtN zX?A-g_9i6AnJXMJZQQ&}KP%eXB0_sp^ENmqSD6oymZK@x_(az7Pu_7djhNE|6>p%FGv+ohG^wv-w_u6{lg@L 
zWy6{7LaMsW=%p|+CQ|TuIn$i-q^!+yP#$RWw(OI@#5oO%+U<#GFZz3#qH-#W2&W?F zIrrT~*L?cvcLg8QA32;dmI=mugeh0jJclHEvcWXjk>{`YhHoa4SL5)m(qhibAGb7I z))&-1;?X$^gk2a|>9}}JoMQ<>uLnbS2F ze6w1iY>1t}nQ^a&amDr6OwZzF9g_a~O**N2-^yp?niX|k_h3T>5yR|l;~bo!Qh3Gg zDBYiY_ly-cqNv08*Q4%DdP?c9#rfi9ApOX|fVtrmTifebSn;e)PZN|KlsD@vG4VOv zV7jbZ#Rmxjc-jY&3wI=#O&f+g&fuEw8c|zPPSn6Pczv|qEtFs4-XF_ z4Y)n{UBvHv`p<>M!mTmM)dlqFFrI8L-n|@NyN6EPs6UQE%0_9I+IJkXnYB=Tl>JZ*Q#Xl5}%9{ag*wbqZV^W@G2WNVo!f+xkZ_LLv zkJ94v&2cLSuqR7UHm)TmE63f6dr>L*8M||qUE^on2V3v6$18S}J+!Vvr;?DeReC}= zLwzf?nyX5yo=m2YD#|I%=Hm5ZJiEAgH%9Bn{j0W2T$K{YZ@+vuzo*mtWeDRauyFm2 zTHadb&&*7ZX87mRW-_gS`@X@xLF>%W9K0*$P; z`x~?h-=vY4B$4Gm1)_&6i$>fuZvMrKE70j^rw=t+rx!D;;!IHoK-$FlHY4<-EG^Qa z7)Lf+y6!@*%3WH&jgbf_>CV)&vL|JxZPQ+Ucac{lpT*4Fx~DgCb5#4pac#6JnL?DZ zX^=Q06_MHWb64$FL45n~n+~@{EE&c|4qn@(PDQh;_a+y)Ii3l`U8lV{v%9epa`_;l zZ^TLX9?sjRY;2&=Y0AA-Y`K6BdgEUOUL!*;7VKM`O%JXaM5;8&_g8yAN*IJoxw=l- z2tn`dbXPPk8TB%u;t}ZKy3>e9YB$%d(f%|GSHPNO1gemW=HTZT`db=Zs0oi;8zA! z^)S+wz>B^%X&_PK@PVG8MSposzn$zI4)690bY0Xqgb+v2gw}Q}i`EELS4Pfdh2O2< z`EEpd57b5NL17tma|PzMv!FlriY_qxY2%pEZ+FvJfwrs!3K4u-G2U_|Yn(C-QSzb5xfX`zWf3|+p;oyXK0$gUiV(2%Ji@-sdtZ5B)3xvOVQ1p#ZsPz0BlEnFY7vWrw1BNpwNUMA zxoxGwN5H!x#GMNI(+U%HQA+O77RV%yFdJhUopwpgnE z9?*?8%xnm^lpKT{SnB&^1Ju$~KGqzB3@v$UzlD>lmqwtZllhC++XjKzU+8vQi?R_q6|+7Il53cWivVqY77d~KuKb>sUF4sz)O(warD zsZj20htk2dzZy2$sK2e@oGz`(`rYRMJk=elP!<>7S|&Chu>5sU=lR)*f28~3q;K_0 zdGtYI{gb8HPOk;i+!>V9PvK=6ab1yKuy4QV0<}!~wrLw6b_`~UH6KsZt?Xt0*&9J` zq8Hd57Ge%C+-2;b0`AFM7wFIteh(SBd0KKA`o+7V9OwClUO?wXO>?ZRkK zX~WrFcYZ^nz~fKm!WBnW>Yr0Jg*3-K)UY>*t!tP0IIXR;&>-}q(|=^d2Sa$pyybs# zhkeaAy!_qOOT1pSWIPRJs^&VmKYqH+lj7+TKj;=!=f!N2p!?=k&J4Hi2qn3hHQhnc z4PcKE;?dTu>!z%W3Ec}yLQ5Nr)ACQuCUYIFyq5<@G(fHY+?KYzDZk48I7^fvlg2)Y zZ||6JcSE2B{;f)EAX{Z3yEVN)toXvQCQRUnu5OW?5E3%~)Vi2XAwH8_p6sy@fO39y zn%R#QFe+>GCp^}wGQC-H%cpz6A=93FFKci|`EXjD&C&r+@l9%SrsuCLrJIFbi{{v= z6_kwM@y3~Xp=~M@jBDDCEedCdZaEcD=_)x&3<{NJ4!$VdOTFdQUMu0TP0fDC6?66+ z3lx!%VT` zkb7RM%T9FyyqZ7W??ZFV7?5#pVB zGsvAEhTXDzL`X_8Mhm=v2C1+y91r- 
zdQu4I5AnIY89d}IF}>cGz14d?1a96=DpeWDi{oG729GFqMBCs$v11wz3@%OWSv{pH z)`JwM>Q|z4Bx4Sf8&PND8`C=R`@07}t?XkzC+LCHa zo0>CvIVN%Nzr7(wRnm1^iA3vq05;NJWY+JQy6_tvM}G76oaV7Zf1hWn*wsd;gGX9o~p-ti@swnw`LZ$T}NQaj{?w8kx124M<-7VEkrjy8}wCD$F#lb929_kl$7rMfq5T>1mn}8ql0-*gZr9| z?mpt;2fbdBmrfC=JJg!4RTC>JVgO*H8uaz2b=OP(#{~$Z*H(hi8fzow_Ho1OoO|uT?{!@vINAu7OQuh3-)Rb=RIkCzTyv1d*oY>)^?c> z5;_W;C^*uOJ--Ck{aRv}C=Ax8v9HqWjKWzt1%71?Zd0%;Z@#g=fFK2n^Vh!Ky8y() zA2;(9IK?V=Q-r`>*p-)ZE?SrGb}gmr#9T&TJUoke_cG!ocYeRH!51a9Dmkx0WW#e( z%&MRtTL1y>|F`CYQA>`;9rpa)ap7l50_jCJp;`ly5il4M9SppIxkwPg_ z&$WDpsz)763-^~WZ|&FU)=%7I{^gImBbD9n-W!Fq?hsNBzM1bg+XpSTYd+pGRn;9= ztulY~y6Csdjzlu-(KvvxQuV*P>Jp}=us^xi2k(rU+PV;F_np=?8Yr-+7=p7#s)l_s z;yQ_#Yf4H>0w-Wv~2vj+h)^N=-)0+Tig>mOO z-2yFC%N9R7y);ob^F==DiL4*l&n+LW2a!MaDY!LR|2u_oZBQN~Ad|jA$ zYOu{$mCp}FMa~C_MNPMs4K!=dTmVGa)%)ig^T7GY!IUa*g=@tRx?wR&5Fa9bH@U6U z&PvwtR?M1H@4qbq(`V7dox8B)1Ou61u8|vuJOlr;JH84A<`)mc71^4+4#io-eOZT2 znF2JpmP9MV|L1Ry3Lg=16Kix#t#unc1@)di~RKAfb{V` z*g<0_0vAI4onw8G_Q!(bhr4(%U^8oA9_XwN35%sM$+pAYHj6(!aI;02{?Rz2>qM&* za4Lq52`tEnX!r}T$!NwGoWnk;F+BMQJluW_@BE9?w;hC+uD1I_FmV=&+1<^8RJ&-W zJF+HP)V@Z8cnccU@88q;V=lc!g`dWeYP8locSK z6)J@82QCiYz1?8rnUE0kMm1CJbVlz840lnWhjMT_F{t95YTe|I;l;3B1kuAG>E>Uw zD^PhqqBR>IIx^_?NWk0q0-yghQ?4}e)3|0t;8`EgOWtsG(oO1EAbUBLeif|pl>~w; z-O^#pWcat8?#8VJX19N~&W|1j!%ot)>7W@fT;Egu+G96VA+qh{2@=czM(_t@K)59E zHGSg_@3h&V83AssKw`w<8JrdJcNKmsY!%-ua)KIeHQaRbOyMpH2eGeeTTeWNmkBfq zDoobyeW>$hUn$GC_pC43Xevv36%~w(?d%eZQg>5k(aOG*#{g9^cZJp8TM3G6wmxS> z6DKDuLi=aOSLZheHyC*Z*T1`^%SX?F`OjFG%c%Rph7W$)ge$bOcd?%TO`^zM2nbP z)ZSC|Kb~*&{MF&0yN{fgby!QNB3m`-jE!kNw+XqMVeuFY9o+;cy1YgN65Rh}17wc= za>R_A!y}$aPQd%F=k2NFi1T?9Xh)Q(9F7>DVN`CGgjTe+_kYvLLx$x#Lz$CMdniHo zXOw&f4&iZe{+P?^n6pa5kyu}!my5%Ad%;KQJmivS6?CpZ+{ytHOGK}rh|kC7|O zdQ#sK%zLw5sZ#y1_}yqbZZaCpyzMBuR=;@3$dLgB?xN7AqVPIr>+jl_gtHb^!%CM$ zsTpnat%0{o&=3f=z9Hb%wlUP>e%C42~4zSLJn2V zTF5!N3I-$1@vA$wugJ&muIY%+!=H|%4ls_4zW%}J={zQeKAGpvLzY9Io{F^Q`y?St zpjGC?Q8WlrFNzO1YobB z)teJ_1(Uq6I#u)W%PU8yf^XIwB&7N>)c?>4(9cG^JDFr 
ztG@5PON3C09ex)uGBOf&U(xhw6k;Wg?L<(CVxKJ8MD}D{<^r`k>>%;cAb${n(g!hv z$ILJ9mfAJZ*rtEBnZKyiG#*j;1YCca%iuCN8!1}E)$yY%mkkHt-S0@x>rUO?U>mqNvj3ijC z+KDzHpK)~Erw`eE+-rV4!n63bJ*3pYVseHJ1uV&Dfk@sV${pgKv&JpF_8MMMd8{MT zCf&@b1`B40SOC~0+KGlCTK^^OdM6v4Cn;AlhX!uSh%vUOIx7loji!|yZU&rh?Q9DG z$op5zh?0#3XS`~Pc@v6pm&%!tPtTkAVDI+J7xpzrd)*jU;U%T?jj^ul%m3PL(n*pjAe=gteYQR2e%%^KpVC`F5@YbztMDxi6*^>5Ia7ON5CuxiVml0tx4vjVR@PTXk+KELROb5) zkqNQSDjmMb`XyHVS&NCURbyg+DnjEP7VsPxll{TY2F`HT#?Xylhwj|01EwowpuQ4UY=59I2_^xl8 zO%^GgJE94mj?7*s>Jzc_6xblo?Bj*6JuKUKC-^UM>fo>9K1||2Tv{a~_KIphAg-G& z)T6FJAL}84yAyOp6S+EdmWWez#UZs}_jcEdru_->Pwm9KP-J6E0BDkJy6srU1!99W zqhZMRV!!d1ErmDgepv_;uV9y0HcKV(6;hQs0HH8JB3T+fZZ zBtvW~h8{)i^>)F-){bmIkO~8XrVm>ZC3|N#0s(aLV-SOsiP9y!=)}&r2`N80ZI%eo zBYf(fpIptf`wYg-3{1@YF+XoXrphwP1oJN@^?u?&1i`Wa{OiT&V&iVK)r<$}D)ybN z7NgRQ@yL8{=^rYMH$wN^QuL0UIRGS~l#WCXyNTAN{i_)gkR2LZdRn3f&yVM?JhA$qxi!eyVF{#?`nyoCB}?h)<88g+fhhMx6GPWF-$ z0DN|OAUt*M*SYXirp%efehApF5AT8m+DdClEdg--MiwY8N<~91zsHJfFm`YLk1ij4 zW`TeKj5J&9;9){77Vqi{6!x-2g|;hi{DDr5T*VvF?&6IeIwr533~=m|ZtxKC%ie>A z3D)3uNKTO1ozT`fhW{c{&g=a9_K%OI59!Z0K-qx+XzvkgFmppgyllApqq=3Yi_UQ? 
z*Tpvgsuq~Nj(G$cL9k(Y0`*H<&S0Z1D{BZq(r$KkW|Sg@=-{_db#P1&02Os1GJ zLatcVG6CtF`RFduztmG-f?nrDg<#PM*$X$AaX4=qhtLZ)DYtsAth%!Xg@)Y+RI4&E zpP=ZU-~JS$HxE6Y1>XvquPzZ>z?{?-Bz3P&__XluhYR?ev`l@MfaRU7C_|-(V}g{p zg&5I=9W`sg%WfO%5BB) zgImWN8(oEIowt^Ds-Ribj)5J|~H`tBd-k}VOJFB-*Ec;~D&-;D_rZpD~G7cU02|NXl z{iBw5#t(PCYeddV|Bh&=-f!j4jKupeE071N_1#wrUk^VnC7PtFS>}26 zJ3$xTKbusPC|{~4AzjTGUx-TH_CxvhWj9IP2xjd9wlONQF1@S)hd2aR!B~gG7*OSy ziDxUzgx#(Xkdx7zAFtz7g`FSx7m_jvKAb-U)7)HQh%^w13_dhOc_?M}v$3&pxL?%( z`hWW#5K1)(|Fmj*c(s^RCOHHhe|gs7_s+|)cE{>^6nSy%6W@|NWc%sW3-ZtjU_#x{ zBvu2Z1IM&6H2?C>x>~YOKjC=WmA93pRZHGd90$JUF4lO_Il#<9Sn#c|<;?QO5KVfz zy=PQxbsNIX#v3bKZ_h*sFpnXy(89|>q?eB^!cwCi7Gn)^K#BsTG`rf=L{%14f*gdIGoRH?-ab=t=Cxe_F;ws6SrwG zveck}oz3m*WgY?Hv_F)y!I!KA4MsL0VV&#@fb>Mx`mDLVA0^0B4pUI`znIuhndXbU z32~#0|AgdqpO)#e?z;y3IP!fMg_tKQ`xoA%A`euR1_qMD*Nlui{Ob?%kc0-+ZElJ} z4ud>hwl!A0X`#v`PzrI+e|4q1b3lO2dL$X5mToP-Uj@Ll2!V4%%GBM*6sbIIae4K6 zgCt+vYF=f=90SB|TBa>Rw=>@$AIsKjzqkxP?tcAde`Wb>kTaB7BhrjRFgN*`R}Ont z=ocVL#is|{dE?b@=_D#Yt;@D+3ljZ7qHXph9$#ePtAO-rNZ7*7dn&PoK!uf8&qfGby0xFxAJEadozy;%JY&8%)Aa7!6SZu@{j{Qr>!F0VN%H zM!SlL{lMOw^(=*%S$G!lwFmKF3sxrVbcNvhzCesfeLh;->3YRKtSoOGkJOx2ILR?^ zj$RrE8@fR0-=a$oV^LnlFefjB|=W5pkTv5!iB z=qy!;d#rzI@z|gjwPurbm18%i>d<-) z+jcJ8_Zl1O+GUOYv_t!tk)tD<*LF!E#akKPp46dzB4W%Gw)-mO%IKUv)rI_-(8JmF zs!B*`I#3ct57>Zqn6o%`w=$*Pf4+C}iGUDd2{!y6>2iU$}=m}y!Jl6NFm z3kt!Kh;~W`fzR+gt3-W(YsOjvQX0Ui04ecaYDYrbr#J%FN4B`yI`D&XO4+bpr3-+P z$OiwGz)d>0ojQPTeQ3AG9to=%Dfd#Nx4ps^B+hr~5G~m>9c%aR+^oxC_lVPeN>p-1$qd_{}*u*s*wBAtok8qOu5NEr{(`f)+fB zyhykVkKoq#J_}Wtz$29u<)<>33(S@e$VbU;`GR4)eD{}y60h!8nZ*R+cJzr&2ux}Tr>iuzReSX2z?ER zX?7P-`l;gaBn1Wvmq+88Z9HPZ?U{mkq8pGnAtH2a%CdDE2YgM{#_S?>^caRL!8%~~ zl9x}}YTr-siGmsZJHXFv{IkKlxi}&LrmZ!Kw@vcB#{W?rk3u+&>Y3|rD(wMUUQG@C zSD)~wCbgkIHw6K7;n6&X$QgT3Sb|nUJc{DKB$WYfa)*zvOU-~z($EKub)RsEOi9t! 
z{lp3%SnzCqw?UWXuo~Q&{vXeHkrOpaTD_h>UTROEf3ku5u{qX`GseeFcu5$u&cWop zW2V&4qzShLD?omHgAEl=X~^62dnAci$H^4rCr}1DuxrA!e%KQN>T@@+4n)F!5pv%i zEZ}k(*Z`CJHoovwzJ9iqI*Kg$SxwFrU4=RNpjJYNJ8O0-dOy>00%t5A+4_$F518C; zB$VI-VDvTaYWI-m(SSYJ6pfr<%UJh#%Ue?cQNkleJJ80gI0r)-yoWIjVR=5^6&zaA znGG%)6^d|VzsMU<-UUQ?;S-b>z#3<{*QDTUA~vRxNtY5QVG0m{2JW+(I1}&x2QPXCv$cG=Hz<(I$>ZH ziD70EZj9a-Z?)7W;;7d?E|vemKyev@z_o#Xn!_7et7>FiMx$;6J{4e61u-bc?C@5P z4QeO946e_;n8vbI?ei7NN7`0UUQ{wfgvJVwz}2p~oQbgS@;G1JncMK`J2iRB_G-*|?Km#a4ycd&JM7?b^bQnaC>dQ6?t82S`MBsXUg zMdVP=Rr%7Phu>e?!?jkxfy6qz`e4Oc2{3Z`bkV60!x7w38za{6eRaOa49&B}&h|UA zGtU0gh3Aj0JbNsl_|N#jEllijSV6a?{#cGV=%gbYg^#ga-eP*@lc_0%Fr2kIhfUcT zY&ex#@N>jv;cx?iino}gog7Y@=gI1QcXv=kZiI<;lyF`GAhSlhjS(HXCu86<_?0^F zvWm+plHqxCLZ2AE_8fO1-~idI^M0acTTxc%)pYrd`3shEo$`MPUJdqtW|W)!pJtp{7m^1)6BKwv9}Q4dl0T+*-k50Gp%-ofyqW1%{<+f) zGGA)Qza$|V_qA3)R=GAQHMy_a$qG0cryitVyQTQ9-DD`F8LMy+Vppc_Y%a-|pFeZE zXXlUHH>UV1D|(3)5CP6AW4+p)=F^*@oVvrMLf`^T<{J#v`a7X3V3O&&5Uk<4QxYd5 zrzAY!NGyyc{2F<9v7{I$N*7B3ciJI=!t6JgBU2pcA78yGr-5J|wUpsU#Pf-HMGzX) zwgD_YGXdP9vC8-A`*)qm?R7{6p)1}4cW}K+UfrZ#{d}%X$qSI#RW_%#4M83WNj(!* ztxE;B9OP_BwIt@@QW`hyxVNw_v4St)?&UMH{^w#!KXT>c3BM^u?eDJsO(fQKW)yrl z9226HhkUGG^C{e1X(};QtX_SxZvYE| zrx~p)?J;f|_FbQ?Ip?DTZe)QWmf6YCO@of(KxnjUws6b00o<`G8O9QE{U>);V+C@< z8+Nib^Uc!D_OgkO%CnsKw0SL7+K!)#+@?DlEf3ME^Xbkk5i?wwNObU6qe*?+RRe`*fM=#e-hlr0Ng9&qs|3DPip5q`K26OI|sm~Vuy|WQM$_O zu07hvZdj;`&$C=@MlXls#Lex;Z>K***e5=+=wB4p1}WzC4*{F+>s%u)wo~AuA?I;8 z{h?)VS;dg$7X5SIINx6M@F`y03!=CG44n(*h%1e=FuNZQCdgem{Yku`LOqo)g_bpJ zB>@Qr(}e)HPZFK;jC*t5LpS&8P6WamWCN5IZdCb3)Q_Ntb&)wxQxkX?%sG$!BvCH` zYzbst0Hu*yC;rR?-t#BhJ);{v4epgrmBkQi7J-KpB&Cjwk)Qvdb;WfZ)Lv7y3d{TYsn9kpFFWQx|LU7?Vf7aeBR^04cm&5R@ zmr&vMw)F?n)%J;P+F(n&fZR=XiF`RHD9sI=YXv`Vrak`{^bvw18}Ac>+l=1`8R%pU zM^f^^ZPwT;BZG71tlohgwD$~(&`b++xR6QT^J}B*|J;FePpnS4FD(4F%``{ln~F8W zCGk|SpME_JxZm9;B^ESGx0e{`TC2^^x>KP`zx`oXti~%+Y6uQy7g8fgtBHke^2Z`m z$%D=>Q|c@(U?xxU8sfg_>b6JRze%Y)KP_yK>vB`N+L%Q}|V*5W~Rg;DML>EBUvaekDa3DViN)kr{Hi$!kJ$0rS-Kk=D 
zk7G!?s{MbrzMCk?adz)Gu#Ug4*9ksX0{7xRBAv_X8X!vvEMNKy4{^sCyjo87@r+af zZ@dg`13jDd^4UpmIWx>9LoENt1)%vHygx2Ze5XVCB`+2|7I{7Z3ZkDvYG~v^#S@9s zPij9&rQ93T_7piUXwo=h@rM?Xspmkw!%1$fwjHPCZ>S5>RGcqhRn14jPm`pGK3!Ue zl0Rn#Zcju;+ezlh=abCvwG8a)i`*z9&V`D`6^y7L-5~k%sJ?v-9O;aF z^BdAx9!vis!!u;vHvT<%zB=aSsb}uReAex-5o6LCX3YG9R>(fd%al-7=Gn7nw|-My zFU`19=_06SAtlep)lo>&|4ix&YdKfl5=UK^V`Y4oqhLBU*H2pXtq1Klw6$Zes@(Cr z{%rNCj1^p@_i?(6;6lZMXMSVXx96!lUfYKZd|mD%qf;Yi#*qh% zZnlvJ>gs!Qq!ZzycW1F-MI`Cb{ZYCp^Vr9$Wn5uXPso@t9UUW?=HurQ>guUBwn!Mv zZu&vGmHc)i1I0p1#Ua|byd#AnwR6ht&>W0+qEcb7BH{FC;(kw=-QSGYUg2DKE zf5r!=Mw>9S)^>FKGG-%%!9+N@3=9%6@P#PZ+L-$btKsU{S3015U%tdAa`!6#{Xh6T z)m;jhFB?mG-iFf^u&d$EaX2t>AC~l_KPyz40`GKTu*$S(gma`zj0%+q8y*byDqp2- zo?(MMo#deM77RA|i7!S)e|Y7d=Ix6=o(YvLP}ttqrvU5a{#}U_zT4WpTX_{29!t6~ zOKY9XHcF*!SbtFB{1K38B|glTT$^PM#juf#akPyj&doW}CX>g8`Ko6|Bitgx(=n41 z#EhCmf(9p(n`D^=Hsx*maI%4xcmT8)!dU~F=xaqNqwlUh*sHnC6f185V8bu zmbtGCKB*>#5k>|w2zzz)<4V<=FjyX2dNfy*CsS+7y@uM@*|#}4bn8m$KnRsFD&Fj^ zW%Q)7i-;C`Ylyz9N9ZVi&Gx2~S3HSFyAGVWNe>EWW9< zsXFZX%154fvY1L_t{BbrLSpWeV*wPrFh)`z?p7&v^|8TUkuaFy086@V+-zYSzvsQy znVg&>D}oCR=0~f@Z$~g_JlvdF)$ybf)81N+6~5 zTA^0;=EH=A4o6dur1T(qZcf>zH1-Bd*7prSz67bXu3te&?_RGOcCJQ zR@znM1Xw!VFiXu_+se#t&(zh)*ZyZ+>_F@@o)`zf3#?5hDU%9UrCt7bTlH?g}NH~kyeABONf5if~=fna_dSuU`2xI(bAFO%oTZx zaVO#G>ZdOf3z~@1!Rqx-qE*lgZpPH?0@3sR&<3u@s4UBlkD}z!!=55Q6QSM@)`-g) zTFIhSQvRY=eqa+qt9L6i3RHCtRy)kIsDWiIz4_Plgq0%`%_@0;$eOdF5pt1(rI_O1 zi+>CLgH5`|sC3C}e`bIS*l6&v~j z$AQ%oW=Hoe?X7{xg?8LL+T~0JVJ=L9Wp0>(UPeXGH8CJk_l5d^1Z_2NjXX`R;DuBf zm5oX3+L+m|K!zKW;KY;fUdmy17|NUuc?*GY@6py0c*#JnWvnL0BI}%9f))22!~Le} z;4vNuajl8{Ly)zM^N&w?0PzuiiAFpZgw*AuE;odJf81jZSqr~(dh~|UcA{S8m|7(B zEA>4xy-Iqph5yo{g`%o!kzzwOdVS)YViU;PbGv zg~1ke(xWG2w!K6uPhCJT9TBPI(}V22zV8&_P7Zlo_L*e(I!H~YvlRV_kPMd(m+8iU z_K#Fp<~}k^^fz2b$+N&cTzx7pkC0}WJC#ito_V6Lp{`z5CjXV-LJc2Pg1g42>{!ertUH=ki>9=i-a~%mwqX_S(Ph zwTB%Lz|mDE5$)8(^QPmlPqGORs!)m3T(H}%spM@3sS;=HUOn(eD>)iHjxdqE`Y0M3 zSYtU-e$Wf&S#+Oqn!klL#H3EG>suT@(b7U5{#zZd(ena^U=gcCR`>08vn1$f35~7G 
z0BMi2&lw8c{#R;Jiy&9Wu8C$iFkHPqPSk0sRe?0765UMQtbJhTBa5 zJ84errlNl?(yi)myvAp`-&a*|l1mt?!K1qSi6znqIsDU4k*Ax~Y0ZTZjk0LxX(b96*bi3&qdW90w`g1n*f(#HVPxq9M zl>!3UJm}c7Y-N4t?&qso8V=06{lgr?j0>E2@dClv!rg~+3_z;3UhFC~l`L{Fs8*)* z`Ze(Yvo8KUcDIUUd)19zfiDRSoSt7UG6b+Buiut%Z-GVUpgun9Xsn>XXmXv&N(QIP z%N#jmY{zj%$nq=9iXDJA0M?&{J^5?HtGZ z#J6nd3cI8Py$m#^0*#A0ERPo}Jp!KTl!OF;H)|@r%Z96BoKZfpSYu`9eg5rNfb=2e zMnK9=j5y6*k||7hIuSWE@p^p}Y{yvhSg68r*n?cKaO#sJlbFa1B?sv;@WA5d| zURS;={7P%AVhh~OUQkfLR@vv}1&h^)5;p5;qyv6Ax1fMH-X~I{N8>#^MPlB_XPi&_ z?^^MZ1>601?MZ1xnegR7z^HbPHhp z-}P-9XSM&k1`l!J+<({q(UbnW^~oIN|9jhe=dHN`+ycGC0RQz?-SCPG{|`v^{{ck) zZ?fT=M}ZMe91?M{d_tTNb!!hR;Qjyq5cv<{|0MT+2mPMf*g6h3EC?G{Du&nbb>aUH zN^YbP^&r>V#jF%&Gy%l5OVz`u`a&vTZ%Dp#bgjB$;%H@60X|C5;J%e^Z)`qj+|i++ z-uv*P`3hvENrP*j6&$>rsdhOu)4BGZftHq$Ua_JX=>|+e$@hh}ujkS9x~_fs25Pg8 zv0f)xV3UjIK3s2EIe@{b53RXN%ZN%w@3ExB*y^Frb6E(a9#TSdSr4`)zSK4!P*Bmk zti{I&oGc>5rgFB_cZXPjqfZLn_Sl>`e<`u{!9C?_j6?q)m)(8=hv0v=%KL9>IT-An z)yF98Hc4ztPMKebbt~}OsHLMvz{CB^=!In2`#)$8sH}?}&%9+n{GkFdx#P9X7$6vM z*w#QzkDb|We1I|XUVbCT7URp|GCmM9!}ZPojY0W?grw2&k(e1_tiOQ+aCM?Zkq;6= zBomq0w*z9(rEY%Tr!B5$H$hiv$rsrIY3$&MnwCH z3>O=kKSsEPFN}RTdfN{8bJ7&i$6sYmiw}9lEzUct;Y;$!Dr}9h>TZ~#zf89eAd=MB zK)4(%A~L!}(bFmsn8bABxVy3f*vrv{_ z{~opKeZx7)P8}wr1ePU$-K7WfY0K;TTy5Y2-7dqac@F9y5Tlr|J1;0-9V z!EBw1J5h?~@yhW40Zw3_OtNUrVZL0#hq!7melWC)1s;VQKMH^l8l5YZ$#04>4rEZch}=ZxDxm`;N%S z-v>E>GG5=iuGidr4GxGp`vt9~n2!3io}dA8u{}QE&0lN9DYP6fD|ew9&rI6uz58ZLDtczZtCfIZPH zGB9*!jII6Qe#-h1YYq!*duTS~i30tE$9+o5a71ZXXxOmTqegpCDXBDJOZo%$V-LlP zO|VDH&;aR(k>5>c8d^p_`{eKyB;&Raz`(kC>igBBwkOJ1>>D+5h^v;C)?@=_0oaB0 z{UVv;mFaAC9j$@_G1JoALKVg{PcLkpM=t!wMQtyfggw4|XUJeAHDS(Mvb1!}deZx( z#&*)#dpxSBzpJZD=%fQUecMP*)hYclU>MW!s z2Av(R`^A43lB1!!+t)h(EleISFv@e!Alm%0x!q&e&|~-o5fQbqvajd%EM21Lm(|r@ zHY>z3MxmXswS7geML-g22c(+%-Xk=>u(ZCivkst%y689(FuD{OO;!tvF`wK+4XGLx z3gl2mxw*MfdF#q?=tJ1qI#j|V;G&MyR34Z@?sx9CURp4A#`Sd(`-wz)iGhJh%e0uv znvA%%w(m7a5=a@{CJFqJ#hW)w6q{ZghXKdUz6V?Cm|8I|2N+1JKl?Y9!eB;Yt;qv?N>oT&um!KE$4StXwy1=J 
zdumJ!GGhjgj|Z8Ww|bCZXPKT(F?-%J?cU##>+PyK&Sc@@XQ%uF2bTiQwpSlZ2f-L$ktgkGnW&=Q8U z^1ajPGUq!z*zTQe@~N;yr2DR3@GfBw{Yz+k#SU6~6O`l1Ya6W(8R*%+Op6 z8VM^h=sD6aj(?u@)qAt+yhf=wzSy9~;`Crs%zQDQh9UiG6;S#4d6QF8Vu&bFzZy@t z!?a#0GHR-OX-J_ZPRi%dY!?^(<$Xzze*SGyNc8vU$JQVW~3XR7Kk7FwbS~T$#LaLwT1} z(WnL3&Dm`sbtEui_Nu$aF*7x>JH!oXBKIO=1#2HnHF_!6WO!*0O!;fq*h-^j=pif0 zC=z&|kdROuum37I)SupfJ@(n|ej6?2T@;j{9ygkP9-r2N4XL@)?zF0p^9Zh>h^fB2 zsZ29RR!f#GZF8&HX_0fX`MfCAtwV3J#?F9<=z|_4@M5&&ORp@@Am=$h;~rE-i^So@ zh?H1am&lb7t+;ORPCQjr?)}}C4D>1B-g*Dx!>DGQR0wyM2u`OnjvWZpV%7>v`o%0W zrYC=bJS#f^V9wx$raf*AyAaPf>ufPzlRc4u`E~-WK6I@UJZS}10}DIDu;kI(*>bW* zdNc1omttk56}Ih*;b~#Qr1|()#)yIAVe9f;<~8~G`M#^oyvth%R2stXVoUO5r8Zt% zA%mlv3%ug#Fkt0{=_5rQS)BV3VL47?v81=#XhVAykMfHOCRQTE*{2bbT+@h|^lF=g z(KAqn!-&&6CvCo*UrKLq*`}r$u4x>n#AP94)5p#&B;LmTH$EFO)Z^4;rq9Ax0<-6 zrm9T2`|?FxgR9X-WK<|l-)R;7dAeJaG>mO+1-xco6vsvsK~s7&9KCoN&^t8@_z>-E z`%ps*8@9ogSOf|?IpeY|m6V#8C}ZI*9uuQ{tw9oIp^$JnG|seI54?gt3`B8QMXIxb zGVQ{pVP&4)7$CcO>CV>3H3G;=wm&JHZf~h{CgZUAQtF=u+pWA+^fv?Uw`KCUU?msq z!Or4k08^%>)#0j6a#VKtbRHp4gXv+1CT&_W>?dh}BzIK(K|(MvI(gFA=;K!6%ZEOU zvkkEcGX{m~#;3~}7frMo-bxLrmmXkzabB9?tlv&tB?m_XitaP7Q@#bh5k!5rWZK z9$pa%V7*K#S|{dFeam2L>yvx?&td3Pmx2B`b#Lby+u7leYj_axJVrSlVpTP@0WDbgjoo-Ou}`XD1`4tkz!q!%rD@h~cmsq>X%jFES|Aed-;2cel{_ z!i(CfkOY!?`_=nwS^fNYg_GtH{LpHb#puWZ`R~Jwo z(CARx{oURH1>&?@l{d>`MGi^*aw3I>3AO|r{Z+VR3)l}jr04!{vB1JR1>)CN(=CH7 zK#l^Kx=SAk=f=X?+S*2yxM@YwVU{x|eE^&5W(@v<+-EuZaIZz zrhMm~Uctkq>n$}{596`oDeZ=uFq}-Pb9NIKqJI)P=qmw^RqpSNxa`LvEjptrr}aU` z2u}QUEq#;nVdx2y-fi=}z#jHV)c!8v$xwAZ2V7#@cpX`V0Jzk%1SFx8LppE)SY^ge zYO2ct9K{7xtXEqWY=E;{3 z7mD4BJU+f90X^5>3EqPi+<<(;{@cUBAN#d&F)bh-x0wR%NnYMo%gO+ftv#sg_qQi7y$YCr8xT)og31T>NDWwHExIK?&^AhTmzk- zkht5!+tIA{!t|Uf_w7rv*--`BAq6>pM8dtgoo+{e68Y zn@}WrJjK3uQet4${wwG*mBD0r6kVDw&jZezeUGvj#is^a&Z^TKe4fXV+vfdxU`L7z zkfX9Ed9W2B9b{x=7K@?Ry-v6heKp0?Q_jYaK>tw$(9eqt#tR;t4a-TsW1SCEQK9P^ z9UXncdmh8WI{_poGk7HuXnPxrgZl1u zqjPaUdFfGZx~;g|2ORUVaEWbCOvZ9+5TQ*eY&umR|#V 
z!_xy2a5rTXBG=*j%hS6vmQuU~k%X9K5!T~Uz_uKpI44Q4J|hX;VjdKz++>6poPW8t z|GdNp^s+FUyf+;2AS-g143DSHi#c;?BWkFs!7s4ab7BYKS(h~_ZpFgAXp zFh21^71;>sxp(CVvag8nxcZ+SRPuWxJsutK(m(@rvp6Cc9r6E zu*_iJ(G|cM{LY@$TcZ$5%=qv}91Pr}H|aDU^$*GlsK@3$+;>6Emw3KJ6lOs19(OGb2tX*(fQ^G=;RtoVak`RM4v&QMY*>zq zftu~3encMwFp+G>hoosOOSyR%rv$0y@H=>r!K(>|zVC3#N1Dc?=nov6tLEXuKOFvS zioFNR#6U4vYiE5^qCjDs>oq6%dvDLs@gjuuI!%dnwM@X$`qtD`f4!P(=N;$c1ra~w zJI>>9!GIrph*g7{t=5bX*LrS#LH=}Nox_Xg_rX|`l%0jQ$YXC8(R5;}gP9azM2#^57rQrx_a*mjzG z_w=<*L6SEB3|{w$eckcLw*&;i`D0Y6(iamGM^?Rgw^vgE!FppFGsoba(1RmGpM5td zXgLL{HQ>m0hUL*+**lDij5b2`dt0r_u;>XKnsBnp1%zpwc!qBFL+B1KbxR6ayQ`gvM+RDPpgvV^=^ZLPm1NHLsYh>wXC%1I-OftXUUFw!Eh%5Mv!_GRZR!T(q`C%#cjX9_CfQ3#uu`?GN z5*4PuI^y$U&Kdv$@iFe=4nQ8w71L+e46}w_aI&g5Y-cYzM$H9<+qRO;E|%p!Wd z>9xI=iu<{YzMJ&FP$lcnTvZ+<=v=HpZIram6Iig`V-yq=m}w(N9W{Lqjp@$>kZ-jm zUc1$B^dDskKO+tP!MnOvN5w#zdAF2IL5r3B-Er(zzsPK|kQ|nQ4z&BO3|R>}_m0>@ zSN39Jd;_R^O>vdS4wjbTHN#?U<*eDRlbCVLl#Q$56^Q6fyNNPBkC}_J(RJ*f+ltNy z^Mmy|?hUz=Lwq5IY==VreBCwLm~?F4v`Y^s_w+XCAH7GpE^<$nFK)BlZmiIoS56os^$J`q5FZL7H_eIbmpwefZAKhRTGx6?JQO}1xQn^_bpfraIARLx$T(RqEkJOko$zbTPHZNt2`XQM$Hr=m^#r`&7d)Iv{w@Sx4K>i{xprZH0~7eJ$+T~xc@)%WQ z8F!jr^-(2GW7tX%m-f(>w3HK@13c}Rf7!U4Yua166=>&3dTdAu^n96Kz)}U%44a816Ztkvv}Y-8CiBVy51%|dBIeo0UuIC zloM;{-EEGmLTTqAvwL`(52{6Yk8X2@OIUX;5zjdyPacjTSZPvy?5D@=ynZg~Z?O}C z9`{N|-mL4&B5axR6KP!`?S7F4cfd=hU;84t+6KG!*$_zTeGq#He!6FcBw*{5gA+opp65ifIO-FTy2Wa@!5ud_k|1`Hszu0@3TtYQ)ur~ zvx#xLq*E1-S;LRt)#|?>hUm%*J50fpd7AeIF_9DkYtz{ zmx1-Cpb)$l43-JfirCt^t^EO7&F9J_Nyw1;nJvZLzbaZmxWPuef$^~L1xK{HC^o{L6xyof<3(0WOXhi9}8Vb;W znN^L!CsCl6pqs{1|FSDb!3ajRzOnBOvUO^x<0}d!e8@M(SdEIUY&WsD(==E$*2y}5 ztGN-Mm*byntw2CgK%G0;zVy)vlkQ?fL`+0&tx5rSx&;g8QEeI`lLVnn$a07}2zr{z z3PaK+N|c=kW`fyEWyC-!sFHXIbeYxFB=)OP-Phg~tEGv6>aatv@{~nT@#i(p9Q03Y z2xu>AS9%wxV-YrR6=~g^gEM=i3zM!ST4Sj_X{4Q1k*9wCPy5s`0mSh=EgfB7RHZxJ z$xOUFbjZ0d6ELl48elh==jyUr0uT<5G2}b+It3X^1+%86^9_oM~P5{5}rIjd6R%f$gWzyL;t)^^ZJ0edsaH- z%%TCkB(T->P%z};XaChC#LMfnKP6A3_F=(NDm})`(XnjI2FQ>3TDA9p6sA$zfNHD& 
z9e<1dd6azbmtHRa9abF{F=kMH3&WYU6k$92{dQn<@6^vXl2Z6JzQ}74Xwc~Uw0X6d z+_9iiTOZ~H<)ZL6cHI)=2f8R2r%{2cR89yxC>g0&9E8p8 zrA@gp2FJgPD~Rv4l$K;dJ1_JxWY#>yhul|mPjz#@N6^0BIHI40C&P1Q;1^I*Tnv z2xw~H8iy}ng7+fjRd*0=bUBSV$k)0&(nr0}z77Hg9wwIJY zq61Co@pbetH@87gf<`ZAUSc5-^K1>6n~lN1m<@o34J*q7`VepyvE5fQ`|QPt*7^CF zUto&IdHsW7z3KT3flX+r_p5)rGckEASB&|*ytFA)iu4^mTWAm6=T^sqlzooVpjxZf zRR(k;TMjWa+Br!`k2ixZXX~j+?N==m^Me6`z6yKP0#!Ka73iZ}-e15by@a*FJBf*L z#I)MX9uLQWeaFPnFi?5$8u0*13%BSppLLg4)ZiNGUefI&g{#EL#bBBJWu1OpZ;A!e z1(ihxKBHfH$AS8IBd>|?^sWDa{r(A>@TB_lSBKm{RKV`h5KpPQ?#|7sCr|}=02Fy! ziBs$ykZ_xo>R6?&rMrD|B|nTLjv@zc8l&X6dCUPgiRK6RC-@H%ykV-S0?d_B=N(^@ zC%C~tda6lxmv;ScG0HI8O$&PVy6R$z1hOgp+mJvpB~DJzPYP35PA|x*fDV->Qak4t zSO>AotM-9u4~NaJg=&<%|C6#DuJ+VKefKu89sk=vu^K>~?tXx&(X1M&T6b7c4gut` zy32{@@ELcwwW8X#yAao8;}_+E)p%~Muxw!1t-cRgfj1U{vFy;O(6bcM17@et-Q z?>2srE0{NWO3zK`*Y668f|6e{%!Di>Q=lS7`^*jT3DhGvg6w1d?v zw{YVeD>AIC%*;4BP+ViKRz;OsnJ2eEhw!DA3k%kKg@7!)ARfWsCWiuN4Qv{Kby<IvBmG?H7v#fa`u@_ABZWsKkYUC#k^}i;4T7?O+ zy`UfoEW%By^wxGgJR!rX0q|iJj`8idxfgG%pfAdtNmR~yOmm|+pcD{wo^Qa8C;x^y z_Oe0_`QDHlbAT+>?khV8(7_eRqB)|;9j&8f{?+djPLp+|M;!i54Sf5B`}*JYznx_< z%0d$U&zfFMEiDc50HY{TgJChP@MzfZkPm*DJ|GX*_{`PQr=8+EC_g zKeWD?FS)(oth^9A4es%lfOM*K5w5`FWA>U;`f5H-_9cI0ys%X12x2wxBE1F3uq#M( z4-|(D|N1r=ZNCu$gI>(YUY$4JmULsq);BB1r-~~H$^!MlgpYPYL4gI^D)Ah-+K96A zie1jTalaMh_fH;fE7WBtu^`%f)U0b{&9$>F2?(WU@4u`GI*6Nn+|Yt6kY$O+&>8Ed zM%BX~1#&i6yK^BI)In19xRDb11>M4YQy^t$>wN1gFyfF&R<+zh_AM)ltXeQ&rJ;g= zyEC)zB$VZ*chH!nm6cRy&`%Y2$zpF=kzTwt~2LLS2X#*rzX0Iz?rj zMEjSV6RpN8nk>>VMG?6s6elj)r_H~MhB8Z$!(ACiFDWK^zJ>OFq zrqSV08(x^OI_)f#QdVsz{ hXHnDZWaQb+Po{i5&H7(SGyzKYdaPGE^ih^J7A?Wc zbupscXH0+b*SUu+W)6?p8%G*W)#adatBzLYgT!KX=(eBf&l9Sd1JqlBOMN}O{U=oW1)p~-c9Nc`fw_hH3*?#f?$%D#Uq3zjJ) z&Q2y3rt*_Ly2mL#4@il!A60A&_O_MoE!Y6Y_Pi_{bG2K2n-efWIG*x7J>Xh!>URBtRlHk)o?U9kN?V&$*7u%)n2GzP&7XG9i@J;Gy z)LDEu#C6ml#urTU$(54giQe2qVI414(|MO@DP)G%H6SYvEvabWW?(N`Kf8K1HP9ia zj%TV5+sAt`B{A$twa}p%?(pRGnXuZUr1bQjy}i+y$Pe)sg#{Ml{nV2s9AU@>ObMLv 
z-GB{+6q$F?^i6uWnu8s^$z+N8ZZw!gew0(R?#4&FiXN8N)Wr3ry7oq2=jIivsH^8C zm+(Wi^5bBjt*K$tT#8($xoexP9V3@1L$@*IEV+t-r|HMTBr{UPWtV8YTni=eQ$Y(5X` zD57ELSsoEF?;Th5`gtc|nFi4yrUO097QDC5piTaS5zf*rq0AWoL$ena)Hfgrhv>Dm z%$?ux$Hc^hjSoNTELi;ikYkE6%fZ_BoqIXA8cG|4zzHhG|-+r9w|UPme6QK-X-3*VjD)7^HT z?Op}xzqQAa0f!BfWjpAZv!c9ZLS8@nboXgDXu-We>BB}A#G{-IrCltTa|Ld2$R9B3 zjfI^9Ap4L%spiN?x2v-wp5I*aIS}EXw&z4d!~%de6m$-C=A3QulQzp?KJY%hv~)@< zu}qtuJ=cS6n+scOXX}SpBWd<;{BZ?vcWJ4(b4p?uOQg3HK`;R*6B_!``=})@4YtYI zV8$AE`t3y&qM)9Ue(<0K=ap)$ho;nli?u@C4s2dtoJ)5AWMw)biN|h0sazR+Y>mn3 z5)(a2q+^6-Mw@bCUytp5|8O$8=bCHzQ#~d|GbuH-r@8aM+_B#zGz@u^!Aq~B1%Adt z@AT?nLk>p-oe7z|HvQ+w*0$6cpah3$vUFtGM%|v&;zz) z%S)aURM*nVJy18hy!b>$PG;t5rfR((to}ti%weJ+e?gXWkDtAIHsnfu8R?Vh>+Ht? zFkfTNCCiwNEjRwOMUPAB7MMuW!5n6@}_wn?R2A9Ub?Sy zbB(2X^I0pw@h$-cTKVz}ah!L$tq$|uUCiiVm$}GqJa%hIZ)iR}KHkx}d|6|Q8V#Sj zwHF!fw?gT4-f}YLyBEwT^XF)4VPVE`OiRpX8Z4>eG!U`t$)^=Yw>9}-_u9QS{byLX!`}0AuqeVmHj;w9?S$SDe?_dH_>`@qQh{c?o3YJKSZfjYTF7 z-2kS|)pj!q3-pgTWwm3^PbtjivQEj1gBe{N`_BeX_3bQ_W0SUc##}*LToWAJTDeH7 zZt`x5U-)WjN?rfQ^C!2m*SEcoZdj`I^_7kb)kTiiWqcy~>>(Yz*-7zTV3OVSlU2Q*iqzIPw< zUDUeubz`Z%$1h(w|2r2`%(ki-qv^FV)XC2$q#wv-%|MDY=ZI8r15~nB^nhLWhcHA zE4iJUvfG&AFu;v8j1f|J6j*yOadCbu!+2(Lfktf)WHe)>yd1Y@eOJyId(%XG71FWq zr*}&`jgtfhrlz{*u0gndEwfyLsfkz(e_+uL_v^o1W;7i}#pFE1UdpIzVbbA;x8m-v zXx(((;VR*gVeTmiHw}WuL0>(&%JuR6$NRT#cPn0f$aJmn3T3F4StOUD{Eb(9rn0Z_ zo?h8XTb+R-wxh+%>&4X&dwora6r^KAgIXFkRZ~hxT?*rp&K#j$IVszuFA}rz&vff{>Fy$)dOYLi zEO0?8ItUs3&@OoH#}N3kt9{Ms5NY$n{NP!aMJ4!f@MVo#eVes~JbCoU0QuZ2H^NqU zPgO~|&?*AykgD-k46R0=m1}UjJp4Y%&pH<2f%QL^1b+#b>Tk6+Bpo;B@G0L-Xz;%< zpxaAk-bwKJqkM-5?_kb`H`R5*RPL&QVS3qSjp$k+f#WD1@qGH})-O(K;|O)A2fg)} zxU}z<`O&zW$b1FD_~Ry6`NmcLMm)WU-zgQ{Md;gde-s_WWWSFrN^IqRL99W_hp(QA;3F$DPkOP)Xc}XbG$YQ+|vs7Cqi{ zC&sR0UOl?=l^4x6jc1x={`3zO=JH}EvH54bed(w$=W>CqU3#mgS*4LS{` zfmH8bTIT$wA64#VUimg@pEYIm4Ym4>l5d$y2t7?7s}!=uz*>=!XW_<2d2Q9n)q~G! 
z2FtMH_8gh|o|c)Br-sML?dgpV5ALF~5+IEftxuo1J`xCUziRuQgN5x`<390(Tx)91`qKM$f8){T5J~)DX}(h#IoT_*yIw_{ zi2E7cO!0+}A7ZgqKO$64I{6SBm`{-Hi-9sJ?Q5>*#`@7T?*iyw(_qdX_+(i#EYUr^ zaRu+!JC>`h7Z88dXPuO<_>-9*Q8qhm?jIdeGn!oCxjcX+%y$}}G4Y5UqrVdJDAvq* z+Zcken7Yl%jP~C2LrF-hga5J5**exJdK((B{@#xI!_t5`WBomcnN!CiW0A1OB#uYT zr+*TV(6G1Ul8$CU$}o-Zfs2>xEq@D3{qH!;S~6aF8mPcv6eiNR_R`R66~i`4001*h z60m)|SPj`?%GCVyqcM@_YD`cPU#pMyz?>|T2 zjagqG>w$5zQ3=27_?)qRR6|K!yMIi2pSZmr^-VBIwC;lC;uBNH*^H!qvF<$Vs$9{- zI6lpX%p`JLdnO{os7v?t_#O*>T`14n+}HdrP+$vOT(A$Zq$yEfuO)g^w{HCIr6)}l zZLpyh<8!BcAi`yhnmE2uzW;ss8cPWe$@{@DQ-_FYyd$!kD3xcIb%{iHOwLIp)zI`XL1#eeeg$&c6TKalr~ z{PZVat{qSXRMQ-#;VWf_HqvQpx_SgXxl<3}(;Kon*?-N>6M+BSGBpL+8my((XN+M}4Pr(Rq>!S1Ii*G4$@O)xZ>tL`&X!dSiY_Vchgm zYVLiZw0r-v>6;&xeqU8cjna$~qfS%%psHQ`6StP4aUDA0+n@ZYrm{UZ=gE!C8ofRYpTR>tE$^IA_d=-^!KaYHxydc9S@llQsNF^h1Lfr4 zk~G)ihoxGyR#j6bH~5ntyJrU9xQf&nv!ZwBN}}2AbgFQfe54&`8T&BpRUvYys8hDW z-jXirZ@bL0bb+fFdaH|#Zr7Et{?6|RX7`)lamM~h2mF;ZLo4Rf3K5fc$A`_E9rL6* z#^D0$b&$S@eq>P_lBenR>2@_Tv*vh!fZ{hbPvecsfoEs6&ECHAdAL2alIYr9ApRKSMi3cd$W!sP;al zts_Q0aK8voY6xcqw>{M5ZhmwpoP#=?(>?p@%V8h>m9URx1+Sk!pbj6+x z#qiK|=?l9+6ItF9;^B%0mQ%5U3Hge8;Lpg+9*A_IAZH&xN-I4xQ0cjED!5g*uSVx_ zln)8)w5z_;?6W`Sc_EMiXR&Mf6T!LTWv)`e$;8>ifyy1!cGtKGjuwwecX~bKAGyL| zA8V3gpZ@&$qfcw-72moB_(iUHYDT7?1^-qbB0=OD?sJxq{hFhIo|q)~ymd^szL-*U^1<@m^D^;)oAD5`=2ls!fz{&7$;QbiTxgkH01byggy!Yp| zbUnV*SCl#b8*0UB4wCm}AFn_zNXz-pt(f#@s{G$~o*zmF${mPZ>j%-FFGEJlJiesq zv|YkzXrA=Wr+p5)dK1q0+Lx7t|l;_CK$4ruxV!dEqsO!z~ zz5$;6>;JwPdOiT(GErOe+@&%^0Y|8e_)(&N#_kDZ7BY`~=E`*QPOjZxhYE;o3PHz? 
z7wyckj8(RmgTI#5=2j|3rdSClE87Q`@&Bd%NY2qKOcfP-1V0yiVE=S`!i(25+@P>Q zw^F~DY3(`;g}e z*r%_sMwNS*dwu^sk^6f*GS1$%DSE9hk5J6f z5DK_!*<)Ubz-Ywun#H~mo}H`8kZG{gXzTr zmw~5uujn4Gc+*|hjO4xvyANbyMWu(Amq7GREA-jk6nI#~lftp*a#xiqOh0OrgU7hq z@{#@N(y!Ktv0ag+{>5`+e{rE{5d+mj49U2s&wM7?;;P_tq4%*DPO%a)fc%NLY&V?U zlk03pCD!tFZ&y)7E1SC*H zIy!Y~&PD$=)(c%xe!c(s2#04#WXh|`S~BN>k#=t8hX^P}sQoGN8}_D=)j%4KJEUD# z+)2xfqUzlqEwW$96rI+{nw0%@?5FzX^<0VL%&V;6(O_BW*@q=Vwppmvi5NRXs*ZNh zK5ZiyNq(#IX3as7F3iDzA z;{%Aa!ZVRuLp+ov1}nj{_qzIHCAo1C;~(1Ib4+GHz1gFrEc&TteX zv%b?azIs*s$5}NGm?8VtD54oR4&!j|&{=-PnA?qYnm5&Kq2bWf%;4WVR3a%SWlnB- zPaXn+?#y=Zeh~QUhNZj=>|@6*{f}MdWY*Q921-vp$bR=2S0;MtAl$E>1>SlWsok)d zHcj*GG4Gwv&)W+&DTURZyA9asb&6r62jJ}XdWpMqpBBlqDUv@tCi&8f@f#C+_kcuW zbQuqy=}Hf`U5);aQETu48B#N4#?jRq8Przt_3L{C98|lxDE;=imfGnZw;4z0(vPzx0)-Z`{wBW@wBX~k*rny(+U&Ql-X2=?Z;HNKOvAnTr{B=Mn7I@ z*f7$zWPFyHWYw}ZWfNwyT(r%)^>X{}(hokz>jFL)A>!XC0aL3Qt#_gaS7~`K z+~xdw-0W1dWf;|G-kWV0a$no0QqTR}F9b~dtJ^_IuO8msxROCtl~^YgOA=C~+Ya66 z-jUR()>g>L<)?#p`kd)5gxgb+{Dd6)l1GS!Yc`{Sor) zRi{c7LI=Do{S+ep>H}P?q(k!{#*BD`I===3vC-^f!~zGnK%0zLXUP-k2e6ZNpk zhL%}j2H#@w2CUpfcgahn--7hjZHcg)H*Jy-SFzP}WWlBqN1qgN>aFcG##Ra5{O3s7 zWR33-CfPjH)56L3d9vye#WnqI&QQYol!cI6lhC4I`_9`hs2e5_8;;C5t^q8CAdJLk zD}C_(9wn*=NNwShz`AzAx z5T`?KyQqFR7abtA@z`ZH4E#)|ZSDTJA7b*&h-&2h`3?s^Mwzu_)lUT<$u)fR=eHaMA>?drU~axQ<9sTX`xan2Ti=_LCA`4ko27UC*l#XT zl@~`+*N{F&dAjkwzyGA#NWkeYT*>@LyKa5s1x;usWpAlYn1sT_-?H+p2X9tZ(wcG{ z&J5$6+qs*6FyE9AVWO!uw<-N(s&Mn(z9{7@HnOk1OSVOZgrAz~Jdr*Jy$w4~=Ph_L zY=RC{xgCtRUBpK2q;P)67wT_b)dy=8rxv2QVexbJykcJ->Qc$8B>fg6KL(+e zlB#>K(C)uKQTWszlFx57eA!GM86H#<`^`yx#dOhv)80P?|LDe_J|14Z_XonBC3R>4 z5R^JpUMKh3v>}d{*_sdD`2+P3+E%Zd$DcW<%-DZ4XI;A!`Zl^f%f$uqhg(+0Z3`}^ zdcf$`iU+d2dyrOk-s6qd-S=fPM;q*y#E`PZscKP^(xzP7NW{}pf1z>dEhk7(8qQ=B z{n9vEDukqx&Qm|D!rZE=eKlm=PC60TM*1vBmqbAGQPLr(nVAPda=vyY8g(sw(bUr? zs@8gG0248=>n5qa`KPn}GZ=L7aTq~jV>u2TTQ&{ zkgx0bfj`Q$B(c3P8FH=YMF`#-?$P_qR5W{8y=!=Us)P@ej`2SRxi?T+nrqhzHi;jBz?CJRNEzEJCTKBh%Oo!V*wfirn!by_8Nw@g4s=#uQj2r!) 
z+`oTPZC+^@3nT%*FUrb!|F*N2dd`;EufF@j>6|LqTxM~~aJ68P$H(@$7mYsmi?TL8 zt5iLdOz7{(*PNz*EGD#OI!t47*DrO4WlQs;opN-c-*rU!0e|(6nnmRfBfI6#F{h5> z(^Sy)$L~2!34fksu>MsP-8V<5cjSB2O?6lmA~=I>XfvB`s@!Yl@VSiW>B`F?!6Zjg z-RrmTm2ptW9dEff-qt-l^pf1I-B-`^7n>X9GKouhsx2$^HbEQN?BCk51g zuyc3}BI>5@FBO+YKG*MzlD~)OqqG;KtoT4>yUii{(waP z>0!${)N?8(T`<;9Am^4*WhVm=+>EyCb7wsF_K9{w&b~BJepuZd3=Zg2_djxhv^Iky zJgr5U%BpN+I~lwIVgq%18fSlfJWNno>*e141@BT=!BKv;^gk-!FD(B?Ib}+EGX!gP z(8=wdZ5_;D72YAzk>@md2M=;kH^I3Wl>>*iw?ZE_7ma8GA~ZX`BX!%PN)yt~PXixJ zrDSAumTnydV;Teq))|xL{x6!YIx4Cz+7FF@bazN8jndsncXtXycXv0aG)RMVcSv_g zH!?IsN%y;c?>!dGTC*1a+QxT#FN5**t3x8E?VB+1|Gu9jPjd%n zj!J!cx7T9kvQ|iZpOZR~O|RUDogKf;3;=?LJ zQ?|Pv(RC<$42IS$W>NUZFCWLepm}8X4TiU>lI`nKC1gb>qsiUJLjk^2SclrzAD^9X zukHQ#KkC$h;$dqju(FZ2AmdpXg60tX)^ls_pO$^^`yLs z&>c)i3fIbOw@#AlkF_j_VoT}hAA?$c3g+!2xDKHy;5f{j4_+a0bR=YlrCE=%S`_}c z`lgm~mn?!LH0W&ZVZ*nVYF^|0zEKQUL!hLFtb}#*O7R~s9h5^1RVNY_r-sTeEsKe@ z;?afz+ceC}Ssgl7sHSKc=;~oc>&2BK+Bq))|ARvdKz|JvCop-?D-Y{A9|nUGK-BB# zL}uD=^`WGzLap&lekUyldn<)JyWr~lrZQnL`FliMl3@wb-rA=e$&1iITL&2Nn&Hz1 zO8HouqUa;v#^cM}%?JLcy^>o{&)9qdW<7nNVB~=qsD%CU;S0&fFAoaXZc6^k0gnpU zhapDKPuw$_7{NYWcLU<94ZD_^e^RWng0x7z8S)u=1#j0Q#5XR<^<7@>4O^=>eK}cL zwoxwqa|LgDfJS^heFEy)Xg`aW6S^c)|L{rQWgzt;Ydxp(VP?I%3nx~4NjvU0Ij3s1 zLU+{o1wEk~LCQY!f;sp>yGV%*-M)HJ+buidw5@H5#Jt^MvBm5YwDEp^%HK?r>#X(h zR68CDeDXkk%K-ql<5o9C(2$^iW0`LXO&>d7Y0H-WcomwmHb z*2{@ki{Svm0~cv#U7-9Pf9BM69Cr3|Ww<;Yg!#oBbZKTOvKT5F$c8)}Mg1{T!MqMN zHXDP-!qHB=fxA$)K%gSR03ly_D~TLH*nnVK*=$W`_%u&Zbf2sR`{LwRzc)Nz z=pj;pdISeYas|(iXH1>~foc@tkDe~&h9FdO?YyPNbGSi-ZKF8_^+WdV9PG0M{|+Yp z8Jxv=J1Dq)YPr_p^(4fL3WQiKudzPMMwMaQJt)b`v;RFY4|S(^uGXHOa1M2cH?aV? 
zq#2v06pGZd?tKRb*z;n>w1%}M(jHpShM0td)!uOm0-|>&0L{AB$9Y#qNi{|xermVh zS?5lC`)K*?O-Pbf{ae+-p?j zi)*ETDKt~MClu%9`tVF+iPsTrpDrW16YX2C^%G{igiT8lXh$D9P4*=)(hRg?@WPh_ zTor%!-%gZLLXD1e)mLL(_2$1?^d^ zZ)Ypl7u_9h_9?(EfH7&5I)+`9hRVfrVTVSgOpCAIszqyz<&6SD({))Ok;Ed;L$p$7H+E+airx=6-7t>@ylDjGnxDICapu7-JD$^ z{+9TfDpoYk0|{nAD-HfXk=dpnyf4U{ElW#K?=VV&F6!S-XZtq7tnlVcjlC}k^@nQSI7%Tr#r}hm^+jxom|Ap)x=+K*&Qcm z_57v1pY3>%*K#i{+^f($q(|QQ_;h)ZWhDSNwe*D^8nEW%c`zdl)35i{&~K7AjX5EQ zR~RS!E_Gj+BDd?btrm$r!tJ>eQ$zkT>N!7+_2oFSX+J~Fo!}#reKDe0608~ z!lp`~ts78|f<(Z*-C!XPNK>KdIyBUL_Jr*?7`9VTMQjU}#AV^)NS+H4r7K^NWk+&x zQqr!lHym}DY?A<)`jTipzHz*!T}xz($YFvgp)lmxV|4TdfuX8rfTi@U@2?n~YNf%2 zMjrYu#CX>M^57f;N63+P8gh*(EuCBEHcv}7uTyQU^M^=TanmE9eq(yN;XG-v3_x41 zmN|NcnYPuKgDR15x*e*{uWP1Ns!JW)A}z&BQ$ZDXtS%c;zrRJg9c+6{?(vmMcEkDaX9QGEY$0O z4yOuZekt8fv#M74mEJbs=t@va!G)F*M%*<^vNy)c~|6B4I?CZ5Z#bqyL&o`^wIA*S8c+fPsvF40@Xlv`4mbaWdx~iEaua zLJrmz5m!W&IuaYv^i2=9&0`#=^M=Ms-X<`cSR%{E60@yKW5T~*fDWBP?plfEe#Zzl ze(fJzGDu3qUw>D>a`CAW_w{4s*M7q8X01SJZwNW5*z8&qtIi5ZST`GzmX<~N)4`AF z4XO?vUtKxPVC1(uUF+Jlt&JY)YdC1M`t+a)%|G_= zX~tD-Enfh18<_ZUZlEsIt)MEJeCI>c;~@b{s0&5={oY-Fx>d%!RzSzCq3^*_`NT!1 z`zD!#*ZMKO<>q%imIGhWG&((p+JOdzgE7sqHKG4yE=8fKoBVd-n#8Da3aQbO=3;u% zjT>w#A7I(k$XVgq!mah+#MfXSG+!q&_Bp99#pJE_(@Z;^?c7Kdj<%voOxy@Y-L>L5 zX}3l_>%ZY4{S(eH(w{Vu{~0Gb?l{Km_)T84A@QNPq{q~u|ByjZ)(@9W3Ra(34!%IU zFb0t=Lm2ntMl0JH)MR#d>GN$%ArFESIyBF5$bAeNM>;s6u&PmI zsKJ!-QMs@!c2^xiu))SA_BEP??c4a2_&s0cAm!7aP#cxB4Xvq$MS|oq#0<(au>yp^ zHjy59Ra|{1TOE^?$u>5U(nd@+P6-Qlf=Hutep#6%EH+ za#Dzm<9}IUv`TSN=~M)p%yG|C7ZvG}IzLhq7iR$l!iI7KtphUiii7?DC{(1tm4dc{KP4G0+a5vKK4#OZ|M{X7%Rlp;F83uV2mOn;R|( zUe8;77@2mx4*>c9CtbUWhh_i@eVPe8<;Cyr- z%tB-l5GyF+zGY#kUl)w8`mv8K6z99&MeQ%iO&h}eraEdI3;HtKFT$B&!=2q1|a4#ZzQoo|p*l(1UAqJ%}slPdKJnWQuM z<^R7Hz{|L)`%r5TS*vZVRnhi0@2&ZVLbs)ZoqUqIQLglm*peVO|hyjNkmX5zs-`g zytg~~UJ_;4hQL}|2CiSS-lTYO`{<{H)o#t6*!nXh%lU8i-#eGTql~*TmkNjUKZ%?E zTW{D+Bu9A8*HQ<@H{q`AQSvwrYd#KHKKHwkS(LYr8#i1P>DdO3>l|-bE6mC3mo5Dg z0`6vW2LTAOEa|A@WkJvBxw09Z={A 
z)tIIeE~;82k?i5_YF#p0SF>>(A${=59OQNdukb(mu=dJ7v1)=V>;G7)wR;O2RlmjC zWlsG(9GZtc-s1GsqS{%cO7BdEvczn0vS?x_sO&vNpCA`~%$wJ)nwdC4HQ4x<7t!Bb3 z$Pzw-()=v@M2uRcx5!!ne)<~qJmzNMRog|@P;a$vb~oAjekz`Gk8l5!Cb)6T3yrPL zj!-3Po%O50ZtDiYh=TY5@4<@gM|6|e6|dQql1|M=E6gP9oPIcyX6#^M0_HB0lG%!E zRXs!gKgwm)ja6Y}GbrpI5O{ysQhGqI()w=Z*B4|;%FKtpAc|Y)MV-_?M)Y1yb=Gi+ z$GJDCHLX)qfc{-{wy9W$}%Qf=&@&es7591crQ;<{G;YSYwV>1}0QOZnoznPz` zkvx2CiWoo6={A17IW`@M`|ar_@j~s91JLkhJ5C_?lK7<+`|`j zaW89v`n9jJ(~;6tN~Vc33$rg2hN=+rR8wx@%RI)rokGr7vY`g`GD9Jfc&#YyPmS)@ z+2forR5otvuggiW19q!fA0Nc7RDXy^8P3@5G+|EuYW#N zY)m`#Pe`7LQ+PQqqz9KG|l zTlW-x`_nxLzsqXpd=93Aq9=V^;ECxZ+@(C5@K*2~^zS?dy;N#DpkDLd&o;)gCI6h#5xCa7kTKm~~ETEUxx(4fRg^kM^S~i)TCqzrd zHk6ePU);3yAkGN_R}3%SMz5Pul@zzy;QO=*wH4Ayd$Yx~MRVm$!DF#*TaK*f(?+7# z476K8wyx(NXF-fj=VzkTT(*tx{hjv{o*!Vw1$FQLusU=<>dJ2-DLq2bK$)h8)-ZRJ zfof@9>)1{0qMQthY>|q%d8*|_;%l9$$elwqoULDrN6pMw<=u`sE zdd0K3EQk2BUjiJEFSv|RztD6Ve)eZmQ7tcc!_85%@}_ZLm_xp+@~a$x?j(+c4x6`| z6E{wfx9{14{9{KRmr)sCr$C0Q1rad=c9EP+H}Xgw#z|wUYtw`FW(PP(%>%{~D!vK@ z46uW^tsixn9WwL9Sdb74W@0rCt}Sr@omnf`z2X5Tkc?h1}1!RR#el zGnS^R3DiugQWHrel3EHABysVQZ;7F(VI-6)E>unG`~1VCE?1krVFR3BrRlNHp@WMW z_H~8}krxBUeSE~tdc>W~7#<#1PLg#PNt=H{96k%_Z3_uO8BHO%?l`@&DV`N2oR5O> zV7iGJ;^aWgJdY*mT4h$270fDy6w^vjuBbG@T-7UOassk{NKD8VyQEbtZ?)=qmGbMU zd}XG+q%kGB?3$VmMqE?|d{m&##1%gq3S4|y-HuXP#Rqi-EGE1<9?hXa;jpsfif~$e zv3mH^?=cE;(mKutJ_KUpaGEI!{9;VuB3i1Bzv5CGb!&{OnhH<%jLt{CU3(?~_4oxm zuCj@zjxIWM5$y;3P1$?4ecd&xng6c0o&TX49;E*~U%frhej5FJv*rTjI`x3AUL#D2 z5e^3R<R6K`d!4ubM7+k2Ra=*kwLu7kpPrqs$2R}F zb!0uO>Gz8%)fuXW%%vGYNJBPOg(--)jM3C=_;i#epv!O3+**Qa?@hXNHE^Ds!ml(q zIZ=uA$jnefMC=rDO6__BeyW!16?R8-mS-#b>^yVcH-&fLuCrgACL6H3Izu4lpO-ma zz6;sw<4L^u+|mvSp&!Gw2?a;xKBAy;50)qBJg%QOUC~cilAI{wzWOIs{WgFSvi>zk z0pxXD^XY`$%@a!C$F_T~gKxFFsw&K?E=@4M@lzUgJO*ykv$b8ovV~O&EUDsLB_))V zKcrYyX-m$kJo~S5*N^um=?TZ=*Ktd`4u$BW?@m^jIBp)6ZN(?cMtE_l_nm(_5wR5K zxMN)7ip3x@i;{?85PI$;y%6i7AlH{$eIKSYX`KdhC5?mu72SZ?XeIE0kn#DXyn`JM)2m7zriu>yrpqHPkKe(@ena7e0D@FFLZi5i 
zC~EbrhW&I(kuq)g9zYmF*DhD2DNctrw9)<1IqPa!!`Ve&$F*HzomLf|WzWF$Y&x`* zmZhSTeF#U3_Nnr{UlQuD)3*A0mF+3t^$0nPu9rQT@GQx$^1|^&sC5L5d7~N>dLmoQ zDtpV#%Qs10F)1F2wNZ%1>LchhMCiXt`e7{!CKRS_S-xVBTd~#O*s&T}K(4*2#;Kz6 zZE>vo*X00fPQ_NA7{^a6@oH75UW%>n&-iww)W0@N#ST#_rA_q30i+^|xxl{tM}PD! z8OxW+7CdmhyIjY~_+t9)tHZw4R?+JdYf6osoy75jJy92TE4tg`K>`5 zFMKv*OobB8Hl2{{Uk6x0An6<@#FsDo*%x2w1xza3Pc?4r>JDvuPctbf%F#u&Z8m(a zmI1lh-ebFd>unGaHUO+o&8l23zlH6;iTO<}uK&FQ4C%o5qQcK!-(N;cDh#-_BgM8g zBgN(P^Zn63bjtu=Jd4bZ>OYWjk`)+qE$RU^XPVZs!Adr|%{AZWXZ(h1D(5CG*5TeP zyb)zR+_#Z=J{G@C4-DUZVhpd@#-fQ1!uCs(XWI}~lpx{S%V9W()=lQ_V=!&tC##7U z4guj!&HGK;J=W?!R^t!8GZG(4*7(t4tG*m%n;8N|>L-*F!KK1ifHUEeNPE+H!Ld7@ zuc34U`Fbrq*~BN2wF1OU1{j+zLIp$46D*XuH5#8%%%mtoX-oErFIc zeDi}un};4IvalYoZ~_R~&s4JIT9$opZ$rPM#uZb}jWg`&8MBAza<jP8=ewEPY1b%c3 z!3PEqW$MKC&-$rBKq(4rl3GB@jpny8km<#J*AS^$U0>X&(rFuzc64&H8tVoC;vw{B zgbpz7eRjOkE>0EN=x$$y;}8Gr0Y_Y$?Sr%BG=;8y`5YYI_Ro1 zN=Ydlgr9iUZo|85*-U6i^Zxz2q13N#?gs~OWn+N@T`GQfJ+o=|27M^{AVBpIxAvCjROLTU_&Uvgz#qt3%hQT(0di!ba#$cgfl5xCM@w23cg|92>g~(rG`nk zb21JQ-u?K#;+n1t%KbI0<{Iqg8Y8{W`AU+BG6RIKDHEZT)D5e4kexPkzg}98hbhfw zI70gM6=Ug%*O^h$p%F{2pT@HX=AawdDn?}D2q2}S zHEGV%N$Ww_A=Q9cFh^StZEHNB!g_2H!*2Rx1Sd%vBW<`2GI*FXYjigq-9!Jnn)o&n^4SU}$1qGhej$8XwxpbK1*5_Ut8mTj~Xy z)CH^xn-~hFB^+zl_)d6vW90BFnPL~`Nr{bPG9(pWYw?nx#>oq(N=Z*-w29fHwkE#J zrywV`%p)dF;s5}erc>KN9a-tG-_irPk4C7SiGuW5+~;U48~FS9k0wG<1al{-bB`56 zv}IHZo27gy9T9j|3{AW^8G~Znpx#ijqn&k^BATvH2?{Hk!J8}>O2vtx_?Ch4F}_r; zkSK^Uonb30XSzI;fjBQ_(`XiNSAjUJu^vwaS}1)Jr;*{xyVrHvkD^pDt8^43Qoc&W z{0$qM(!4H@7-vZ5y79vXULDzC*TT;HHni>NO*9lvB15gpcDm2BLdIouUT=!gYRTU^ z^WT;94)zr~=q|!7g{5Oy?M2Y*H-n551U-;2tv>%lUm}Fg9`qarmMNN75j&lm*Uy`{ zJMzlcYz=QXNS`tm({3pqpY|{A9sFJ1kyN)|NYMywnpLk$^J!rgkH{I}#Yh1=$IEST zW-(ZSZ*jvhJ<+KtdtHSSBvDa`h#EevqvrGZ%rn6NEetweH} zQxjun z(`FLi6Sh@y!inCBCwI3wczRZR7Q4J+u-p1Qv^^R9`B5^Gf~)ZooTY2lHCY4O7{D0Y zP1NmPmvImh&uN>b>nC%oQ#Ri?OA%wWgyYu0e{rTohlUxN$HA<6Z9UcE0 zh~M6i62NRj#XT$E%eZKk>^j;x#CGaFNT#5aIz51_iOq#h<4Sbi2*^3L?d3;RUTFds 
z*)C7VpXvdvb>X?v)T=ZYm`Ff9sok7wEXo)!&u2VacMyf6D?9Q_LSN`tHSh1jXG>-m z7)t(iUI9xZ^bm}I`>|=Rm#NohqqRwQy+0H=wX@UvZ+aV+y;4g|%k9YFKzG~CU7sv$ zf8TF6cfSQK`JX^)`qXlH{%@$^VC;Sp0zJZbl5@T~in*bP|EO~Q^;c!?r{Br@ffU*hqW>d(r5%aTGq!Z>uFs2jh!$kZJD}TA5^r84NU?P)m2xs)_Lwh(F_6InMYk z>XKI5D&7}vdn)q|QFzk-G=aM>sfW#N z!fEMt5>{2C=yqa;tO$nPO=BUhti(!IX)@E5Q=SNz*%;Z&GS%R>ARu?+y~}j3t4bGA z2?TaniO`DCcvXjwh|x-fpTnx6u`tUgW_M~7NerT|jvS+}+)F~fds8Mdv5Zk1dt$sd z(?DDCpdCt*!)r+kXw*8G`}4HPcmI=lsLTbA>N)GuH3|LK>$PJ)LwrrxTvy?W-lQcb zXoxyhafc_p=BLXE)CMcT-_ub6X;?O|bm;fXG4F2VE$65Gww!90e|F2+C^gx^&sU{- z6{hf-9esE=F#K|IG# zkRogi4rhP~AWlXz2N==fx>nz#wqwULxMzYrDV0#Tcwur3fh){FZBPH*Wh=A#PqyAU zYUBG(*Sz~_ln)P|5gd4Kmhv=WCOuHIP(kexin3<}hGX@By618o1~Z$VbDo+z9~1Id=|BQxw@q_T>9F~1N^qcRdr z8=%|^I1^=tS$qW_tkC6q{>rZ5AZ$?nXh%Y$v}I~K?2ooSsOm=Aq=dF!D5~P52H=Q( zN;`<**Np2;$C)XHgf^!0=8!r*focN3y}G=pqGny@C3V_(q0sh%S1!Z~@WK(+DwSH> zB7;va0m`@)*Wd9A&0hFWTpqokB;Lu$3YoztiT8uh21Pcag-#fn_HQZK3{LwpSuJhl zgDQB0&lp%82!)p4KMJa~@mD9tmZflFK8LaNfei{rhjUqgJ1pOYw6#3$iwqDhQ7Do- z9MoZADA(*j#LmKXsZf$sJAqShpZ2``%V&zkj$)T5Su?`fHn3wX1vL(`Q9CJSlSCprrB1Wi55>&omXhT1hrF9jHl6TU4GsDidCXn476C0?8!n~W6TtY z2i;fP6><3Dpv)FE{ zFHBYJu%v>X@zVqI?bcz!NsYZigji{9h&|$q?ACff{e&`d#uxY_1=6J5`=oG55ym$v zZIC~b)^H2CEfYBIYIOzE+^%9M`TR~%9V7P`rs6qG6d$zN5A3`hgz-5ObiLQ}|BK@* zX_t33*k>3qWZ$`~eS*^aartj;CS;4|rcct!Fq*`^9gw|l+@9C%3p%V={;}oW1W@@a z8c>gkboZM~`vrayU@d}cr~$X;D?(s1=Vdd!T`U{&Hx{wi&N|pExV;6 zDLIH*BI*na;Lg1eO-GVch=_JoRR7L>D4r~*Ls7F#f@d+%;Z-McI8!dMtG838 zZlor{igzek7aRJS2?J0&t##aY=HsnfT-q zpJ9-Nd~Sa{*_X_33B}(koF16n>6uze&Y6+?&4dzMlXO8DD2`d8g&Q>X)$8$1M85Jk zO*A#B_ummG?;S=Cqsr}bH6;X4g|1*sGpWnge?BV51OAQ3iKZo7kmH<=)t{v6;}V;x zO>!@I=`4Rf&{nOULsZCS(#@3ZTibLd6 z>DZOaV?dSAg8ib0>Gr38JSem$>=9L8o{5a@!cMQUQg&!s$3YrC%^-N3w_@!6hLA?1 zTWUi3UhNSul*)PxYUduYw+Zva|bX^I< zgY%tvPIYYu-dFEnf0;v_Ea*l&JMZauVF{dt!#nNyx=wSB$(6)83Q>b=dhe+Nv(xSi z2e4Z}z)>rP5-m|pELpQ%&@FGwx6vl+%2YP%YInTnDq6;A;}KcEp|l@G&o?MWQ;go` zYV)1yhl~c_c*ve0ljkZy?Rp(F%`Kz4%Qi;22$2B?9d3xX!$r+#XM#IbM0MOKH%4XgZ{6z}%aX-@Kt=V|?3qcFebP 
z+85!WGoBKQhx0`*b}7u@xrMyC^jNo_qNNO9Ez4O=;9|IhgqqnEMn9xtI&3zKW%8P2 z=WD@O5+G;Mc1OeE1xO*#Kk5)t;V|B-?lrEdw>2T%i3M_8o$?QF&T(Iv1DjZqdiK7# z8#wbv0(lO}Mwnb@Txb@f^g91QW}XDHmnlKA5~At?YQ0V+uKE({m%ux?8t`t{d86G@2_RMqJFThXx<*;CQT71ydEG7+PdS67t3S#Py^`yxJ1G)#`r-jFz4o$ zFO-~0Mxs=%SVN_dMSG|>al?w8`tikNoeAME?98`d6|};X*m{pQ`lJJ*89had)G8%T z+<{=zgNH00d14-`C1n4MMmqmfcnv!@T?K5~hr+N==EpEpxntC^8eBjL9^J}G56s5~ z(u|taPhjiK$b-Jh(T;zYOUq_VCr{(yZKbm8EJ{2fhcl*b;J5p@V#h`(YTf+d67u_t zc)ndN&4QrL7ZMl9j5k^cWsQ?ZxJv#3nD?RGcu;SO<6V{Lk0bNj#5Y#-RmiI=Jhh&4 z{>`MB*~kH^?+W%gz1a_10I(3713GcA4|+*YH<}m^(3kK50XPKsa}hNVLnBflle_S9 z=5wXx-1)sP%f^|q_IEV->NIM{+T>u@pqPu(;pd*5_G3?Js@g~g!t7}PT;Y5 zrkh}+cMBG0e|gjt)m}&znIv?E$Um>t{|r?hOzBe7Q^X%$W!S>* zx`7TghDxas=z;+JnFo)10 z8ZRlWt9JJ18(#jfuj_4stf=0f!ELjLKW4x%XrZ`2l*b=Y^%|AK*SJfv8QhP#Mt)cT#5`u8(}JA~B<{k0X`|fLC8P(D{AcErV>(##wkw z=;MG$_OD<$5P6+2;5nkc#bOu$18haXyzcLt@@u}M&-y7Np$y+< zZ@KY`r+!>Te;G26_GAc(X-_Jl(RMtJ^J6jsC4JXr7bmE>|}29xd9F1IU|RF;Kl0arOMa;hB8)=b2X@yH`ALgRF8N<>~kwiBfddCTN0X4 zNr8cO?44}bgxuj(1 z(cpX!M(bvr#xWy)5{q%k|g9mR+6e2RQJv;?+D}^8xf-lxKDPG2%udTQH?WmvZFeFOf<^ zX>*Psy*E*-TFpWR-IHsTsL38(-}07DvbUA^RFLAN;N&k%r+ld#_F&d3wy-#<1>-?7 zQ4S)?y;+`yG}AgxOYyWc>_LYI(#f0z8yhl~X>d#BW}dO4kNb9t1O=bkgo1= zFx${Z6Im{RG==Z%WFP{XN#7R}OLD>IGuUA!3o{a8Tue*Lu{1qyjPTE$X;TI23`{od zZI#8?^YEkSCPZfah=S9&=MQ0n00TdZY#P#Scphlx*6EOFYBKS zMtp?jN+@-ODh{(; z^=3xt77)rEFG|42Q-35@XedAjiP0e|4_jgJ!jg&A!QJp3LRIs=hfOCV;-^0su zhxU^MpVJr4$@VAbr=#2MA^Ir+oci4XA9O!gd-Q7IJwo5d?|L8*zrc0W-87!n*v?l< zWSYxz{(umqmxtyqix;QG*NEkLPC4@=HdqbNe@S5_?M5AJ_`prfRzw0^ya29ryblD% zu(1A2K=0SXozN=ZOYhKrzhtK#YN61LDVxzFiKIqP>o^l5p#W7M_|r+)h9kWgBLX>z z)n=|h`_W9y;g;d9@uY8srLv7h=Fu#Mt(QtbvtUDD3LqlR_e{DI_=K^#^+93_mNd;Y zTTGsF?2i50xS98ZIZ3_Cca0h?W6F*n{@Dfi*uxHcStYv7b64KPoZv>rz-)wa-cw%tVtJP@8kWIJb7FEx0ur zRHTp|5~q*D!IiG!!xHTqbR$7u%9Od50H%01>*#Bykk8`qOa}c&UIR$dd+T4uc`>sI zzr^sP@g9R~uz>j68Jp`(a{u`wozT3ew?;nR6t9p$@m$gXUtK*jM zP6#aSww`rCss=o?;r95vKkHzq47U#Zr8?IGUFFbl0=R6|Iyvk^bL?>1SSM?JSt2MY 
zKOQl&1$x&9>2t+^>B=oAYOt|CV6vwV&vyjl9DsciuAot`b7@u`YbVj<-bHRVTbRK zgU-zNiWCa6gPDRdKy=Ge9-lCtU}Jp zGS`?rQR21uH5_c7+|}0UjGSo4kTqQj3>MWk5QAf2hfzEvBPX}b-}c{X--m;L0TIPKVdIlhI zV+SAf+CPpI-D9y^H#_Um)42JFoAbP800J3x-&;cOqP4chPy+R^2E6(}A97!#LKFqC z0=j@O)`p8ApR<9NA+m`5)Ankt7O2m3xzl_j#jgwnO{K!O{}`d=OEVCw@!n!ok40ae zI!nI#`?R|`0ONJ}hQgOUV$lesL~3&jTOqLES_u;bjg1-`7e|NoNRA;wTbq_BgJLK& z=6ShXF}cs-3ikv^#62{y=nQ{K(!BSrs1KA-%vwu;B%38fzirPz#lz()Cdo$1bh)M; zm8T04V=qbWz|5H70%Q&=C-FEgP3)d1uJVQ?I8!9nIP!OEQBKV(Wa`JCT&df)IE=<= z(8Nm6(~=q>;LYWv8i?G>t2~wm0VSv5hD8*##mjA#J(jg78;9M=T`*_kQ=?t24bSw2 zCwGp0@peV%a8_2GTT)zgxz^4&T+c}YV6QP#?l1tZf2Iu96C;o;HKYdtNLT7d4hC_S zj}GtFfk;(GAFfNeGtJJpSE8r^Cy4-G^9IfYZcLaq0_*661!_CWb_3)MOzZ@jOq5II zgYOb^^mtkP)NodphxJik$ln_1f)uornRLG+)uBkh1oFy@fjI~sika=EkXR61oIkL< z3?r>;MQgBHw{KRdT%56P-oDi6lpy6lvP1*eI{vc@r6(esZP&6&{D0U&HZt<|_se@y z=hg~{`NLz>_I%uOyzj zkUEKh_x(ceMzyv>v<$+!1)t8fuV3z89xq;AUmT!2k(QCj5oFJF`Y&NI@A^V(R1zmF zoHmL|whCP~qD;#I8KNEM8yB~~_?$)+O!A>_zK$qiO3ui*x#uHqc0$leogNOCysA6T zm#h8Wj>rC$e^Zk4YM*tVmy(!tf&h&CpuYaeLA2F3Df`x-Dbu|(#Z^p`zdNX2QfBi5Qp^*R$h@&*|D+<2;hO&~qgz=^i1nhy47`4F%9wn#I1$}Wb zeCg9k*t7B@TVm!2h=#r#c1fjC&&i9$Q9CJdtC^JnGSa;o{i$wx3rd#jU8>*VaS3Z9 zqO#!>vvgLshVJHCHA^rfvB# zXu!ooN6*3S+N0>(V^I22ukMoh$oDK}GeA6F^y1%| zN$zNZluY*2(p!b>%sy`KDqvEJc@>BHmdEKbYmQ2d|8Jhna5xo^Psovu7EI~*La9e> zDWMXoSsrFt9_CIhk~U_k%z$S>@%LLGgn?GJSj&8$1-!NG|5c z{!VMEv)RF83azgS_Ps{QHvyXEa-VZF->e)ZN?Kjnc zpl04CW;{XoZ;s>VyrI9SK=GzL!dgxl=7K$wty0`hRe?AWlL!&X)q4mMSZWkl`)n3} z6sU5@H8iOdiP5XMxA#jHPYR4~L{*@_k5e6ye_m&N5YwYh`y&~GgcUZWt&@Lcn2N_f zXVhsZ?pHyjq9umsq?o*$qC?^Iny+T-r%vtOAPdjNAp||(&w+fbiy?F0=KmFTK~2$z zQ&+&^Hy5TcEcn^+t1BJP;>-b?$4~uQPL{G5&L%l)axMObwJnbyk=y)226{{!Trt@)LP+-YaK#Aakz z`{eFX>j^K%WsTG6XjM4WMd%*Ewaviy07xB;5PH-hZFqh0yh+Ik74}|(oNtL^3{U|E zpb!im(6#Q{=eqtTAT-L(V?B(-p%c&O@uvA=7bx+yPQUg!gX+a|f`D7!r`hffTqJVe z9+Vpn8sNvQRaC-A_X`Qfcl>K9vPWq9n-fi>Y z6;u0aqwl@BdhTV8RMf66zF;DsZ?z?9pA?di^>+w!1eD-eqA~(i_hyjwjjNQz9HfKf zVDN(^n$~e;i)b}zdo{Gb6O45KQCX3W@1P#%L{)wdp-xYM9*U2ZAnl^tOq%%ml3ED+ 
z3jGgP-yEIS7qlBRjT*eMoraC=#%gTaNn_i#8#K0)#dw(Z>0-?zSX*S&ka=dZI~ zojrTznVDy1Lcy*HGHs9$wdX8Y(L@kL(7Xes?&J!f!L#Jt37Z`1*!MDowjlU*m)fav zA_BgXL1e)_%uI#7;{rU6S6JDTcR-LjrwS1B^LEwH;Ko_T0tDk5OCP9X== zAby-E+nyWIyerh>l%ebFF+nyo$e7@lQqvOR2Tn&kqb0q zPx*1h@S#+Btk7I8QSiDqw*V)L+V1iVsSlRW6aGEh#}g#8eog$knDT+UCWGm+=0VTr zz3%q-=yo9SH=(OU?eI(MEvcP_Bn%CMDOe~B9`$Z)_S{F%$im(1?7h-HG_G-fBKv~Jij zZ%(Z5JpROA8CLGzKR0+}{wSUk@oJtVgt?zJ`_Tn1LMuX&5bF(7g!g1e!Sl0?D=V1g z)U~JEV@4>tTFVm6ERfGl?hChqB^u@NkJ}gW5pP|N)7o1~DI~sgtbreY^)R8shoXO6 z?%_7z!2SJYPl5;j`(zr)YA{R=ca6{+h%wdr}4AuUx<<4vkOAujVsW9K95B}!t)KmxL zQd=lmm*=XWQCj?vQ%XwlLb{OBZmOOj;9R^-JCTdX`N*B%8T)%OnRQrUPd19poj49`i+{qiw=|y3K4jJ zlHq?Lla~FlGZWFcZK?bE8E81%SnV*Fn0U3m(~-#yUAgx2W88H)n+GJzzfbiTP{fOo zfcrIh_BJxI9WL*ai3ikv&FX5|AO)#mkQ^E!aF2nJGg_xAMyHWtngWY&7^Kj=&bhUL z%lU0Oy-$m$1!eW<=1El0^qIMN)jp~B6I~_DDg{gsr;*y;6eNvg50a)PN;AZht1Bzd zx6Q;(y8L9bI&lXwg0O@?X&&Ep<;nnJW=~p7cmR#>fEs>O4OcN)qH$O)Eo%1{u}7JE zI1)^4G*+|*hz5;s*uBD*27Kw!wl;kJ zRmyVM~ z;JIDo%D;=^(VYsz)=W5x_Rx=!9W-Xai&pFDEs+U?J#@kL`}~~Mdc?!Qg5zORr4HlQ zb@uB&btcmi9U%UP0sw7==X&@P&oAX;U}I;m>dj--ZYA@vf6}Jw&&ov~aP|DV?t!LC zACM2dZv?i;h#en(O&gGiJ-t3BIh@9lq60kD`m>*TPGmn|CZA{d1v_=OlYiMr@#%7( zulcqKxR!cW<-q9UhtaMy-1pUHTk#58sPLZQ zeUAa0L4ViVOW(Bpz&sWR%%~3Q^xDV+JcyLr*y8p++e-9cmZma%Mq?F%<$hoga#~XTKAJM^8y71 zp3XnqkWuj64?Y-P3(hQaHPEh2?N6+d!8|_3_N)1IrUiXM$aV&%ElYVD;}DO+9%q`n zfo>^ci#fZtj%^>hHHBvzUU(A&_TIj7=?{|JP)nKb+Et~l;nB@U>f5mnsRQ9lAz&QY zl>DxI!d888>IT&mIt*X9_T+fO@z+0cmRToDMa7#f*_uE3YT%${X1j zOiyKwUPKewv|~Mp3c;hQupgM$K_zqd`0ncF zS0ZnP!W*M7n}ZO}XqC^0Y8j*;5ruEP;yu?xR(H^>gH4D}g&zP{geZv^GlB(Jc`S7J zy5~<6hIws#*wYauLs}&d4^|mZrzEM7z-k9qw+8-PXsT1hy0T<-m&nXC$2wbWqiNU-wCu%b)8o8J=+Y+4JLIbuhjHW@Ds#n&i>r8EBTYTo?F5}k`V@$I25_pc@^hZYw`sk%nq5ppO z|6Tpvo-&*Vjw1iWY&7EUJ5wuM3Kx;BKAdLBsjxJYq-dmLU+K;Asu=9hj@Zf*_Nh zx!ZJ=!t4SBKM#0TE%QQb7kS5SMFp6q8V~)x#_My}-pa2z&I*=P(%NgrK(1U}$0a?1 z?Tiq7A$71h$379G%tl-rl{f4aLRHQ>(2Xn=7C+!6ijqlKCrp!_1PnS>6s0MV|W zv+>U2qU~1IKUG*0#+OFzR3T0Y3tBsqW2ZnNckp{HN_CtzUc6;Ip-QoXj{pe?$+_h= 
z=`l%u?e27OQ0{Z+g=mqM7#TW3$xyJgPvl|0nQOehJ|mp#l@UCLQ|aF{8Talum3(tj z$1u$0tHgffnXBSJ_4;Pp`KLcwe8D`jjO=IsoT&eA)g&`w#sE%Y$G#qg(-wL@JC5FflG6nr`CM{+*V80YQ4TBPLui?@xWJb1vWZ2 z=7NG04Ah{eCN|48=nOI(fI}o4^?TiI6WC${MaK;ai5K z_n_(>OA6CCXE?U!ya{j-PIQ15LBnKV%+(7~2|M=ly)ooOR1ka}%LTO-lgf~|$EiYF z$ynkbi^V3OotCmEu$bc(#xtx_D<=i7J{NfKUYS4 zz=lXY5pVLAY}P(#;yaHx`wm2|5qE;1cJ<7fCZx235n~##s6g>FMe|b%w!1VhN1Lf5&acPgdE$8!Ysk;|5g$0usV6st>Pt4XZrlZ)V=Tm+~ zkq0$OVkv{mMiCM_ZXqC=W=qACX7K#%;P^`~eq8gAzO~TbBu|(=Rs^^xr~N}DDUp#P zU8`|F|4Lw!*b-lbP$P12H!GEpJ6V+5yB6c4k=7$`YULVzx8idur(u&IcGiNYa9Xx3 zH$0*#Mbb8lrDNNc5~&rm6~}WNgij!TGeA484jyff7IGB8hnkk`rizRNr_(V^B0nBQ z)!Op^T3G7No^`_Dm(cffOLw9hy?gz#R_NI0*^djQC?h+8Ys5EYx(d!(OTXtwe5QSS z&opHY{OP9xUZxX_ntqOhBLhYJXQjjVRrDk~LsPzgJ~^qO+t%Bri`_qK1K68oF&WiF z;0)C)Gpuavsk=H-T4OtcU!}=4*qD(y(%|WxGsTW52hW6~vcS26o@}XvETXQn@~7uB z19FVFitXDHNRw&M1_t<4SW`wzV9&B!Ok8?N# z&k742{6H)#CWa`|j1MSclILNYeiwI-zz8ne5h~)znxG1xGo;8P9E-ezTg11X>up6p zk|@}y1Uvl^7iuA`AMfMJFC_VkY5qlvoottnoI>g>gljhMDs`~xNkm-LU#x{ z+b6}L!UyS!Xlhs*OL_LW;X52Catr&&OENleK_}5S`Ou2v@|1#<=OwCSN8!~DyVJkF zm6~Oe{^VE-;oD~^LZf@C9q9CavnOR(FJgT}J|!V2!_pr}^N?=4 z2%i#ZwV;5yXKU~>nQj)}-VrW{U_J3f3RcI9>K0M^pKY<8HaKOE&%@WZ_B19V;nR#G>lU&I!IJIRzSu3Bw2WBR2D%J~5x4eOg=S40g@4Qq zsBrQq@w&lY7Ykm3Itd)-t0=5-l8}qtqSBLh=v0vPt~D$+I_4<1CGrJAEWvKW13k4T z7ohOQJ>CDwp}0}pC|vI1SP^g=e} z^5P8)UZz?bO|-@8Jd*|%g&ypKG1bUu%%#}q92LVjspsE_zt4n49B6;a-#Qoud=-o! 
z4Ubb(sEN*hW$eMg#Do+U_)EVfl`Srgr=;8Stw^28ZLA-%aiI`I1|DXmC~iTD#1Yan zhx4kr5jN6#Jod+u z0$RRYyS{M6tdWcJc$=$R(9Q8HYm$u;0WW%^FkIq1vM7&!Kfzd?W&W9DITivbsg1!sAwAz>wwXD6toYn6L9Uy27q|5@n8h=Ol{wj{+U^6s&o*Yo&v z=^QaT%PTGNF4R-kbj+XDUj2K$iGNeU%6TqrU0w$Uqb3^W$=(=yTW*vd$|uwe{<#J0 zQPDvv5DiB%abGCS020Y{w;vigr|_qpaY4a1o)hG{rM|Sm)jyS3Je04>CB-Awrx?yW z33f~qoaBp8{HmliOBXCooM)K$(Dt-1UdS*750^=1v;?BAkTj=$>Z`7XtsSE>#i1%g zMR2!GOUU4ej&b_dCZdeVs&TF{<>A7XWDbX!84(k0L$*m!K&%U` zsf9$hBJotS6ZEvGLsw_?(=sGA*UZ!MyY;2)DhX?%qr!nAUZ2y7`a&Q~tQGT0x{Y9R zID5I8#AtdJg4E{5L5cI^AfK48fR5#@)AFS^M#|EPJw@3(GLvEQf|GeYXm905W~B!A zVoqaJ3bs+0)SeD$LPzn`a;oCu8>&LbGCC0vdP^#&4B{O`4v#uUrz9DBH zJaZUbv*)^}``0;UCZ>C)e}^___WXAw-0fy@qsqeX$Td-A{j4_V9^Y8VULZ7y$W@|< z=ZG`_aw>sTB=S1nG$>6cuF(kc0YA{NnEI!PsdAE$J(Ri%T)vlCQvVX3TqGXjyw;{=*qB#KV9@rYEeqXcy}hw60gq=_5V}M1CpDob#z@Z zRqs^3mk(zZRh};I+(~gY;!WG!synX^9S}r59ZXCZxNqKJ+T2BUi+@_}Hh5PKXnl6* zy@Sd+K1g40(?7bS7B?cT8#jVV@LQ)Y?ozs!{|VC?B#68x*`_hXoByL-V>C5WtO|pL zr)3MjS98RLi5)w}V;}{VY+5QYMI{P+l&F{lu|#-7uM!8#h!SB9fBk0W&$nGl{mP(4 zW1VFJp1n#&UD~*Ac+)^^hBJ=1_t3Y(Z+t`M&X{`Ks?SV3)Fk}Yh;%I+S9!(tf3EtV~%BPB=Nc4}$Dxg!5op7oL^SyC((W;_Wn1)zqa1 zpM&TE&_~x14UC9abQzs*yX8~wQ-dZwpO-(wx4(M&{V~#_F-K@SET? 
z0+LR#xzygbQ(GuM_z(d{YArp;$XJm;r06wD(**?cO@0dHVzp1ecsG(R5EO?l=2>_S z3_d*hws;sEZfVzjZ5M+~!xwcdVJ7Ru_N+EBVM^ZaB!Wsg?QD)^IyiGJV`3p>F;$N& zI@t1G#4@JkAqKcw0nnSdVB}Q2+vw)Qr0V6v9Eaf((X9@?z{q!;>3*&rF8=*yscenn zrmth2Fu^FwDjB0o1Zi%DAzFD|eV|?UF@vsEb4cgN+ePMNG|%{64?+>Dqn$OUs+BXu z<+F*Y2RuQWom`c`jeWZc${xXgxXciik(V_Jb>sSdx1o%#^Yek%z0~7ur|UhOIv`+t z0>Z8*Wirw_tcfu5 zxI+C4I{D9jDYbh6gP|w?6=??_foBjW&++5Ap}w5e_>mfo)TFWWoC79FM}CO3(}%Dy zkp^B0xPn_&zM4(_`zK@Ox(H~!4< z0MIW0fIhkapuhEf4m6n00Q*H+45yBwHnpG4Bx|e2ish(>Qj}gg1J5=kq=-{P zTH&7>%Wf~;Bs@4_;;IlkzNa=1uIO06`jed731CgdL5g`0)0tbyi4IwROKdPs+7i!+hHq*f%Za(zcX?z zkYS5kLN0tDaiB)Bb*VNYDW0is7fKVs1j@c-NN?;d2^PHI41aKUlGzqL1x59VU7WfjNu4F{Z6$)dlp1VOKfB*7*N#VRB)HucpOwOG?ZoJgim*ect9U!?N zG`N4`z5p;xMDRoArTl8c*}31Mtm~|~>wrU6I07z(YFBAwG=!s3=IQx2d+R6 zPFNla4;%Y4IjuYE9;j$AE|eK@%4{v?-IihQ4+S;CEJ9I+J|7O?0+lBQd92hV+;Iw^}3EvY?L z1bLJtxj(Cl2DA(Dcw>=#VuH`(1$nAN7<1mf^>F?dV@Cis1=t#qZxnXJOWd&{bfb~A zw9`k9A)N=j%V&rKgTF?tlm~3`wtbmD_tDeZN+=ysOB07J97oFy@NPuPtOGsKb^oRd8;IFw1@c+yIVjs?i8UKlOK@hhS# z5}5ReXi1k0_kk|$Mfvsn5Kx{+wGp6zLlqv>(CH7j`9fC+#f1P2Z>!((`bTr4V` z_C&iQqbrll_Knm&dme28=9iyqZ<;ZCl-$KvSXtkRW7}&?knZ5N?ss+$7-GfH0}Fp) zQ#x7kb!Ofm84rYDOJ42mVH(46LwdMQ?M@aTKXR+CZ{r*{klEPJ>;J;&Au`WcI(2({ zz_St^c<#ELV_DY@i|-rCu8M5OZ(Mc6tpq53wtElWfi#^jLRv3**^_BZ#hh%x(7c=A z9NX2swtYDv+wVYPeE7-^7_6=r@KnM__>*n=?2dt#Ip9bIezpR`WcxyU->qzIAoF28 z;$OO)ebpY`rtMB;tezFZu4t|Mj=vLp@#FQg=iBJUC*%cKB#%BJ+qvnOzKhrQyi0B| z!mtpY*GpP)AcC@FSYN0~`UJ;Emj1C&jz5OqA2eF>*!yW%+|`kZemTH}mb!!mx%s>} zp1~ctl6lVZ6P;1HQ!+)=G|#5MWlvC;pU{%ypEOdBIv62+Vd^m&Su(#6VwN3L>WU_FsTmqBWf zWJzrz)PK62BHx>3Ern0pXjAPL0krTE5lP}3%9}UUQNTW_*_JrXShnUm9y;P$2LUdE zPr{cF8#jk=&lX{ALKLb2)NZj>Zv2K447VFkGZsT$(g>|&Y=_J~^TuVf=%_t3gfgr; zYW*l8QoEqY9mC8cmiUM`N?UN)ke&$+?zrg~awnWEEm~tVLZ}{oNZkRlXaXAfQQ6q~IY#wX#wnvTCet8IO8b!Sl8Am20*kKg70mlBpjyPA&stmA=+vo*Y#=kmL8-um zp}G}`P-i9`&nekY9aa}ZJWG?Qc-JvOx^X^0oC2JHVh zY1+fkdWq28JkEam((X;T?(up$xVUA?-+`F@wsZgv_F}ajNWpW*=z0#H9ahA%18Y_p zFQj#&o=kg_vkHJ-(BZ@L;RMO+4KOHzD>W5QSG0`j{uAlPCryI2>!{Zj-0r+z4=fb1 
zlB)3mxp9;Yu$F=Wa+QC-3*!=_z#Ao`VOwG}*{b`JmNBqwAv+w7U6nctvNvSXB$`q{ zz(LDib(KoIB%FWEhd|zwHhgx^+54tx1CqJ{mpAN;h7S_TJ$1n94qC{4wZEezolLNQ z{>l_VK8BA(G^iRwl@=SW+T*Dq^n;F)m2&I(PO|U$j;OjJ;en;c(j80{VXwI?pFiFj zhv1h*4^_JsNj~>saPZPdTMO$FoYu^Hl(c5z(=D(61HqaNQo9V&8z@e}cZhe(M`N%|l1{hSgwa7b!h@z1u?-BDZjDD&=ff4(gD+hovv z@i+Jj=cNRh7z{edz z>5MIu7q^xHh|bpI!eVDc1bv(10u#XMxNvT`0E~8 z9e328SF2UqquHHU5361q0%>0C);-f=1Yv_b$MUYHc?3Zl9=oJ9lfm-|?+2TZh+W;# zc)lC_*F(E^K-UJs*IkPLMz^-|KZ80P?&h0L);++%xLu^TMh~9buJ*{qg*i}+uL zIrb;B{3zbH4C}CX0ZgxxnwG|`tO<+?tK&@0YpDbuV-JUSnCLN-5;hx~$Q$haEon*} zQi2W^lpoL7*3>}rM>p2Kq8Ezp*&Agp;N=s=v|0uwR_R#~WQ_kot*raxO55TGx5d{ac3=%!|hv8Gw(T-(;=mN1|gJ4<{4N#_NF;=5DnaMw?N&@$Oo-F$5@w6^Q~Lj4P8MeH^9X7*Tg1 z+>i~b+(`o35%ILJ#^;;8{Wto8RpbLQuJHMKp@mwxNE9FbPy#ECzPTI|=xCwqpxSLg z3XLz?m}aSMa`4>Aa!DdiJZ4RXdnlSPdV8D(hSOW~mJ%PV+h`%NaMJkvI={ZO#AQ)( z6`yt}p3cT*l&M@P9QkoH$Uu?(F=YZL`VnL#6&LBP#t{p%^aIyDD)at0KDvUY>q%>; zy~hC^iXIV>vZqHxa3d^%zygsi4NXYF)N{iwwZFb>o*{zCTSNH7alcMUIXmV#(s9nrQI*|Tabep3yxX2V3DWG=H^uK;&kz%p9u$OB-*3u%ZMW()Xz*Aq)Zw5 zTQ6G5xfAuv__#RG^hL_jbvo*S@_p`2XLLo1H(`v&^|aJ~h^1RgJ{}7*^TWyWpp$;k zF#Gn>D$ilEpA2}Xa&N5+*mF-zi1D8yqwh`W!>ddY{7QEw7QP{lX8yjP-Swq zZ2Ey;KX~4Y^DZCrqT?6;X>rek5dOZ#sx}l%&mG*Rn=B6oz#F~cdm+zw_)D*U)A6#2 zJ?TaLk2-kuScI23{4eC5b6DR>DaCKfDTv%_wOa2U=!YGEg=w<9jofSoi;h*fhnh`*q^q8D@sZEs5a%|Q?BqcNb5pF z5wjl%8Z^cu9krI0sA8c)=sfH53*TWc9Qa)mVPEYI>ZJwH>aom!m<0rp%Yk#>YW(6< z8eo$V2S;oka(+ZUkN1s*qYBM+1r0oxkX3%!(7QVHgYCjP+wF(z7g1#ODOW<1jB}$x zw8-6NH$Ec`xxJ$n-g@ueWdNW0P>@#15 z#CXvT;G8h04}(JRgGmv&zxZ60n{Iji^d#+Y>PP2zDAVo7d_U>5eYihcs_~+jc-qCZ zouKIS)%_UP?d9*-BD_33;P?95M|YzkhR7=iWX5W=fZlMLXKpDMch3M?c@h}42nN-v zjd9~VYw>WI*PEG3xK2qvr>Y5Rgl$y~gKmHS=B30rMUHL~9KGrOegq4y#9^z1^5raV z&*08YV}>E0BoJ19Y0sCqAcI<-qzF0e^B4>=%=(MK25uI|E8Dav9@uQOVXX!i!Mpr- zBzV!8`rBU4Rkg}oQ7SD^Kf7J|&Q~a91+bC|l~a@#Dn+iLLfpEYbwA~W;#6uz$^GwV zn>xp6OMIo;p7fky1ZW2$f7miulKQF`cY5M1_Q#8W_$KN1ETBYd3Mle>Cz-QkWx+*= zWL@~lf_iW}btueSXnG8=bIskqVzkwp0N6Svhm$WlSB=+2_I`@lr1$xCx01>AV%o;Z 
z`6S)DQ`m)|XoD#ksiZZv2Z2Z54p#UjPK%eMjYOB8_yNprVvAwPbC14lhd%qaD?{`g zP-k0FbgTrD`?6nqyWZlKM4ix*TTNOcgzqwKg?lEsCEYOzhlfDu1JRvQ(BwM9RG{q$ z1Nyead0SqpZ>r{quixY9*VTYwyN^_eDvv0zEjD7tt>aN}UQenG8ulOiqTi%qZG_%Y zZ}_|ohwsyxQ75nJKh;kc{W%jNm*ra$zPdS0H27ct;cdEbeaf-2^(s$tG9KevHT>%| zCKr7uo6sl^dO)HJolkozwVAhLxxmInA%A_PsM+BARbyv>66Hi|Thaq=Hg~dw_0nnH zOO_rLeA`LO>wK2pJ%O)y!=?St?c}rDXy>*)UXk6Xu=Kv)IkCM@`=}Ad0H6ussf-Va z#_a!c0TRguWUHPCJ?{-an*ZIW<)v%g^?0l+dP8`>R;Nez8x^h#JK%pidVEln>HfCy z_?hp$>LZ-rZ5ws5qN^ZWLw<7@=of(0@ig9a6fb4FbyT!NK1dMpcK;U|%yv!ICrq{N z@y_-6;tiXQ;~}^DC>i*5i+S@FNWz7g@HZ0Hi8c1AnK25WU@0AJPcJ%xc7A8I;bQB3P#y4!ua_c!moTXpsFAoa(9!Ym*V)d7givL2wEf7Rq&pH#L>^z zVX+wxRLK6p9uc&HK6tGyBU)g(6Et`GL;Tb5b@z8Yg8{lf8dxvz3H}uL?1tnIN#YN% zlzi0TSlT9fpK@HnGigZmzO(j3S_lZ!^sG9r`eVP2_WCD%*M~(8p+{8P9BT*Ot%nqC z-vZ{9@C;8HmFA$p$T$0f{)Y`z+ZDxLnp*ohelb z%R*zkpvZZ+6E!k(wkMfKJ#Xyv#mw==d(UaT@1TNF% zkR{Zz7y-u_X>|!jq3w~uI-Ol>N#Ma2C&P_wZ=zQn;9#z=aqhD6z(lKs>Jj#b9)ziE79VwIX2nth~9>HN3# z=TT&&@nFf%7b0h?jpmib%vxjpMPsAWACF^Vll>pByU%MK=ZW74`vCEm(gS$2Gy17b zd%xcv24R82Wz&4Ckl{5W;kr)vPCW2yoYO*syXk5{^XdlIrpt+ajpf4fxB=(=&@QG| z?2lD<6;NR!k@CUpJe(tnt_t%Z%ZKO((nqu6u(Jb`ukQ6^BetDE zx9J=?DMCT9QS!k~Fe#V}rLP#Hy2u;S9z?+C7Tt$~-g)N${T(uk!cDl~<VR4Kbk}|qZjIZ{S80}C#TBIb z@E};14(@lW3QC4)D}$Q>qDTGj-WaV$<>ckrve(oiog2Eg!Wb8@nfK=+zQbxb$m;rn zcTSLYyEB*Jv`-j|WN=Xa*^=A&D%6Xsxz`csZLiZ6TvthRz*xD{u)@ALry960#bSSd zCG?62M7#Qef^NLjLK@^jRb4Q4;i;C-gR_4skFSy68H-1RihEM^ncYEN`|6F*&HzUgBd7%4~K1cIXbR=V|rj<-BfEu4c5dSR zp7JG*rgzTy8_^IkMa&j9qPX!R6iu0SYQ!s2ZiQk{d6N*@y~4wtg4<5+}P5mqv3 z*l!SV8oSo6W!gr4Zd&-Nf3~YZ$DDl?T5hxhVmdK?azF&zwpc^ttv09HdkRNT%vLU} zI7t+wPN)hJuog6l+MLGjpqatGs%E%G5?$s*g0MRxRaQOIO`>&iRH=X zZO`$Js`5i$A6a-v@H~(5W+ig(ZS@-0!)|y_p}P-4w9w#R%=`{SV5oB_GSU5&GQ_xb zuiE`FWnu1`dxrgK+oOL~cYmXjQKgRFDrT5oM6l)}dN&*xT7Vljrjcp3ORT7i!ZL{q z4pdJBFBf)Bt}+IBcXrl(2Dm!3oPXN($rAT^-j3_|t~s?HW_9Uu|C7d|jyFfE z&Yy$+RUdO9ANWB0H&~<|NWEQMB@n*hO?tn642T@~;Dgz2cD!t7e%#7FJ^`J~R6BOb zmlzlsZO8jH8vzIUNS{eHtucarV+?||sO@R=x~oGizX57&Bb-b(9Wwt& ze_G*Dl7e_< 
zLTTf^e)jXkLoIR&3nfqcgzKj5ARW_U)64QIY;?B2sL8!7(Y8hZPl(JWc!Pg0%f6zXpSn!y(V$3=M~MJGCw zW_+2}3W}%ea^X&sMW_tSYdyD>*w`^9d468(PV)<8HHGSr|*Y_s)UBG!x6{{7$Uu0Dwdb_7X*EX582g*Zg0UQ>olyFRV z+6oUF13&++Mibf)K3~gI2#<6=^|C*xrmr|Z2a&|8-Q+K_AXzODiHd>}CONHmO+*xB zsUApX{vj$_+p%K4W-llrz&&O9JB7pAWwzWvf|G&4C#*a{Oz`1NBdNcAIx|q8Bjg@+ z7%S`UPR2R<{uuYU%Ez~qw{g-})gXAf|E?W!fN55UnxCf?3X}9C8p}Q7=H6pCs!*`Z zCzM!RqLa}i`+EFFUo}eJ+g8{v=7k8B=?vZKd>&uzOFM)0bAq7RxMjYlG7bCGVw^T6 z#}WpSD;ky2v+W@epe0OCOwR%&m2Y%hA1D6;zYoRH-kp6bIvz75>Oj$j_a#4nGeI`r zP6lr&sb`0b4jDjc!63|j>2u?_m!Ka2*b864T!(80w-0om;B?*^eYllYdt7@x)&nrx z&z)SSPjni!3M;Vz$D)laTzlQ~^@=ha0*Jd2>Nt*FxlVHPwKYL^*tg_HMk+`2Z??B) z(v9%$ZZcya<-Kns?oC7I=4hU;RF}lbQ7D3R)xVfCfR@SH*oF0p<4QR-*hbkhL=VLg zNw0}Tal4^tmBJ9Z<#I}QvH0j#2}zm+t>@>i<9dT?53jXF?i>FbLR|VS)rFJJl@C0+jYs_F*ZF@$#q>TtF8c zdaQXkaDBRp-+f1K#38g#muBSY;Smp{V%;ta1S#u6ef0L(K_3S&7qxY{hH_^Ke{xrw z?o>}jCy@Dg*LWEkqQduUW!~^Ecnh7+1&dG>7SSjEA<}=aOM{WiUaE5gY4vIBi~F0W zcs(3OtJQjwyaG4iDNCQNCIv7Vl~V&08x(y;<=r(K`fLVWiLv9fI$Ry9!uLW@T2uH$ zk0ikmN03n;HiL1KdQv6FPCsUnZ6qyM%{GK)L|qID2r|VWC(=uzN)nhoX7_!`-#^pK zUc$0gql9IcDnvl2gDex9A0sxAaXz+~Wyud|i$uhi31yl(#z-EV2wTjCfX9>$&f3bS zk1*;Y0oy0FKT7#@6o) z5O)RgYJkZ}jM1|!%$&spPOcD;`fb~}E25Ls-gvFL*xZJv*G_B!Bp4phw0*qc@qJCV zmKy`)x=#xvYJdQ{0&cqN9e*2C6|Xlu*BRp1^dFwL)<6HjOZ7(cuw>jQcl@93e@8D1 zW@QJzzg!?)@UFj1Ank|@;>F;vxK!4=0Vx!zQ0LY%>eyx~I&t^Mx=w zRa)+xzZ7$~n%wfcbU4W$PIM_@g1>3tN$-sO_{UE2FsK@G-f86(CNchQHt&-jf=LS| zFB~M%c*XS|$c6ZW_Y~8IhG@71a1y3U?T|frf=za*HHyEexe-T70uEAkFN>W6rEWZc ziY(g3Noego6w;QNw8eltjk2Q{YmIxa$Bt;j@9FLl+?-uSiX%lUyxHwxau;{*#9S_D zoYC_qOKs+}EkC5{QHmEWmfGw{2acV<1Uh#^Z`838Yq)?+vs9pS8R^qA1|;)rg-98V z;RD0zi;tRGv#__pD=bL1I$K;wm~lY9%Xt1E8hS>QqXr)6HY=j#IIJL*4DA>f%=B(VwZZP(-(E9+#nnvM4wz^60NjNZv%7Xc4u7ZIfJ}|R zz&h^xr7&3=hE{Z4n4UdiYl%n=Yp(t*W=1+pwt#_MR`((e8fQO!(Rp1xsH|2#L6!9y zGqio;JlMPv!-oQEI*q^B+M{>Z#`tY&RIV6HQLh<6A$@fB{8vo3-xg9Dn)DQ^dn{lRywWKhGTQ85N}@Qz+1_#moGt0wPVU zB>vvqw)lsd8wu}eB{JFmK**U2hS;J8#zQR-h4a$ZT3=zD#%}^NW1a6Ph%>zs4v>T+ 
z!}jBa7sK!v(>})b6n@S7DeYv1hLS~lfi4L5tD0k|GSUbn2}aGnK42Vy&r7lp9)-4x zfi7zMWaZbjbs00bi5q5w_hH%f6Bk0`Ek9-J{PnHv#UJ_dEEC`|yez7ooSKy$N1OpT z<%I~i3LwRS+%C?LAGmCK_MUhGP0&R}Cib5iB9;9BvJJ%JOkUj(71GFz)KEp_UN7Zc zGn`m3jLMv8txi)YxS%5+%7Jir^Y^VtRP+`uotBR(nYLx&V>!uIit)&K!nh6t zc1mQWIU(9)58{;%gVHQP?O5PL3{dWrCs9ixP~UT}O}MF|QA0E$-&8_qOV3!1et2Sy zNGYMqyAHBtl;j-?M5tEXSm1l8i}!GC9~}$tM^iuOGj*8A503w3jMbkN7g+etp4Y6J zvvLG9cPZBy%Zm5K z>a|Mu;|~3gh1U)^Kw7BEbo;7fe_8`3_^AOY%WxIG$D9`7^>Z#I1T(fPQ7ys7#UYkJ94sErac$)87G)n{BNu64e4@W_GY}6eD zqm^10l{pP`!|t@BlgLKZVGThGf_xas6Llp{j9QbSEf1w=I~41|64j}p9D_MR-}kIk zD^oeq9|4aW2_3YLoo^%h8$Lvy!q_Ooh#4O9=YdF-P3K~pBrBWSobU2# zE9muxheMuAWc&T_m=BjtT=F@xpcja%d9hi=uH_OjX%Idr4J?ZQ^hC9o)HL&N!;2yw zg;6y%18o=w*bxCa6HEv$?$&6Suv8Q}uE!j8;W#3td@u!SPqFc|8Q_Vzt|U>;TSACG z${cJ3;+p70izYr&J+p!KugJbV62cf!w7Kv|t+uuzIrp`Ohmit7JTQp!JSA<2)lckY zY+=@jjA&fL2Legsy}_WBviH`SD->g2zWVIS;=^CwP#T_5B~arHjxA1ZyU^Z zZ=`k9@LYj*m0qzKodxTa%Q%OL?*Bv6H%C?4et$Rl z$*#$^n{3zAWaBhxnlRa#Y}dGMO)aIVolq1sb@c!_^lQnm1x3* zRMJ*?{Zxj0iqcD@x73oJgx$1+y=w)e9u_N*M+;$Rm`$OD?&{Rt)0UzDWcHQINkzfi z#z~D9dIbq$F-rXAAw_^A`GtK!;A>n=%k#OJW2a}g7h4oUm59hk|zYBU{eXqaY+HUNvR$|e15n}rM4lpsTu~z+3e#Te_ zk-V|%?RqV}lrA95hjlwmB{Gj-=C1!Iieb@!pLR8ETD&M;yc!toRWAAN*}lAXE@((D z)&|g0i9J;-wgPXpj*sulH{$1;ydI$cqVxlREXHlj1|UJ zyJfZEXpJ+jZaWL53@Jqzy|!@O$U=70^^zsGb4l@s1>vlg#p6+R4JE&_;4`v;EaNb- z>!pQW-k3$SL;+BsBR6%?Y}oFa=o|vCG2&Dw_7LeL-;{pFcy&8PM;rZnCW85_qV z-TST}b*ErzoB}5GmC6v`*7L>B@lIEe2PwJyr3&`*;K<0j^Y_)vFY3f(F?;F}oF}2f zg{!BAi{sVhXJ#@U z=v@{4aajcl2juli07P<(so3xPa?z&i^t$@{6|S=FxM;5-UYH9{`%E_4+mYP<>BKa7 zJFv=gUy0;B3dp!|sqDmuuw4OCzUzNK;l5sxy!OZtFmJSCn`L+~1L1y(ZU_MTNV4=J&o+yP7=9nM%sYvV1(|0 z=(UITZRE#vAXR>{HOLSEfR|~qBk~QvkU$7YF9Yb+UC;5UWeJFaKrFNIj@83aa{``t zNLG$IM>@aN3TK`iRYB9_nms(O9e+rK7m)!}dK0^AMy2xDF?n*cevHX_GBGqVXXI#W zf@)Za&h<~d66~d?9rf6c8rkfL;|BP?K;R`e0W9MqTBQ~@L_i%8YsF|7Kek{2x+ZIP z_>HTY)YoRiZTHkBVsbFqXH`p#%U?gQdRm;G`L`FD!X(z9{k%W;_>qU`)ptf)E5d|NU{y=`r-C3CUMt)*uWGV1-$7@xUQF*PM#8a~!8MN!s~ 
zL;@9?S`iI*d1qr&p`LyXTBPJiUEVglJk%JI=Wr85uH#tUj@frl9f)VE1N3A!yoR&< zx7^D&5ndo3>>CM??zua`CeJk_{hTd9$@OLT)3pBFTyGc0*UOpnhneHMYCC&-g{z4B zn&{HwRFi0*UuU=OM|bW^th_B-^9sAh#z)d^t?R@mnapVufrw^+mjzmTuXgw+Q*Qh} zECttig4&`Xqt&RC?L_f)>oh;VS#8ZRbRIq9!f`IUZ-*C88FG>7y(U(Ury~e^Qk_D) zL-~!-$(6!!x}GEOKg6G&->dxxn6;I7hM4Wci2O=Yp#Jn}I3<+k`9A^Ewl&XD?=W{l9 zBVuL0ye`LAh95aSMa)#-mZC?XzkTAX#4(P94S`<=DPD{lQaUwQD?Trlfy#4f5wIj5 zDHAq;`@T=w%=Pg0%l&#YdV|~2;<+;$X6C(n1@-xT{xA$Yc}5=XK?AL!Z#a}v)uM7Z zdcl$qWVPiF*t>6tidSk32mp!HU0EV?SS*ikkP^?CF_;D(b})Wb%3A`u$;dUeObBcY->~ zdynF3I9L!#b#AWtY?R>&_*qirb3J1l&l-eJ)xkhY=xNgdn~}dOm@If}^WSE-W#JEw zi{^6$PjElSRS_nrB?kaF*fmgr8hw7VzwkqZR+b6;(n6NaXrM6uQGLXyte1Brks>zK zi|%9f#j*ApR*bA>e1c4Yw88AVw#;i+ZRe}NbqN%q#cY);E4$PyEhCN9qg3L z^YzwlfdH}XLSK@yp0O3Kb@nYQ{Y{IMC8iVMBzT4IS?o@Zn>ICHxjMm$+)?)H6=R%$ zX=OHjRldDGMne`08X25~{0^FgEa5TemY&hpFf6NVf`>CBkohWrbxL`y7M zo%#@)7rq?7%$}DQhZHLN8vhcb+M{FGm4(#Ru}an4r?1-gcW|@yj^mpb%odWq0FpcF zv0Zf9u%blV(u&)Y7fUWBY52b8!Sc!rQO~a*Lt~YZ@!}C8l9HAs)x}u2p;Hkwn|yTl zObTu7y*Q4jphvL{ zpx7ti`e~pR;v=zTlmsW^T?$7B#cG8bn#_ukG=+{ZWFFb< zE5<@>D-wCFmu9p}OXOP3!6$quU`~~oOM`i80&UgW3^x1!S^yiX^)m=%cvE-|sX;ny zgI0DvVq!_Xv}(1`eDD!oN)NhkgtLCoT@DfqhwSb{5s>j)h34BIOB|7kiy}LX11;)KN+7az~k61i8x-wXF^~GQf-Lp5JGb#&{ytEtM<+DhS9x zZBI0xe=bKBZoQ`AdH92vRF4cmZ_j0zc9R2U|9h_woSof*_CM?-J9*0(Pr?1J{1Zf% z%bFd)0m2*-3VH2>I)GfJ-(PmWv3PubKX9AsGkoa!=zamz$0PzTR_zxFst^!Wf=?!% zH-G95BGj%YqdlP?gux>J*t@Lv$03?aujg=s{>`qZ2~zTm>#OKp5)jx=+v^xOCgO$e z*#r)hqkB^?UEzqIbKt1%JFWvTDgDM*6@-Zne{VrK+b9hY#N|Q%z7!PNzOCp_>x-JRG7p9_rb)0O z^$CAWBTo9FM^D(!J+sDOL?ARA8t~#Yq9nUo_l)h#-G|&>Z$P0Z^8_PJc znyIuz-owu?Ug!ISGkPXM!8Zq%sgjrX?$_F@tZX$o!>a&>3VZ<5UK=^fI-w=N%U*nO ziIfs2uL2akj5U@&q{xdRlJ_%$wc6Mih98&ksA&e{pRPBIEq>s?v4{NRTffNgfCcVx z6hqH4Q;#>HqM~9^_|jPFb^|b(@*yGcw0=LlttV_IBGA<`xr>Mp6a{@|#t4D0`1_q_ zxv*QMNMbZ3W$Gc{4hOcQ^P0%<&t4^QfsdUg1(5F2ktsIO4qOva`7UM*&xq5 zO4V|vt^7XBWN&`j14m+?EDi634u5T-*XoH z8<`v1m`2f) z9AfL@eAVviZ-v8OC-5h@t=>6BAjHvX6X=nVQC4h(A-W|upK*XG+W~YR*=s=LfCRBM 
z$$v4pfQVH+X@;M?d#MAYuthnyQ7ES+4GIn;)yk=bDEEz(r0Ww;)5{zxAU9 z=f7vj5mkohSx9=uU z-^Zmfz=*d8%AB`(F?_ODNgscK_${o${+d4?`|zJnadRYEeq>D2Y~7z97y5iSe4OrB zOJVu}E{(l7`QHqA!-!x6RR}+v6ej<&V>3O-ns$kv)ysFTTZS}JLE?3euBnQ<*y#O9 zB!x5iB_|=}W6Z)a<9F66-CL|{>>4v(9bx3=!h-OABFa)kN1s7J_eJ}w6`_5|Tpp<0 zaBi<4!lQgWOS5A_isE|ZI09SJcf>AIWA5DfP<@lt7ZL6C_Npk%?Lc>v_RERWvfNe+ zfZtgIR1tYDAY1wiV`s_7e4M|i(H|xF71~FJ(6-~$`R97 zeAphDyiVNU_)G<-Y4prnrDBvU2bhqhfxkcb{=&b2WKQEJixlSxjv=MJRq0)0F$SAV zYY@juOr2qI=!#J6A~F%wWKLm8Tg1+Hir{T19jtK;q6BYD?0%$w3sh;`wBNKp8rl<* zTl?KHcu(WLPAAGZnr`AX;u2M~!_LXf($)S4EG1DB^F?wDhM_w(8l2DjH$@#?=*P)T zpM9DJE87O48v)PZG;3+XBgx9{_UIZq6KHBK1tiuj)NL~Y0{WP!c0!PU)m;d2vZNpEngp$P( zqE%cU^+l+7FV@D4_TEsCn6$i|NvX$8VOz&=jmA zDwEejc`u_|(3n0I$Kl+&VqUF5=X_wMDF!5Q&l|OpLEH$D^6?7s`88w5CERSaT1v8= zep)Hoo;+0D)cgJ};BfevArL_Op#fQ!g4vXsP1}0W!_Ov;-*%Z^6Y>`Dm zT%sS1SQq2W>BIg|`qZf>;kMMTd&ywzZboM>4|;n#gpS?&`pSQ@jlL@DW*8E$P3^Ij zgYzcqzF>v-rP@XS=End`6<3wN-7aez-A=2lhdy7v?E!Dpxa{8RHjV7UMTHdAt~Hyz zIKP4qg@=G4N6hs_-etu9LVaeXuM?yV11P>py>I^jBi_XIHE1`qEVoaYYj z|FgenQSRBam`|Mmp`Tj3fChMMa-;r-4)51F_V0KG$zj4}D{)VfcH6fMdd9t6d@t1) z=iK%&Ne^5>R9|5ZI)Bx=o0^F0Z(upI1w3q#sWtL;s^D=1C%`xyRl*y=mMcyB`qDGP zJ~`A1*fLh-_m8u|4&d6->ct}HH2;Fz{-_wFLMI#f>xXT~V_cicuOg+Ne)v>&I}*9$ zN>@{38>l8~8(Y>m&K?N$M>z%>f>x=49Kl!qZtq(GUZ3?)Pki6-;Ex@zkgxsr=bDV> z7sk5OZ!cdSWzz)H!iy&3&N0}W9W(2?I$L{Q&n&hl|MQ)?NPG(rKI{-ybhy-+4>Ov4 z2fy4r38l+Hn5MvR^L`xQAKe%;%g>hN=CKZWNS~iYLD}m?opB5Z?68 zLvrBykGc?l0ZBtZJRJ#;JB{;xDhV@e)^Z}1KeZf;z` zh9Qbo1`%UpEo<$K(p?zCRhlbtv(_eVO=~m%*WM2PQtkTkX;;U{b}fm|-?L zudnRV%Zpe5n`NNcr#JEwC7ALSV+yg{JrXLLm(k$-UvQ zo2W_{d)*W#8>$D8ml9uQDj3S_P+IHE=d!CNW*a_zoIx<6}Z`SAOTGx)A6Jyz2I(UP_`)+m*O%I8P{YM6pTqbfnnWl=D zY2rpqB(4q)+j|kE<@3zw>VL;_R|ZiEakdvx*c78(4him^ny!RFM0kn7zAQ?+SjE2; zFp)VsU&cLa$$C7U#nyri!3%Ggm0?fUpDZ1lq#hk5w|CZfF`U#+zNH98kiFpgv$|lD zMHDZ-A$d$DP+WH-hv`dQ8ZRfo^4_bXX0>78E(1u|g(HBI$MxmpZ*^pIjy_pkvZY*7 zLw7Z&?Au)Et+kx(LWIW&*@D3iQiInd#PBQ|K4#R}biSd#Gv>!i)AY#&2y6Heys*Z1iyJa=>vEizGc 
zkzQbM2%w#*cd&^K7}*Vks?v+AB^JO~ON+|eHJsr@k;X6_VhW=|z$)WO_P%zFd9Bv( znJL&4{s#E0KmNai_hQUq&I?u6Wi z-msRLS;=)J6qkDhU&0E_AT_QqU0d%YCPdukg5(&tS&)*0=aDSTShs`Z5mpA8d9ZW2 z_~#uL&7gVu_72P@jY2NE67&y{1SRN?|F2cW8mh)ad8PhLQevX&avw zZVqX(G@D4SSU2&x9ug?%$2M}XCqXr>d%_7_XDR-XS*=Lr+PE9sk0gz+dDxkTv$##t zZDi^yv3!}w^1f`|1s_(qV*@ePPUN=cfP0|bF8`HPr=kTFbZ$I~>aQO?-q2{lg%4=e z&6whC2|b!M+J3EaX;TOug@_;0W&$!({2CQF3E!>aL(BuY5OlSPqi@b;N22?t@$mSQ z|22hvjBTV3X=|uI>}+~nD5-M$4}L=T@8cLn+(N^K$xuQH!ABmX8SF2i6#ZrdGRg~; zCCpPqo}mou#2doBEA}gyHpH@p_)PwlKPL~8ok5&?opbH#Y?H*J%J9x#B?}X3)U|;&xWPU*L-_x+i0{9W!`B?vbRI z02^#8YP^FcSO}b$$s`X98Q`WswGISMt}}hTJ5)Qco386(;P0RILPCm%wojkwi%r-C zGO;bPA&)uqgg4TM@q6xEo-@pPi)ozZr%aPQ{{-A0?39YD@fDA$ao;D!NDd%)AZs5v z*Eqd6JGyrObUfDY&ZFE({c)En;FV7MDc)a_@%XXHZm1guM)qT8kCc?3`7?ySbvCNM zM5t8%1sO_$cR+ePm@HF1LShm6IL^(a?zW@TBUw)!iYZ>$(i50gGwUr zx{TEsV`e7!3IS7k?4QTq`E7o7o~Cv_w-syc2P(ce-Tcd1d{}fiGz$pi>df=m&7c<> z#v@%e(l(4gZRyeKD2ULXL4Ih^akwjn6T2Y2BkgqSD)v=Rz(&c3@>Jl5+mG6Uc=u9K zu)<1g`BZ87h*lMzmE{b(CJ^@iihOkU@{@Vzlc{DeR7z&Laen>6&+kTgksA5`X_}Dr zk7DRH+H4v->B`=|*pFJVMSp?yH{53;%G4IT_g*;FoWzy<*u4(h#HNYSpT33yvCvq+>T=%9O8iY0gY>2*6W_2hO>6k z;~RI!f5MN)ik~2)3B7qhSG~A9DHKuNUciE14pr3*=hZdBi-&~bvzpcl%1+N3cr8@k zGi3%XO#hy0LdP~iq+kXb_A7Y5?Rt*qTpzd9^_M+ zhvugY#n)upQeR$m;&BSE%h0xh>kewd<6nCt4fvvVujc%mnuyzFfz8l0eddTz%NHHe z%0H!+Y90$usQ51px6OzkF;7F=%%+&8`w!xxVeaqpLK zGz$o8iUmED=TEf2YrG;>wt$x>%H`%&rVxk0W0uh`Ftir>D3%5QC&i`wg-YX*qdZm^-M< zGBy|he5ZIwK}V>t9_<$$JrFmU)wpL6Kx9SExX3UKOBL$IX~!d4)vN`AWsRXdMgxdUUN70kMM(_%TJjWf-&|EK4fHgfN%!S+@5t0#LAm}T3& zf7OJtc?x%_a=Y{jS^yX)S%Jf+DQF1Ki#3NDCsc&?s^^Ud+YRo{PY^uUHPHhwBv0_~ zTL4!mj>1EV-VD(_(X`n)bkY!qhZOuc{29Q5Q9RbjcpkUmm>5V9HBDImAOW81KaebY z9iVLP9i%oC>d+thdT0z0`cE{mm@u4+aMyg!sVwazVZ*!sBEMHF4~&tMy`u!j5UhAenv|8t8zD1N&EDBzTxAz0 zd9poOdI{({H_|L@z|nwKDq6gOb4%9R&yet`hzibaP-sk(g`AQQ8EvlzZCCzqPkgN_ zCcl{gtF0<#IzN>(PiWHE=+}rJnO2&S&vDe>ZTBrLrGm&iB0ny0Cb49RYx*duV#Jjn zu4=AO>5{2c&HRr_$WpUz(>+*oo#x4Kh6Kg~$M1CLc?CC;ECpyUK4p;lRRyp;sxi%` 
zSjnmGSE&t2f?Lg=C@REu8Rc?F^PP*Di+psv=#f3M9^>btS39<}WDnFU=QVYWdOdTR z9vC->h-c2T5svFQntk7wOlik3fXaOMA>o6ED!wZT`FiQqTw#DJ zH(fMm+P-{0-vsxaR>47J+?HW#Hgf@Iz4VOsk(wCaA1s^$4Y=qo&D;aUjQ8}GB}3(B zQaH(dB^rk~Z9|l(&{G(a6TwCC zM_0IN4rJVp2FqTx=MYaH)yst0L9Nci=M(QpNK|qq?Cg_I2NQSO;{nEsZC?&#ag*+a zC%!)D$cXMxc=aYdtBg8_8Mt_QtIN|YtB$+`UMPRCu}rNKwHL^x=L?f!$eKqV$(ldc zt;BEf>mU`XhCQUp*e$L^-+n1%D#1>ycl6|H3~q0fu94#dSrAAsNTZ)Edz2(tB2N5( zij+EPcnVa&u<&;26@R>u%Jp5ob zFSp7B3P3iJPaf?|I{aECPZ2heKTi2y8s@42X^DD^wTSI$@&nmt&DyZ7FE!uhiAM=q zU7K~F^dA)pqCWZUh$fr#gVD8!WYXf@s|2Z<}3U#dH2o=wpOs8!r8K{p`Z`_Ls|dWQWy5 zjaK}i4njq~lPlMSQxGh~((OXkj#u{UUhU0_&8`%L;WrL`VPURwMelb9?~iIYVOOga zj;`xOpiC=79^U4%9kAXPN!o3f-BM|A{SBv#c^GHT&z9rwcUkdJW=<=!p3jg=-X>1w ziFQ;meS^FepfR&}1{1Vw###BT%z?jQ7y{ZS21bdA3%Q8p;qJ% z0a^ApYiJY8)UU$1^K__epnKwB2RS-89e?g*+BCeU2P;C+%8@s_k|N{AbWSol z8xZTzWpih{qDTf8x8kAP`5XszqJxjMDn4o$6jl@Fu%&|cZPJMhzZh1n%=Hfq{@j7W zOD#?88(JfhpF;XgQV#~`3p`og8lCdXFf6aa4#!`b+HZB5&nz8En*#n4rwY{>rkVBJ zx3oM9`ca9j28E~kn9{xIM;g5*Jp}rZ$Uog2Zlv zAPpJYu!aIWQUbZxCnzeBWpu2s5KSrJ{bHXFcSlcAVUN!DFT8^HV>*t$gh9@6sD=v| zvf^pr3qNh&J|yfyMS`_H!Nmr`-O7(6pRX-pBQUT;cZ~w2T#Ys zaziaR*ExPrbRV$`ywBFRz1mApGwmmVJs+sYw{PJAc<#ecB*T{tn#qKlPur+h%MO#; z8eV@9{w06`ksdx!7r_r+wGzC|vC_5e*e`@nCQKrvL8==bWEw;m#OfaN->v5n(*t1KGsf zNn(E`hQ#NY@C|N6|9r9ib5jIAfRPmYt5SB7n98XaqQtf;mwNmgAt^C@5*zf-?0%{@ zESFEc{D&r}QXXVwZ`hc+7rP~KE{-AG$tO*+ZVtKYRFy2)XU)j%UcGY?_e5&p7GJe> zyD$kNVT;HO_!;HKnHZ-CS`Yeg5qUe*E(qa0-#4OKo?!0tI5;^Pj&imA4PAOAn8&(% z*G^s~7qpLq{S;@5c zQ?CYope2~9jd0)@nG5=Fkplb}salYcl^&W_^OvUnK+@#nfpgMuC(^$LpBe|*NB+~4 zF-rX!Cb?MLvMD()EI0&Yq7NjJ5S*{sm>;SiXhm`-7o4i$?15s7#EfcB-HyCw zv-r&T{TfJWhj}%X3s|I&@*>9q6SZ*Rbk_b3hTfBAEXP7(A96@@YAX`JD@CC&#>O_K0NVUHr=MaYUcYz zw|}TM9|!6F->F*Rj7ai0iii~6sSTeo7vAb(UA?MsK4j) zAK&=j-!`vqR;|kmo`5xT+#qo4V#Slw6p!9ZUG{bWkVNqJe0An0)?<@mC*niPr8k2< z6VNC_9X-GuJ!o!{rOtXd;+(}CRf?SdXtC!wU*OD*z@DoJfRhcOIOO;hvay5vt}b2RjHG)!(%+EYC$Q}Vtycz%BtR8GR8@(jv_cB6qmCh zH%z|0LuDuUYoDGwU|T~Bo8&`PYB@`6{XrgdmXh%!G8700? 
z0!gcH^v1Oi;!UD}o8)7EDy0W!ehp6QRA?xd$Hv9|bBgYgowBL&u#i;MCdpVAe+XQ% zp|(-3?i>G(7ub5%;J|mG0Rr{Awc)4rqvMWs;NCQHbXE5^RP2^u<_`fiHJ!!ZwGj}D z##%4g%?HvOQ4p4*f2Ecjpj}LZza|<&jma(GKEAo$x$BkeThlx#?4Y79vwf!LM;BI; zU)HmV={S7M6_VS{vlP}(DCUDW^OB&$>vzgYj#7rz9N>vALsz_t8}6nYup_rBt!l$N z;XJvn`KY^XNYbY@co2SE2FGarB4goikmB{+2^_HdEgL+hLUyZ(*1Bg{d8GdNN>6N< z>aR}OS;^nln?iCmMEo7U`aKvxx`mxjL#7=Qvq+vjPbIM9gl+`pubP!n6lnr|`)Jk5 z^DrJJCsi*<-Y{N0W8~u;yy1~osBdB5>mY6flst`At3eg3O~$A9=b@t=>lQWBrdsY+ z>y5|`h=^K8&TN~<-+?b{oSFc%v4%5K2Bg>zjs$Zq}DRU}0cc)Mc?z4uH3N4CYx={-35_uJI}b-YzVXQb^f{vQyB zgcobIFhg%MB-6ea!#;2-p6AnccnlI@Yz-Ec{IIdH{qRc-t-NyY?{{v{(|f zeFYzXOSj#VrLj9I68?Qd$Fp-Zbm`bBhf#Go&`SmsgK+~f8jKH+^k@GwSi%L7zRO}R z()m7ssVpvr9#OS`S7H0VK$Z#dPRk??6UB{jikmTFCV}E9^Fg(w?JadYGGzss&+>*q zS!lENFy;l0k02~c3wW8WaV%tuVGexQ=inr+VO(Sk(Ad**eM|R>_{elH{y42S=du@N zn?d`*C*H0P4(7qD*G)~p6ek`DP*zlT7BTVkJQCtjX@ky6d%Wns3Ku7gbVt2=5(r)J zV+cE%7$`^65(TSZrQs@~7E*8MWw<&h6P0YGhNIp&yZg(&Ejm?%Ib1)4>+7GVWThHy z|98{MzXg$Fi-LJhI!)U#1PmQO$N>Pn-D^NX%&Eq|W<6d%DZnAFGyga|{0GS0K6?Q- z^tpxuZiD?@4&zw0^bDfm$2e50VZ*@i|L?=`FD-rp%rjxgBSx)|rQ2dSe9JtPjv+tdne!|_afY(9&IJd^h>Z2! 
zR2-8x_t3_QqcrrGM$_$sW#B*hZaH zO_$>MG>kh%~_p!K>K@XCE+ER zQUxeyHO`&ZaTjClV`zda4=Q->MWPeMKX8tG>n6sw4LwjP*#;ft84Z5ujMn>JIj<+E;neLd ze2nQkZVH;}oHqYu*?mS*yds&DJ{K zwKok$hg|li5sR-WqSUY$e1{gYY>Wiw-hAdUBV#%g=!FsZMe;Ruc4_}$HXA$K151Gn zcAi8*P6Zv58(UC?Wm)P9`pII#yLEOO<~8snOLxB1#ZcX8V}El)Z#z+Lz!oT9)oV9@ z*PB7z$ym9dKg77c-Y%Wo_diJl`|;`}6l2Yv)Tdu(=5$b)prZkcy*de|!~EiUY(qTE z%w`A}y^#4ic|$`r!i6m_JhhT!%^K60Wu%F`d&zO*;>LZSC?SWu))yK`xC*#a`o(jmg-Wj!O#p^E?TVB zE#H5#;$pZMs3F?&gZ8&`JBcAM-wkVK4+b5n!UG?& zDp$^N(jp^MGBf*Zwel7(cQ>}t02ufuC+^41x^=^}MFTMBDJ2n`YF``CMJF!PBAm6^ zQM9fz17Kee+b?CTpIrDUKbvN(zHB9OCo5lZtybU+(d&-`i@E)7ETg~~?7VEsWN=cs z%T{I2k&9RNa8Tn+GDtI0`Q76|sgl`1=Tr_w;`UJtzB#o49a}JlHGSNb@?3u|j(#OF zWBnuLdFMA~JHu;W@W1yuw*`3~MyFOE#;RAZZVw3q9V#CQ6?l(X>?WEzqY;_gkQ6;f zLo9#sp(Wi;(DB$de-ZTMi;^-h zre)~2twd^%Mg#WnJD#Ysca5K^rXY`0tP^sG~>}H zo?&iYO?@{vGIAkwPg?TLtDpP{Uw)MB=xN+y?{=Ur*BwYUKUdqR4io0GFA*RS4^Ku;NV5|u-JW=*W12_&Gj-BK2PVz+`4lW z&k0433GSoLQmALEE>XO_?Ftp7GC`3pVx3f0sAEM!0w75vgI|;ZL(>Cc? zypH3pA$|IOp9A|Mt0Hkr_3k<@w||kmk}|&*xeD@MG-U;-D8Xvz^*k{8-nmLX@U0$=`WUGnK`hmDRksRGxS*}O%uFwzfdwT0xWv`XM zBgu46x-lKD1`}IsMg~JpgPH^FW|wPEbSj1*LZnlu!$-TLB4fQkxnlv9t!wKxBC4$D z@rikaqOrPjPG)+m8Pnnfa#~cXM97v8^5f)A~Sg=md2vmdh->a$JbYj^0j-+zY$m_>)N4 zL+`3;4;yCHwZxj`wdruF?TPK#lDmu<<;ErhQO#|Pq~%-F_TD^Y+648%k3(fCL#g7$ z0X2T`njCMyGDrd}3NU6%teisfQ$}l#Dv!32p&E#I@tgl%4KzDrGyzRaRuG_=UuKOg z3Kd5#N8+MzfoKz3KgZ$IvJx*}u;{_Id{Z1->B&pqGohq~(ndm0UJ}VS4ndGvuc!b3 zzd4!4($N5kPpLV6$QLC_vJqU3nH`l;_3TNqQn~jK6ey7SbbEP^J;@L<-g;&!r`*S4 zFd?vbO`A1_V~Vlf;`@E4kW|Y)xW}-FVG_&A$G4-cV!7_TdUUROUJIm(5<-bt->zjN z?Lq0KH3+a)pOG#3^wAXH5^COhB$)3QnbaIcjL|gf>|x0^9ISjOI%yW%I-7F>b+rgj zc*}9!+?7dhHj;aE8K6cr_+1I;(4!dXm@@~aPA?D=y}wMg_N~#|Kqu4+=LOQWMxC)q zUd`~Pd_+H(LwL=ao`6dZQAz>`^SqVd0x&-g+e!QjHUx%hsmr9Kxr9~L3dBN33A}#l z6xs4=3hLouY_PAwJABchRu?sZmtj z%xD2B1QFt{rJIWHd-T9s9KFYFLIcO}abE{RM@;AR*lcty-> z#dm%iyXQ0b6?5p9+`n#=xddaCP^UvtV=DeK{F9mt0WrF}(_O@{FfTO%gNkLRf5J%1 z2pfgg>py2RStn_|aS6#5)%E=af;5ATQqF)h+=Q&dDu*0PdetdEEMZ!ESjc)tc6HszyvyLWmLP4LOzmMc|`9g4PKi)F51C4 
zB&4RHVP#uxgaII0fKUVouVC;Rt{}mbH?Z70HQM`A@!OpA)foRpuR35FSK!&l5_n>Z z?#b?W-RHSD${%u<(X+uzqUvH^6I{euVHqTKP(>fwCXw|I~A!OzcC%muMH-jNaVBh({y8< zYQ#FqHCc%zEg)6kbM_$|x%ENKFKID#2d*ND)gfD*0C5L7H)k``NDIsbwn=Uj%fxR# znf`2hc1&>qxgz~l!T!UJA$Xm8y#43YsG@7nC*0+YDIGqiH;SM4bijGKF`@eHtwW}KrdrhHQ9K}G<#{NaPoY-~bxfQ;KH>9LL2H0_kg1Vq zCOBxqg)g@d;i`}vvJB?+er@?jIJIK^5X~LzyrsvaxhvFh2Sv!fD&uQ)3}T8VJ1ds) zgVX~oRhqgt5dYjDF-`(~m*=iXRR(TG?l;0zN(8eXP5N z!as{0b#YNsf9tUMUzq}gg3t=)ul5~ImVtj1ujdJc*_L>*H=)b>4zr&31n0l(foel{ zd>VnbW1cGj=Q@j(Hp=UG7l2DL4Ykqp;#3g66!1LG3%5N?V)C^4v5N$HN=x3^Tm0C_ z`tP_2dUbO#mIT(n=evv&0eQQ%Ll&AE)Vr~Q+LCclzs(d39LSi{aSb?Y+ zIcnLXLtg4>v%`7m#*o=0-vMWd-QyWeR|sy_t=>S@v44KO8TolmM?lyTm7S_M z6e$H|ur+pZ)|oWVeucoDvZ5)JvS;4ot%OKIh?S>R_-e6jmD& z(DR2a6|N3=HiZLrMd$KBphpWc2MOlA& z{G+#DNB>X}LSA^TL;$qsg?qw1^g^=g#i#XA(NAMRZcZ6r77u}E){CDtU3r{cYDe5M zn^DLYEpW1L4oR>0^RTXlQ+#U|F49J9H>Kny%^P+-E7D&2^oHaNBPJ8C+QF)2^v|1Z zsUIsa!)qHc@%WhSO{ADoC&=qLO0>3OdRI-;7l3MLsAN4{EK;u(vH7n6@Iu*}jCkwi zM2e&j)ZLy_Tr714pMk`Q)gkhKyD7*7fPktzS4PfjHL}BA0H*pm`O72ZzVF1%*wvQ| z!oNr2eVgS3WUKF9E93RPj)zRH-7u<2yOTDG&j4g)w)TKN-nb5z<*^Zbzq8^-dv~|! 
zM&*0A4cfwZdA_T8@wwH@(b&^3 z#W+(yo#xqTcChyvJf(rDc=|qX^-}}GPrq%paO>EGZC|+^_)st(Z@4G!LOLG=0oyoX z`JSch39S$vu6{;11&vb;gr^`fJFkD_l3xy?T;-@oUQC1sTTlgyNMt@_85 zt~d3Ui}k+9ez z*Fgc9X4+0f--k?043R*_ep^F~d$}vGxezhio+rI6pX)Opi_e+At83E3^k58GNsNJ4 z`;2hiRHs;3@GTGKYhdaxa}EYG`-khiv&Q+XgBJ2p>fe4{JZw#8!V|Uqg>hE&P-a^q z^+v$8lc^=V%;h+F2@&1~lDX0t7MM$(iDJV(!9r5`&6XbWfXX%>OIUp9DCue2O$N^>r|s6LzsANkW->p&ei`*#bL80X=W%VG z_griPf?qfoyzidQ>Ja(Tk3Rq{&hlU8RQ@e?ZZ0=q+fz%}3xaG}Rw_)Yh>jBv|}f44#l{DBACL=S>P93pX) z+G=$l_;5NM*cu)r5)PHqlo;2>#n-mpEbQ&{P+i@w2&|R4U$zfLzlp!6TpqsHp*0S@ zfCDMpQd7n?mUI$9HQUc;_1_RiMBl)GdG3zVAemK!eLEY#9fIOf=cw%Tk&5J>kQMYM zdcm{s>5ajM6+VZuRSD+!v`+9P=c4HBM@nDV6xCrjY};4ZBNR1Uw!Fe=Eq!SxxL2sy z7`7b-DI)R`9>XMES8(`1R_M`SW>e*CbLW*a0#$cLNYXlC_H0Fx`yE9mPS#D`WOh**mjDp@}BI(Z3odE~koEyI@ z;0%zA<3p!eVaWo<5Ve0Kq~%)~K}B(**~hV>`3}AKMbJCP1Ut|cp6~9gBpe1Do|xU% z4;epiAuIYuHOts0T$bfU_P!sD9v!x-NO1ZZ8&fHQ_JEbvqStt6O zRJd$TtZc3q;J`lq1-vl@fbUmuxYI~0V3=G0wiNFgvEp1Fq9Yf}_f|4Vf;Y zY-KC9kS65sk|=q^t4V?+-|ol%gm7`Ffb(3X?JH41x5k4Vyaq(A-D=dCo}1o@^yE+p zGT#*^Bx3Jn-03`Ok0g4iBpk1};`M*K@=tdts>kkQLa}lBEMd0+$E>JMBh?`GY+Zjm>~MmM%!g1FoFhFS7}e z~GJmN#J1MSbCN@A-v#5m1~x!1>=O9sQVtLuQ0t;vm=PmSKK=d_lW0V;LJ( zw(Fjg$O&4iGg@6n4b47H3j-0I3awzo=zL(_o7Ae+P@m3E7R{d>c&NwH%--Dt1C?Z2 zR#xZswisrs^AjK`LVylG!N(-~4%leu+nnM#zvV7!u7pb5e4p%kkL2d4xECamFVwOk z;bpuN%v@H-iDr%b!SQ1`5XeodbbHx;W^Goq6IUB2Wm7y7`c=P7cO$Uo_NE=g?8t7ZYOv<7u21JOJ=Q2bq z!==h?3co$Xj&fonD*4{5hOvIk?pk5wdrP>77>^oVVwXc3sH>gSsACHM%POfz1ynPN zvw;+;BO-xLErX2}_WqN6ePhtIJjpMlO(;9TvZo3@c4Zj84M*_0>Njv6sxc3WVBsHZ zzUK3DNA*YM`*oM4uUFQ^q?7zrBx!an|m4GE+O>7j7r zCp>)gTdc~6K`SJTY|Gl~IO>KVz1EBmD zWf-2A=mO_Le8*iF{auJ;VWFi9KAbkcZC!G7G&`dkRwMpzbH1=DXInd?yxS%y-T9y> zS--09$36t%~j3Js$Xc@jI!yTUrv#j)aid3N>QD?KyTFm`<+0dv2oklY2B zH0tWnaemsEFKca< zR()HstA(PYRCfTc0n-_)?eUIL&Lu%jYE!HeJlHG+NL|IYfx)qUIF#-;?<3G#Svxbq zd~m`J1$1CI3353JV3Z$KxHLu}Ge@Ulq~_z^k4VC(b4^n=xrRrcFas3Ku{k5V- zmXkaJt#&Almr=r0rY5s_9}p3-{~l*|8#ROILeefPvawIv7hIvp%~W%M+VVjSYh%-? 
z<9mna5k!Jbfp9y$OXh8(zDPkp+9=&#RMw&9$IY3%WN}#~M@CV+g8()pHDhv>CeJAx zUIjQ51f$4Gy;GVHF;%PVWOq=4=b#OGq^d*k(3bjJ6TK92)4@nDDg9%yEeIb?yo|uf z-A}SeqSd1zHgecK67Au#@H?`eE>^l`#FC9utY8+Z)`B-w0^n_uU`i)G1#r$_-cuMQ zkKz?uisHh)uhwHti2G{JSN0HHtIv}bmHG$(rRV>YX+jqDI$XQ=MVo0`5EPhw*XH}v zhN`|f4V(Uks^3xH^lAtJ5|3iz!qG-E@wZ+V&Q;CKg?~@Sfrx_V-+#06N0$sqkIKm# zc{;K^7u~6DL;@B)KyT=SZJ&Y-2jycc%k_q@l7ZF0RWze#1%TOsdm( z#A+eyCd8Be4@zEfe)LFgX@N6`_zFboT96d#h+PYh8P~`LYfQ8? z3-J}2XYtezQK7Zq)GmxVe4UZAUW{!)b(gZOX2S66@GvJ{|i6*ujC>%sMou=n}n&|nG4x1C9-N~t| z`B4-xj$CgpqEuTSxX?+3k~!~w4p5%8-9?hYjr|c__NZGFGlJsx=)VInhk53dQh^1X z3$RC#2%d11c2y4Q;R!avlbAzzo9LI!#_IgqO{@2h&hdiI%4+L$!KHrXQo_W8=QhRF zZ4+pi8&cU_I}{s<*Y$BlviOYQ7itGn7LE=x)4poACRSNxJPF*XT91vF#2QU$XVGEUMg)a2-FrKOM04Ww~F;Pa|A5<_4f0NKDre%x;RoXlA zH|kMr&OMaUM0>)kx_rb&2hYX**oERHOsxSR0<435v+qo<+qL=KX4!+NAiM9rLQx*4 zsSNW)S^{L_+#LA>IPVEgdyK+24BzXkg={O+kUkjpvdm?zaswh4ENs#DOEwwP%l{4D zYK_+hzM}iE$wg2RUrN=Aa}RSPAVx4S;pfV3*L?A1`Slk7@yvdpqC>1CXkX`-ZBL5r zA6GBZY^TN-cs~S0Qt$Ulx6hm2&VKyiYN zoZHV`c@eFw*ZNmQgO>HQ;J_8lSR zTF*t4u+y;04-g54Q1ya&f|P@04FV>E?`Yj03s;AQcjzPpO%LYq<6^Lt6q0{yEK z3E~q1+eGwe^w6FpUh*H^I2ciUe9dJW#{4*^twx9Eg(ykDDaxa}v%Bi4NgKv9p^rJvujm&Ez)1P4CZ8 zl%AD}q8^puKw|Lft21!smi->!%D85Cz!v;e1p)zyfvqS$$i_UIs~@vX&rz10sT)k< zkq_|hYDLqc)Rq)JbG;phEmZWrqyDsYH)SoM+{jfm{ZNtU2#3N9felLm&4s>__Aqwsz^fn;!ag{sXc;FT>&E^X!kZ ztp6bX)@RGP_VM$}K|1}h-`ZbRfE89!LN6z;XzckFB~djIP>1UE@iX(Q>=8yJ4+}*1 z#r&`t{^dU@GQ*^4{aa)>|I+*3g-`~{DdFKedJGzBR^(DVy6#UA?LInZ}sqF{%y;w1veen+m5l}K=$CR&%GbuL9 zmeyL~2_>09gq+77fv4<_R&$8(ZZElw>@5^(yE!7pbEs&OpC@e-raWL zNq0JA*2J6nuT_=}!a?2??&=eYpF*n#!ROen+`}6hN#Pv*G)|4Pa6t_yK29ycJ6Is3 z2q+WKE^VB$8}`fa%L|mO0Qq?eyR$|TF=B>o!XP>sX}P<$af7y6%+APe{`m@}w^+yo zy3Zz3hfZx`hN9ESHgMJ^X-DOc#rFPg!|Tq5c_`O7pWr~+UQtdJnzVLU`TW}sXDPP# zkHM)L{YDz=PYchOoX^J}NS@CF)vTc(OVxHb`5~}of&`ZaXEC>S#^hXGJxQ8508~;-I5(6;|10aeSjm9K2tZ@V zHI2^L$|t|)SiKGLBg&k3`PZTfAo71#D=Sws{(B1QeV^)(bvn(^ZP(hi-QJ)&c{kv3 z6bPNIr1T_`ZZz_Z81m`Mv(5|LG=F%ITTa+0U%@R6t3HTAJwFtDSc&)hCK;h8WGjae 
z_l3*F$DIT4D?Gw>`Vn*4p5$ro*hYnoL2hpHC0kJX?eansCn#18Ccns0nVn27y-1b) z{CqoHFWlvlo5>3)XMoRJkkU<2UU7N1_nG7dT4h;g#BDzga9Ut2qU7p!a=Zq1m2uIZ zP8%k`m5Zx^k84(MMg1TCa+aGk#*^dpw2C;tF_SFi`e63s@ocC%e)$s3gRMVHLH)u| znVFx~U_ZlLxeArRm@U93{TIClEgZ2*TB5QRy$-U9Gyc{aaMy>MVUnwGha6O0=Q5H7 z+8cML)l?Rdjy3WXY2NTU0YAGFmov+f_c>qg$u^-8yP^8e@AdeUA=^cSbf5Sk27A@& z(o3^ak~`XFyM2+)3ed03O+QIwFcb|CJyY;)rg1?p<&)4aE&I6CYq6&>Q15m%d-A^UKwhlSa}#X7kz%A@p&FKtxuiYR#5TyE3``!C{q#?2CJG% zhnuQd0h!=Zc^J z!VO&|ALB^$D$;5;u;d%o91$zqjjx~whwd&Jlo>dnn6`09Lnyi}b&_MVavry78`|*d zms!3y91Un-&P8eZ?!EV4rOlDf(u>12&F*gC4UOcd*|%Y-cZ-g4i?E^9!C@Xe+v(mI z#ZCkx?nC(9 z$+mNU^igq?PZ@PRaGsy-e^bLv9-HH3uwV$v>dE6HQJe7y8O+t6V}7Gr4Qz{?z1+9z z5em(beu{6LD4&o((G3zwUh2a&`4^V$H{aKCQ%$!~J^>l1*Op_5ciP<`V(uuMI1Bs?Djq#3PG*NJQrSXWR|f}YUX zgs;)!BI5Hn0!gq-0ifSY{)`JuuuNE;oiHprE#T|^n|rDJME7a1E>cQ!)5Ra{hC|-0 z0vZIi{H7*iUV@;A8RB)Sp_H?I5Dd~f$SSTm^r(E#(AUP|QBMC-z!X+<+6u1=t1(IW zK0E(Y-;g58Q?HX!vthxb?w%5_pq!80f7?v|dplOJ=;v&UzjAS?6TIA!Gm=!u;!E5M zMV-as!Mz~!XtJlHd_kvqBMnKkR%t(fR!~kOe92LVJb0X?Q-Z*%p5O0atoVL<(bi*6 z(LkuLz3{qg(V{ci7>#_ zwMdcirPh6ggnONfEsK$;8|5<-suKH@#;HVGdL)UxeYk{0zEP7jIr@VuOm8Rn)HKTz z^SQsAznRwemvRz24Rn^OFwMDV8>gC^mvd3b3s>3~Pj+W;H2wsS%R5{0qV;V`@nkeO z=`qiJKri9oYeJR6&XL*!5P8+1MkAE}JNS%tjEM1H!4ypai7RVl!9B5}u0K~)e9)2a z?Lz+w|J+|PnU%wjTWqGgi(d+$wTtT(Z5O4vH;Ir~^vf2F z>2AmCg0ET~!9>Pvul4LtH>)c6*rfTT~0F~<)hNLpN4!t3zFRDC?lmt=6 z9PP^a+H*jhvKms+i?mc5DU{Xg8z)A6>L^N-6(0?619$_@o z>TOT%__GDs#D??Rim4&pi1XzWXWRW&t#11ITRLs9uUcWF-#1CN-7)hGDfQ0}ieLp~ z+(ClrU8RaR(xqV)nRp^2p@f91h;Agd0JRiTC}8BXPt@eDcBdL2{y9noz6LCaJzqek z8%MBKU^Ah|2=3zoJYKoZ$|EIyEG9QzCotCRoL0c(K3WV!UE0f!PKpPEbL36%;|ln( z9U0W{sDlxe&WWUfG*QZY8I{Z% zkX$eL*!BbcpE91Pv{Z>*qAy7JJFmOkf3ja-4y=#K;J7my*fz>FqPFIK=Zm?DM7LIA z_DP02#qJBc#nqOqE|74Veh)bJm!XAo2br?A>rW>HQCw2DOKD?6Fr~w9H=$upePas= ze-FHt*!_>`-_L89GO0<^jdRI-#O?|z+psPpEqwS_cNYf&b^l;5-6=Fq^{fUZq7+pI zgVCENfq{;Dt2BLq>2XhmUDz-cfwo+4zNgDr^GI&HcL%3z8*4IeZe%=)QE(|Ag70!TtV+-tX<@b~X9%s}CHPPcKw68UV)ZM6at 
z8HlFdLZh~!xtsEZ-3itD;bfIkT!eEGa%yq2;!Pe&``N~<5gR9oa;^CigqD*keoq*5oM-<2RUM!X2fN3joQY!8tc zW+Y-DuazvP=$#^Ijsp0|oUOa8X)1%Ve8ZwLNc;mfyude)zU|5a8SAP!wx5&g_)V%3 zpa1M?J!Sin!r}np3I9bP|NF)pL!>`O^DPLHcm!TF0dj~OaVoj*k4Y@93_%#76&H@~ zDv;-W)i8*;wjW6>8FANv^g7&9s=YLIej$=B zm$)|_34WWq>Ep`xGlMItPJgND{2RoQs#_6ivblhM>Wj{k8YSbviS>|n(3EFEK>(v(>|q|X6K_7Zz?cGTIw{Aah&4+Wlr3i^U9%7;Wz zcj9E21~tjevLc^DrjJVi2}b3-czpI@?r1Vb-=Zz6QeVQYugb);miqZ!RE!9{S<}Jl z*s^MK>W3-Fr9$k=ifY9**Tv744jxTvo>rp^B@^_{%Ks2ZR{oVfF28g7-=_B849{qw z##FyzKAPLMl{XxHiv+W+-XeBCzZ)J|l4J&RLE77NTvej|v5U+{{*h9w4 zN|B^_ALEb=Sxv~cABl{gjv#2u48<*|v+v+`TdJ)A^LE=vIl6A5cyH#rCxtAHe8nV9 zz@3e^jMu`+-6VwpKJnbdj(x@9m^f%JVUI>GKF13kd^{&KVFtp84)Gz&Ya?Ap$;HID zs|magiJJYWAW?Mr;UfWg>yN)E*kQ_h)lzboI?GOxH3vX<+7=jTdD}zKn4u_R4^Byv zv|_rSJ;$B$#~!iYy|CV|cMzNK80rkCKu8wxjR3dKvm2{Ab#I6P)?Gr}+Y*fTIa#gg79Yb# z26>q&4bAbX#OYnks5a0^QDA~8*AG6>$ip{9t~ro5Y4!;}bl6f9FsDG1TZavDYDlnK8z(cKHOXqT4wb2Y2B!YHT=_-;2DY{g5VPZC( zSn5=ZAnswN_FB(Wk$+)kiR$v9FH;MAEJ(Am#Z)?`*eKz1D@+Q?Z|f?p#JAULC#EIl zl`TYPj>3|YzNu@)9Q&>q?{>7?!w%P$3sh%*RPaH!$ZuI?HOQDOJpB5R$foyzmeRx$K0qcV=2kbBdXL~ z;IaRyljk`Jpx~i=Fy-dF?B4WwXVCNPIT!e|@`D!!MTk0&zk$zX)b8VsJ^jMe&J#@Y zs3$rpjIYPQI4M5={RW2CZQb2+JwmFU;~exLrN5-iE1r**BALul8C!fxni--%7)#Xg zK2>D9HaIecNZnN~t^dOm?yM-K0E1NsgS)>?qIQfW8qA(%J$%}kl(?|OD%yl33DWyHxz)_c1E4R%)fy-j9QM~YrY`Or z(@7V5v*sz3+Y*V4&@pTld`bbM;^4Oi)BGFIA^Ept6=J^;AZ%BIow`3d3s2kc$THjQ zy9W1MX~A4a*w@W%HI}Wvs3n)HK+SaFadM&6??=sO9d=Ug6!ndpb!S{#RGN=m491=n z@m-qUeGo{CX!h1EkjWDm`Iy8~F<*&C&x~BTUqh|WVpgQlrPY^sc9iA|(5?T!$4e6D zo}No`Cvs?L)LLX~nWo}WWh`0cgjx1x)wRfHL(Yz}Y}K1hU;x-q^Mo}%(ulM>`XPxh7Cfw) zG?&%rBl~%!Pm0z-ax)w{Z;x#j_`4Z8OcM#I60^>NZ;!Leu6V(GivPr+^gxg2lda?* z{JB|?kIRmRaq7mZM;6%_TG)+ddBU~TBH&85!K>ke(eV8I3u^)#lOOAGSqoWdx5ZBd zW?`^ZV_oYtS)3{I5V1FqTV;-M8J*pInn#bNwGUUGi*E!3^=a21J2yiLCwWZ@i6jlffz zN)->ffA7JMJ_`x@xC7U=Jhfq2Y&#bS&Br)q{$PKx%5s?QO+x0fPj#^`N*->`e`h%| zzBMgd*_+bR0H(La4k$itKU7?VI`Bc>|6!Cl{}`Ys`H!19wDrxD<`H*cfHtzr3CY!- z)%14{yLwBI4{l=%?TUNJ#|!RQSG{ADV|7kPb>lPo#KIT8sET9?AI)&6F^VGKmR-B_X`IG4cBU~ 
zxSp%3_yc3GN5s&twv6BAZYw2x|!u$Md$1}`B z37V!|UYuCG!}l~!`Ah;ZaG+CMr!+FBNbV0tJ}_gMBQ97;`+P3oTH5!LkGP78Szb17 z{A+3Sh)IW(7hyR+sduJaw)!vjBawCevjIW;Wsm@G>%ZHYk#Q3)g3T-zU$dbD5Ki;H z7Zc7&%0_UdgCL(T(xo77o)y6{&eMB=2|zc2IR;j*~#CU(3RQ`;mj`H1XY9 za99^b*L2nA)s6+Acr3Z_Niz-z`hJ`ips(fSbfKlN)YF!Pj9iCD@3{z}sML1&{r&@) zkT9ayPA;7@@-U9z0_UI7it7LkC(_6F%)xM?DyhBYSbYjKZtQ+Q-lHAznpqR!-F<%p zXx@hjBxQ0+zO6xrP1@aRBWR!+(ddR@i|a+YFy<)n#GT5S>Ia3YiC}hE&^STA?s6oU zRDeJZIVBtLk6j=q1SHeJVq6 z8ui%7j%Y8O0J+fKvV>K23hB|IC@aP|fI zEmYF=tE2|msv+y^)(w6XjlCvuFRHtby3w~{TiexSs8rs#qexEz5t8KchG6-1w$~UN ze|Ur*NNmt6dQskXOte2g+=G}QiXH!&i7x`j1efy6f8Ifc`3vq2@11jW>Q{Be*40v5 zR(B>Tf=ow3f1jqUiiYRmrdAD4+~u@-_B?xK(Iua${v#a}0ZR{S4g@KNx?d@}H6~%w z{UfN)ehn{cnE&)XbZ-HYK$xbpHX9MifIf9kaFjh3C8nb)$Bi*`j1+suepI44pWi}> zU+6~!DBbS*5{gFrkQG|~eOP&Q2atJWrzxGx;W%7jjKP0k5?_Zq)-8rUt)2-01O00- zFnou8|Nf(4sOPE=qz?bkA;(1YP!R?WsG9L0<9GF1CAbN+LRCctX0@Z-QYBT=s$HFO zt;_N&4oF`<<^;V~LrKU~tS2Z(e@-0L;%AAxQHnbSv}|C}e1wQ5>;IQ3v=BaW5Wgor z!9xB=e2>7#u>W*m=l?;b!k02|Hwh{QR%Fc=eW64bAE(g>E3FlE!q zxf|Lsh7+oM+gB%RQ`pY+va}4^8z;jb!w46+3!c#LmHq3^G*C90fDr@q+ONDQr#!xi ziAk--!ysfSo}kAFI3Lgy=3qF(WL(;BBVQ%hBSC5orJ~}+> z(-^bmvK3_wPXG_$_ALO{7%CMLB=F==NVPG7*ZGJsVVYR4!^4y8dNsz_Q&ChliHBni zOk8oHgTmcJ2$_Qj58OI)*cru8kwHB^k+Lv;ktms{+f5OPCe_=N#9QXYwoUA)5@Mj? 
z+39e*QR3KMSiWHKysf=zKH259zro9NyKm}SVN&Tn7iDqmwvV`wi_DMv zMkK2i1oot$HAxwVeVFJ62X}1FQ8NGGiZ8|CWXiINdut!CJR{>Nco06kSB)MXDT6&7 zS1sX35r0?Cgr3^*%y#VfyLsp}zCv6O4KiQ>%;xjE$H3&u?g%4#VrTqHK>LaSKU6@H zGX)YT`_L-2cVRSj=pbvc18Zt;bZZI?RfP+asmMlGFJR2KoBbGd_zfjg zfD+7pp$U(rW3OOY{2{wFN0NMxrY$0yo2hxi_i4S@oGf0~Yf>1accbItXk`2GF6bnX{iy6Uv5=9>N{c5c|Loo;>Zg+Kye3im#&$?bz58zf;vzjPE_RKK zgoBeK#rln#sMsfGi&>9UzP(~ZDJfC1U}OB}mAQpPhV7?M{guS;Lgp}DksPJWJ(+R} zCBMu10L~wBZPsC(G^X6+1ek&SWwGZrFLA+)k+Aqg7H43YG@*;H#%P1AlzAfJJ^4#N zQr{J%zR!!S9c_9D2c?qQS2fPw=XH+v0m>J9U!f^mzDHUBUDIr@!IJy%N_>T>|Kf5; zPBu#Mau@oOW~$hQftK*07Y$`);jITx77R)b30v^&^Y!45_9`vD7&6r}>r>ToZG$VH zEpFxj2G8Evy)t-U+BQ2F+`O_1wcOhSRofo9GL5>i5|kSlzcx|cg|rc_dU@adS=gLy z$O&2V-aK3HXm{U$PPG0@_KQ?q^CWtmkg;`IG}QcHcYh#%f8ODZ4Y^-`X|Pywd-?n1 za7{tGZu{+?R`=rO8=xX}`km-MRC8t%=|9U<$Boa6y(XUG@AC%*-_NubXU*#5jU4#r zw4cqvr^7%KIyS*n2h28wiXJN20%Z7wR@VR2-rz>8Mcq)~yIJx*(p|{n@p@@q|HjFQ z`BJ9U&I~`AQl!@9FF8x(kvVqHmB&lJ>!3D z697gcLGn5&WIAU}pt?VMlSjA5one5c&ud1n*Q34~r7$Fd&Qhw$EQ004UEro{Aym10 zDJXCJTZ7+|i!LwR7lNcN7L*%|kt`liHtd?Pmp>=}QEc%%{GsshaY|pe_Cu6&Rij#u zHy6of7CVS`Kyo8Kln*Y}eYPjTy2J71XhNxn^P_tkjXjlXA)7|-Wk3(N!XAhzq06g;e&nt>_MUirzHA*~a<%8cbLeeX@hs}iL~Z3MVDc!)3HFxvlO?3Kxm>-vF0qL$ zzFQ4FknASRC@YYZ{`HlkNgiY1o#jM`l_X*UW0Y6L9#P)|tufIcyNMwpmMaM$B3t(d z{)L~HH&(x@qhOEE-`CH-sR_Ymr5Wu{!x;Dh(DmZaXBgukxHXPiJB(Gz+=cGm8n-4; zob+YMyu*>{-|)@)O>g?spATX&!dU@FPavWNP9e_6_PCK#Vy{*bLZvue*aBZXeul_~< zOHOt$`m1=*^ZW~sZzv?WUBN4N$&V)(dw^OJRt-x1hYNK!h@^00J`$V*yGo%&a7e^m zFA&X{&A7R#oPMMWvC^rxr{Rze)lEQA&Iym#e~6j&bF)IxO(sAOp(E;3=&N5z+;{Z^ z(ln*7k(vLQ5ekP|0OB{|%0ZZ4Rsm5DGc72SEFjPTyxd_5@Ah52_FVvVX@FEb+naF^ zx&o^M2KJJkM=?OtWw*@Ff6e{UcX|&h0zJr04>w%TDWFfo2Zc0pu6^yz{Zml z-uq@J^w)89l9$<{O)Lx#Br<2f|JMI$1>>&c%%{f3HKoI?Vc7u@+;qqQSXu6*ojF&# zjI`Y^)3%4P3)UgCy!5PfL0T_Nm-pJADhyHG$Wv;Ut9^jjF(kn731b0S7wBi{B`2z) z;GN07Nk;zmXFw-H!}QnBoT4a4!rdk;1k|i-kaD0CIt{tLx(yfPL-LkemvzWv;Ci9@ zPx8*Ew}hdGT(T3b7Q_1UUJitP`DaM+?RBBzem6#l8w=!D#Y$R4* zb^tzQjeqA2*8Snht9vGIL)*C@2s$ORY69U-m#9vuCc^k@GCwTt0nuY7auzfv} 
zo1cBR5J~3mEGOVWxxE)aArFn`+0xoew36I3(`FJ=cgOvVr!Zu?`Anxq_LJ4QMz?AY zm2e2CJgoG&K&|f8m`uAHd{tbI^}d=M_q~6VV#K1pxEc5fejxzd+}ak&eiRi=S~YxW z=Ai;IU{=AF&bOZdkq5M&e{6s1Fym73EOUbtKJ}g(CgR|9$!{6@1JieQ9T*t7GY8Ox z6C*26?33`@({FMAX%&>csjIu)?CJO6EO$;$iK=>DSUBGm^rE%v zxB+>ea7&T~r;@ml#P}Vm*1QNj%?dOCLuh1=>xfr-FMlI63`c(1a_t=%4D5~bgZ2zO z=>bL4NVm2JgNq>yAN-g5D!;&2^roeaKjbD_mZcqzoabiiK2-Gug~ffyfl)6z{~xBu_1%ExXEjre>WQ6NsR&{(#p}NN`N0_WwpF;5vLUSLq9+)7YoK&16Z#o=MWb;3xw8<~a2b&(Qu#{b!811{^ih{a(33W}tarMM6~ z8Ow@+Ctq#}@n_Iq__y zD8skJ>w|uNC`H+pfP_hKG`7loKytkRks6ptUYdEIEL_RrAXk@g*J@3h>ya&T^gF{r z(uO!)+um>A@J@uE1WLw8X1O)yAT#RAEw!~JK&#!WkJ;^8pINGI)AluY4A&#_Z@*sT zpW#E{*_0z4FWKaq{eY-kx%ohomh-1GOD5IKWPF)TdMW%!%TwyUQbwwep6Y-1@ri$L zyd~~~<|PPEbkNSZ4*yO(|DX;Tc%I$-#4$6}jJe)Kj}~_(-Q3xE7~3%fAi~4FmaY;=E1{!NN4GJ)*Wg_Eil$t^JMHTYVcSY+}?N z*mAZMAn4PVdH%%W&TRMaV9Tgii1Iqn+j_56W%_-DitG~88!$yCT)UqwIv-&17?S!v zLI=oTtp^nel9GE3@SbP0PxM|v9sua(_!l>zzP=Xt^7pVqR1xdu2w^v24anwG;N`3L zNPd>JN?8z$CCm)Tg)Nw$POLr{ydQpcYf7!n+Wd1g?Ug)Fb?(}Z{o@aEs=`v3 zoby(R?NUpNu@{~!PXJ4m<3l7s(MTmP9pnz(GT_qRzU-wU4}IcaZyy1h%n*W@p3aVA z&JXn8(!7fYA~vvt5(arG#cGgJ5}K+T8O*boN?DcX;cCx+T`;qvME*lYwyPJB2ibAo zOYKkQi=fvYDXX}{%gf#I3jab5q7rPE-KDGzmNB z*4oa(cX>)k7Z$kuI@)njeT^?|N|RIbOEFOW@;w?l+#`OOZRoy$+Jk&b6pBMYHl*PM z3m-3-cu(zj-4u!!-RP>$fK>Q}a1iIF*Vim39O-vvh(p*3QC6&MS<< zNQXqRakx%{f9G6+C>C_fCSAu9uX1@sTIRYNdl-p#P0EUA%CJmhRV^o!1{_o_nUSmJ zbFvfOEFXGp!o;0)&@=X(Xv-M6pzLv6aT&RYu-D08J9vbBY4@Ia=Ik@@E*Pi^*Gu5) z+@=z#*;aAUBpeR&EZsh|=sg+&IsdG*76t!tiMo+n!p*K;T_TCi*N{cc@Fv)^3lgQc zmijP7l`b}@lDp^V@w1^Y$w@0ui4J!qz=mgJ?WNHMK|$~lF3WS$0SGKqn(Slp%-1*{HOt3ax^?oZ~c^*63 zD6%Ab-(MOl?>;44Gc6=&dz)B)sp{!|_~xl_W;&_gVm$NDhvCPR2oX91&ZiaBk@hFp zv-XGYXV2&Z9|y)JPP1e;P$deBZ+ma^M4dHwKLiG4Y-^miGetUF=t+Mb9jkA|riBPe5rsMLR2CPk)<0iU7y&-*F+ z1@t7JgXu5a$52IA-m_BW-&t7-mk&kx+7aN|R-6p(p?)9Hp!~YG0XQN(Y#3_#1%=#Vv&wMaQL=0YD?I0oom+P2iIGVLG zKJTp%T3z%sQjnH{YcG*LYt4wEda^qCf&~eJGNj?!qQ9N$wleK&>Wbg@v4+F5mKbwL zTBz|d;G1@6ljQk$EFnyeYxtzGGf4e${%88{ZbCC<$Q1d`lHdL0xv9Uz9tF#F2{DQ%s#YOaNPW3;`rt;J?G{+ 
z#lYs)o#0Wym-Oe;Bw2@%Pkyj4Hth#LGyx&i^>Sn!?+TQPegSyI&AF$ufkt?A7?{?p z{-^u7IFpN>=^d9U+1I6WgnH`Bfgjzf!f=sx0Ln!jzoEh_@ow< zLIHj;5wKfap?e}Hbs+*KEm{~B{lo?-N2!FaE1D%J>B;*FQ!MsjSogv~aLo9mIy4ce zif;FGYc4RI3Dm@ph zjmULD$h5|8;9YXs`7f|ZN~`)$8Mae+XPK>fh3$^FBoPPA40aR3dAa#6w#2pBeBfCZ zQrn{?BhC1n%_%zVpx~^VAj|+$zL;IH0JjA-FYP5V>Ad}My7)*avGNdWRo1X=cXEl( zile;?Q*0b%s)CsH5|jMD#oZ9Zr}a2Wr9Fx!H1zO*2Wg8yTk0C&H%7ZS#a&UfO?Eov zA`f1cT&lD^`-vF;0;}*@F0%c$8{sEsaZA!dFathr{UzQl`%>P2#L{-c>sM$2rh%h5 z3ZxUkY6&V3XeigMWG=cLM&f0nbx9dKGAzZjTpwciKH?uhGZplV`9-2L|1oQc`@!5d zy7#f8qIhFMV~Eswy05|oA{d+9EsRRJzIh0*I@gF4362WYEea{U57U$1#KRd-yt7 zm_WpLox~V?{@;0zCntF_agg~uXXMkoFNa|K&pPx%RQ-Hb-(pD*$x?%8erf<06q}U( zvjGEHfwx^8a|3n7hCJ_Nc~^O?LJWGgbnreg^%zS(v@u}()}$pIS(hc~NomY8om1Vp z?N7VLDZ~W{`S<4&HAmg0Zam@f^$2psub3B7d{{k`Q%{~UPl*uQz!Sd<_BEF=zf<*s zrJ44tmj8>UtBh)^Yu2H-mSCY2cemp1P@u&r?(XjH5Zv907I$|mUfiL$6?ebk{nq`P z>@zcu%${-oW{3c`fHiw4SajGAzyw;!BQb*da8( zp|Id*(^8`lvlTWMOcc}dngBQ$(rQOUU{$xJ6n|HR(s&$Uh$CYX*eAo!t z6Z;UZR=#;7K?b}wv)NNHU@es;w$Bi$$;%aEL<%-TNMacq08r9rQS-;iEr)RD)a>Kb zSOHMD ziIIn0FuA2CZ-MKpjPG9hvkMqdd*sM9yWh{Tir6)AbmZugS?JhStUafoUaF0?mkg*l zUgnuq8{fawLL@>A{u3`dPtl$aLhv)Zc4aZZl|hI{oG^~U8suxr15?nSelxssb4iu$pN2v{_3J7L~u^6e?=@N|`03qsdo zu_rCccEJPu?Yk2gD42QsL*h&a+2IEKL5oZj;OW#wp>w7$zPMM=%RZuvEa;S1uyPa) zli{zcNEx4c4)5rr;7IRy~ddzF;qnB zKm@A3skp5lrwmElH2-~%h0QR7biP3cEarbC0U9UVC(<;8>qR1OK{G$4AUH3vCt=Sj z_PsP8!*cn|J`f8hcB8NBP=@Kn3CQ}R?HV8v4pxdGGTEx^EGOet3i{u9>9_NtQ)> zjSiL=1s;jncS>Gk^n}PE_xl?y#wrme+V^K0NU>e39f#SGyM2578m-Vqa$im*BS~(#riB@qZ!Km zaGFubwfU!x2_JFsa<-|f=cu+Sb;r4GYBQDZ2$LkkpW`YN7`}Ovk zY;tqb_gONuN%%cCW=S%)Krc;%I1rNI`yn)Xy2#MVgV zNO$C12Jkgy=8sMbNVWt{I~`&&cIUw{Sd=pSzZU>IKcJZwL2G&Y6hv+u{UgAd>L|sY z-A0)0=&wG4@Y;?7q{7eiAY17N@0dR~H~fL>t4Tx5}%KZ;HZI$UZfAO4N$UfZD~H`)!I}3yqT# z^Xb5fS=hQS%uZjNdn&@S9!D_bAz&W_w_IdYK19tJse$Sa?8r5QzzMH?_z}S)3d&;R zI2mXm{Q!UDVnDS$2s=ub_LiFDNakw`A9qz&g(~{oeyu(|nq(FF@y2Tl_9hgB%n` zq5JxAD3Y51l<8qk9Ouk{bqTBGus+9(0`1MQjvKS?q!b#Y??MIyZ%$>{h~z|ZhUnuq 
z@3faGnB{609O$?KGg-1d+|WW!9B>I=hZ0aNCwCL7M0t{g$?*pRA-IC!>CRS7JBc{x zZ)I6!uir@{G~oGSg!f{*7CUP?*(0}+PLUcb;!(l=SEgJga@=zzFad~8M3+TMpx>RFTnxP?b!DGc;QZJPD-4lo6Pa^i|uB( zS$GdBc?VYSb^eL{m$9`*SO-j?T6jf4uW}dmaPTLE#MV#s%B(u?LndJ^Py{E+J@dw^ zBfTi;iC33tKf#<&mu6*SQyse@bm1tpE1h=2Qv4>&4?>R=uoC;`9ul)eG?nTbXf)r4 zs+yy@pQU+IeG-z&^%($@#+~|@xw0eMPac+L6x{qkJEGy|z!P~HLK@t6fHSxMFU~w+cZ{F1YB;7gHY0wGZ`7g~qZ8v$;=PCv_WTvij z9>CuKOu7EpHJ38Whlcpbp^KDJMrab4G$$P2_R9&#_5Wq$3|0a5y$y0k^I#C6$|_GU zj(@s<=}0h35$~GQ2c8bo)f`H0cm`W?&HBTLzKw~dN}3zvbRWCkV6Gz1cn3~y7@{(^ zP`yP1#HNG&B%FE-mvMGN6#@k2byMNOAGN+|Wl5V;` z8z(cpdsdt1>G6yOTtpTlqv`uUq$01cZENOd06{XEC$&!$o8IwZ5Bf}aNiQ3WuKiO` zbnA5zvX`?^g83Qm^oDZ~}FWi6N!acDfDx)!4s9Rx; zv8Rnc^1_fahCp#n^b}n(Ko5;|@9+1Z5(>kJwlEkbQT^_Q9jmV`BpK?cj&dztVha9V zaLXbbYJ-em1P-UuXjZWKWZ)G`vQD(HqBc=LH(7h;)6Z+$uB${C=ii0z_o{haMk80t z?f)WqvfVbp1Y+tjC1SYE>iVaXKSo~^y)qVM`y^;?45RNIQaVY3AfXqt0I0cI?yZQ| z>Bso3TUR%p={C9Z9Le5MjkY`x$PnnK(YDz4-G#$Y`1{>=v^_ zTI(^Vk?A@;aNlKb`gf(OtIV-XR?(Vfm1El$;HP`q{$((Ro`|8w43}%?UtP^^wf>^R zBJ*=sAX@Jhg$&=E<59gi-^P4j=yuc{T@37C41W0gMS#DJpL|7W{gia`^zOZJHoSHT z@SBIK?2j9KgLTeLFnFd*oCxAc6bln)WaO1i* zaAnPHg?s8=>!6$t0R(e9tjd7X!YXx61$R)Op)q7Fyj4Dg^Y*;1xzipJb$6De#4uKa`^mt3Hfd{l_VDnJ_y+ zG2JS+;ode6aWqe!zgwd<+b`iNAt)=D{2n*w+GllgW1=-`*I7Bd!)s{ZoK$8pSz@nP z7)C1~^Ie@1qtVs|e=5=Xt>e{nIiJgpPpQdqYMrZMUQXSs;W)B<+t*mRs|k8>CXC1Y z1G0Uv_JDwfLscuaKn|w#H=w7cCGUm?HT8p*&T>)7^veubd>DQ``Mc+@K4z41Ys>8i zjg^(MiOL$OGOX7jHl%^a|8_8iO4M+?E^Vlag*u8Alcaf!gn*!&J2^kC$d|^V&B8{MnxvTz&qhoRd)q_WsTs z6nXrsufz$fab^NE4m_7bG%o#De>PXb!wd!*so1ipQ6*)5SO%e zH%_|*Z*fn(k7($18<0kSRP?fJ59(KGmxaoho~SoCphARUUBW7?x~+}nxmRJ^Rg!!MP4`(5cwr;7o# zRxkGfzA6TdAoHg6k({J*txqE{-#Gcq@_-q#CGiJO2uSwrJ!?!tQ3>)8)O-)MS>J1DduEV^DPXhe6I{W1?x||4@IDmgdkH#Q#EuY}qUo z%&Lt9+_PV_cV9=S9*s+m5i-qq3R1~sPW)XWM)$$hss{n5kf`6Gz4zF7`rwZ zF-}_7l&4_jNkQVAd67U;++VwwVVVWapZ4+z$no~X*r=(Me7}$&DWxD=|LkYA&@w`a zzvvC3d9FyBNS*|!l7D0js2RtlEs5!gqMTw*IZH8O4o}fZUPg74rZExZX=;@HP~(Qu zCwX>EclMVg@K4(rW#@7B)AffP=%8*#8$*=uOic}~{SzY~pC 
zl%bG#h`4>5=J#>^r2wsh)%_@s8{n502yeI{9Qdo~Z8%wTYvOR`VLt|kX%O~{Y4W$X zVUX_MfKOlU_j{n>{zimj@;6vRe#`81u2-6cB#!=UMX+adQLJn5{0GzS(EZ2Hjyc^R zl198X-y8w1n}x2*^iGPje&_}5A?y1j%Z06GFyqz-7pgM+ea_<*kZ;$ewA@xq#pB&j z`1TMqV2}SvTKhEZy*g;+N%A3TfAV=qK8~h7+~d|~%x)oog$ktp!u*k$Der^?9S-E0KPyg*<{dzba?Z$9oj?H3&uaH`zK4jRQw_pw5rW<>3Ha+c6(28{&lvMb$z=n}`=7F#+0L;OVM4Hg-ANex_iZQKhEt5cI&iVWJAWWBrS+8QGQaYe zxxB(}OLZsFqCdDI2tb@LE>eZw@!MSh7(<4IwVJKyJ;!O0In~Uk%uuK)CDUyKCW_%q%nsengQB$!Rh#+0z)it^-onw-V>tq zBPsN#vh$#$rD-dU(0S(*>RDXMEX5JgGSBex-msuPK73L=Neg??$ZHV*8x=-2{vpad zV@(Cp`xdl9fQi~6y<7?f+aLH0=|2X4iL3k-_@qMHK{9S-2JmB5{{*>5c z(>HjvjS+|l&7q5OOC2$?8!Py_>atiO`Egayk+PRC%gvze{hDO22f@h)EF?}=DAJZN zd1?Ez9HPN<|IkfHJY7g^ie>s+2-1NE;PW|^n67xeW9~6z#=kirNWTqZ+l$LWW0u!2 z#r>XCg{xPi^USPRk-&e>o4p^1%ibh|B zI4}IL)>eTv;@2_(Oy@rXCbhI;;ZN@xH!Yz3SvEa;nLPvl+Qyak4lBiKx$bC8#FksTE%PzScdOYIPPBZ*XpzqbzL*4BVmwFF_Br z?qU}hu$bMwD8Qlqh_#fHbqet*&@t?$f^L79$e1J3M1|88MVf_HWV9|1 zHVomhJ`rUJsTp)Mb5+d+$vBxGr$G@nP!tXd)G)N^5&@KcD=a!Fj>FWX)16U4g{E-r zCARjz0vY-;K27B-YO^||#u;IMEx*2nRS$_R(QCSlP{4Y?VU5lp)p6}W=nOSuzInjS z@r-3P5mfwm<6hcx=rQS}&*r6M(s~U{A4Xdy04iV(TJ%=?P0Rmfmg7&$>`3h` z0r>OIvGc4-fSopldmC3&n1~@R-13Sd1mp0h=u#g%+iluy&D_t9Mw;_fp1)U?{~Qo(vpc#!5+_&9TP1jZ zl=gC>xT|rI+k=3H7~_o>c}Ic4SpC2$$Df3qS6>EU&WDa+2^_OC_j!FA7{HmNsfvfl zm>FDN$3fxg#5b5zDU1`PeqD>m66(2*Bag(#ZCHwws-bFd$H(n%_Joq>g@L+)yKjNo z_-AYXbep84v2C?Mxj;*G#}+<~g~mB@IQ`cHDK4#<-fvB22Pe^H2NQ-3VnQHuqzoT# zZKle*sWa>d4FyPAz6;{g872O-HzCVt+>EyuPdl#&gE@lgsNm1IeDO~*;j>V3+;=O~ zfZSE%!3e!-wGfP5)r7_GiytysL%7RURBteBL)@d1<=>+mUsp9GAA57G!E~(_bHHaM zPO1^nJuA^$H6TXC^jw8a!|y!a)=aDhw-zaWnKs;N8r zaJcikbpx!H+g!i78%|LZHlOmGj#TvY#yZh`QF)&2I1es(IxlZ>30HQV5yb*fNYAxgx z$qhAXT0wQ=gI-LIl%K1oy?SH%RFV~#;~FAv>`l5i9I?~9 z)0xoX4noO~TVh?=1z(8s&!W%6-8=igsU4dQnLO93WfdkbP^jP7Q6krtfS%z44LsYf0FLN^r|td9>|Vl361hAddSi7 zYGnjVtN}rnBi=vjbGUR<=VA3QFs=xWJ-oDwc0`(fzSW%${H#LoPVzfHrQ}F-|MB2% z?_ZV_kfd$i`K$dtw7K(Sgl%NORzBkPmJJdgR8E!*ri5zDib|dRsrAG~W0qgf+bhZF z?nhT(b$NtOfPdWiMONk~%^-BNFNEUBEAa#MWh$=VCZRYcCw>w#$V2PP9A8U;ajJ>L 
zaXgbZ;lo_PF_pkjTjUWwk|Cy59^2A`RE~V(pJ_ht)mH3{GvD>Csw4A#`<-HVokx~y z-cwOW4A-fT>$b=8rcWAJHmM-&Z3A%xl};}G7!Hj=y8x3HIsBTe5E#2=^ZHAzwtefS zfD1$*hzm9=c-B>)B#qF^Ji2mF2$eolS;(CVz?Y^`EJaz?RAP?Ujk?LlHl|P%EfEKD zihIyzF)HL)2IX>}+VZm0c^Bo`;10sknk=JNeSME8b0rHnG`nuM;UH$K1<{MiE`E)f zv;B7#8BjfG)AsP|&Q#MjYK5sI(f9T5)g;Sd>v6T)Fh-{1ZqoC8H-Sqxihf3thW?4+ zi3;^|to6C$;(B^-;l6fMU+4>5j_;-TlGD5H0MOf5bG_RYI$K(e^qt5YzN%E~z#Gzb z0;*PMgAJ*^i3oEJY0etD-y&a`L*$Wi%gej|124mgihwA=2k2N38G2 z#%lbR{tF`doOX1JOt91)rahv&S^-WYD$enl@=;m!ex%;h zbjyzo3bt0K3Ik8RTmB`uBii-r!DV9zi3kzeAZ`ld8LVK0UHzQbD>r(|hxHj%w(EF= zgPLWs+^fc55ib&pDWJJ_-r}E&J0n`G&!n>QAHLG-M2Mb<;3GbG@z(56$)Xs(NT%ZY zf8Lv2_CW9>DQi+coUKlx!wOMpL;r==Sev@Cqjf;amW7PfoYr@9B(^hr{{tCxxgPS()O;h>nZ!{xdrk-?abO{TI>q=@Kl8nL@A=BUXDkii_ha21J}{c=!>DSiv1NLQXJzZJJ%n$h22Va(jUO_s zrzTz1-z(xpKy?yvv>~NKKjJ1I_6&lJ*cC$Ro2Fq}8gF{rE;WL&W*Zj_b#AV>Cbdwh zK6Xz(Ly_E!-wCKVfNbu%=gTCozU6mg_}l}mf?Y4=ttje*et1Vyh7v9s-6&{Z_OUyo zj?aceF}+>7o|CSx#YFCCyl9J+9wMByV+zdoy;6X!ULDWP!mRHa_#;n#EhRB#cwy8Q zH4_-stoWor$mw>EL*aiyX==PqWLJ$J76$|nWx~XRC2C(M`nf17Rli>Ey7&e`JEwQq zJx&&i*8~ubKe+lSqx(7+yk#m9XHAgiFcHT^lI@_U$&*aWpuf30lKML*cV&u1hoAwz zZ8957>20fjo6*ApGow%}t2!~gv+NA^FR0ikj;{&2gUtJJoLZ=kALOCM13$n8Lv`oE zg$e7++ifp1TY-amBVD>j$r>;E@JuD{gNB6uB#zF(PXuNOuf)7g^&gP>MpYQtDpWZO4#yr=4yuNGxck7Snfw!vzy3qIC zzhB@|t~s~d3iE}(@Ai;$7gtU^%QDU)cKO~ma}hmo zOx0coWXuItIL=Em_HG({If{z^ta-pU_X^^>J;6g7%yOz#Tw72bxzfP1hmrh z9GbM~kTDLORBXnV<}~kxRcFlK1TI;lmZw@5!}-gzvrQ9k)ozor|5jqpHeMrSFm8RN~O9 z^(2L3VL-jpNq@6Y7}asQ$?Rdb9HDde5;Eg3^#GO_uUXIU37-L!M>$r2IZ8G0vKxeG zjsWWNYxs&8gw&tyRqPd_b6K(iI(C63)^&6S!d=8lP@b!bhmL~9Ez3KD^5D^WBF*hL zG;2DUk13u{Y5U{te?7!5^$Tp1XqMAKY8xv%t7fLo( zNv;*QOIh*mzZ@4mKMW+O!=rudV@QfrhU=2*k(1l$n`2{`&CRX$-X9?K#IfGs)}(JC zd7O0q&+8I4m>)Lq^Vt>#Gtx}#5n28VJ)Vapt#LBl{X|yWbl@zMkTuP(0~d&?N5sFj zSAoRexkgQSp2{Ps?{b{kW$qnUp>O1H?eK(FNY|VSV)WULE4d%624*fFQZiO5M**UcuM<8&fBi9UBEMpb&x<{r0F*-LN8GtqmuCde4-0J1@iK##Lwi_aOuJb&W^J`((u9Q)a*%vP2s54VG%Jr&h 
ztITPKKa}d{#xBGyIAbBV8nL;UMu8z|LrPTJS>Zja(*=7$*>-gzysJYxX?JiC{5}9jqg9$D(&?8`_4>tx|B=*L}GL~97+^T_K}BLe#vjOlPIM^o-~E= z_sDM9`A9qG`6Y7Ic2vqn^5YNJyjyGC&OYufX`G&?ZscAww(P7fk-~q$4?Dps-v%Vy#g0(iFXvI!XRZTt>;~<)ETf`*rz;Q zX)^g?(}`s>{xZP5qZ<7IH4d10kw-~K>!!0UPZ-LmjvK4IgmF`9F*-m8e#5>0GQrfr zg`6_rFYwQ&G2ibCbyAEF>VpQ)|DBBb00H_T`oVNeSWdXDP=Ua@fy#qk7bg>3Pz4L{C~`CUwL z!%ZQAMST3kX;%7}Y3m6)gTL>YSi2usl^ly|MJfhoU`|6pUyUwjYhG(*pK_xUXnnrY z>U5#82&^+sO!xlEgmq86w4_q_qSD6QqD2@iB8(KL6XW?41TNGkKX#fNxTP7YdnX%L z?;pXo7bB1z1YwN&GOF6QJt_2E|CSBN*v*zG+0ELb_05(|icaeA-?unhT77m)(CPTF zaI>5*9^VZMh<8>ig!_Ghxl(b!m-(S?Qb42JstJkD>rBbbexi)aa{BA@;vl~#9OK;# zQ&)e)Tv?&vg<3h|!~;Y%%(^=EicZ6ZY`H0ZVrG!`k^5Sv`~o;xTd1W<<2tVHV6yj8 zAbI4O{GI}8PqYa%l;$I08HbhENF1EheT)0g zGBLh|qH^||cMsUHAQXy)5PO0gj!MG>%y!inrVK)rt}fGU>vq#^%te zDptNWaz&vu+ce}rfcv=7q^iopl94Tr{s9Jv-GF^y!23Yh+|Cl@s@i7O;#=+WdlX&q z_rf-pgsi>{ZPH+CLxq{G99hQb&t?*d2Qxs3aNJkZhyC2aDq+-u>BIQ#2N9?xF9G=_ zKzE}XGyucSk^&OzJx_pL437VB>MWqlm1-_Qm>IO?c;0DY8~zWBQqW4Oo| zs-OHfcD;F0;`zm4h}^xx>v90ptTz}LzumOzN|f!rnMbYuZn|`BEfqd7jTtbPp6Q- zB1D_8StiGMT9M8Bet)Uw8(yRK#ULce;@&-|5L|ir5YY1C#NEuK(MWL5co<)$l$z=q z21`w?Yi0U0G7usXLEk5aP$(cZb$D0{n2eJUkkN{6Q34ZbE;x_58|a{N8?k-sJLn5} znmB{Ae9Pr`6@DA%ywRRmsbcD_J@YLWm7&FVX^`37?VfH&EWp(I-K(|Uc%}9IcadxV zC69q(jW~eXY(XQpI%v-Gv4$NPq_~D32bj zLR{yt==fn185}=(z{#PL_TaZ0tR09K7}KIrDi58cFa+gGZCwk##zF&G#yGFfBEB@H zFgfXK0Xi+-KQU&bMIj*$r_7KRYQWzQFr0mvVd4K=mflof^Bj4PvwyY&cY`Y%Re*+C z-43R(@|8b=5<8hxaz^(DI<+2O7QJI^e;7HlD#(%!((Wuf6=~$nBJI*pFR6FognDgB zBbV|sf)s%P`TE3JBe@mq!6Kc1zd2S~wMF2vrE-<00H{KVeu12(kS;Dz_)da z5qXH!G{Q!XM7MjbNzjjkH*%mMWi`^a^HJB7)4aoY_fm!HsTpjyb?;bx?JKA^<8!M@ zE|bD^r)|TNF~E{Qc`Kaug#>2|e?o861AD za*|IBA()pOEF?oPxIOq~-rB!TJFw2mg2vQnCGfXG6!}1;Ooq1A=VZQ|(Vra+1ZlDp zee-7{3mRxHcY%)+$gPalN?2&Y_fL?2eG;NTw82JQgh|zb&3m1t5Da02EG>C!mof`v ziCj4Gx1ce;&OcbV{(2)ne8qITcF7JRVr6!+x_bS*TC4cM+4(S$8_s9B=KB&U!4!eOTs9+E<>ohCD;IrRPXFa3}PP;JJhvuC$C8o^uVD+6#OGgy!l5>rneH}SQ zCik_32RfDIvuuB^Qvs44~Ybf9SW(T zK(bs>4?5j0`AoN1ac}!Z@WUEdybr6XppN2IXP55o;|6yRJY1m}h%`5p4V6FsYkx%z 
z3t$HccIShHsHq74H*w(~PG6K`eo#wS`(9o>@Ilx!cG(ZSCZ`mlL*KV%qoD!7COnKn z#<4&4CP3J33V#flV_GUwbW}%E9~vGh0{7c+cjk!Kth}FtsN&=pm4;xWK{&SOKyk;? zNmSP_?QXh$qWk@#^vi)_^HgFiIQr%Ud5}WUh@zoZtV1DP zo4;ea8qI)=UE63ICnhH=kZJ{i(@rZlc6k5tevKx@;9Y*3gxyG1B)Ph|+jtteyB#9h z-pa7q%DG$dc9rEnVY^;3BYRiGR+nD7j7RMt2As~7CNZ;(qL+m#1ZmoMFeHtz!CA<^ zr}Tt>0UDVkXjG)__tPZz^(SFRg#t1wf@ihIvF;H(KO1457|ep0yyqhHz~Y$0Fd>9o z1iEG#8!%&1+BpwHW+>iLu6Npm@=Fo=VQ3Bg~1+KOqix#Gm--ko|#?ut)L&XbC zPm#2&7hz7O_A7L8&Tjc~9H*y=&931s@c0Mlj}l-?Fhab<;+(tlpM3k&hrX+>cmTcEopwRpQu<|; zwPjyT0;PS%I*pZn0BEor7TN9z`s2OD@#=yOG~jx}Yv$(r&VSaKN2Pc7w`E{u%7y>@ zFK7F3Ersv)@-}OkZ4%$d7{BzAdC@(Fw#aJXB9?vpqJtMO^vdUfzw z`-7t3B2|?HX;*)=5`Dj`RibR@fQJ%sFety?i&da{6iP@PQEm87@SbdzoqdFu5U?MrF8Je4;mxlEq*U3O!+hA zb-!MGzeo4B@?iCnz;FT9ZmKc_OE1;?5}_hKYWns3 zq}ytiD*|uiIi2i;()+QsGC8;CPtQNg03#W^d-bO<)fLuZ+P(>M2`?6u2xU(s33%#1 zh`^9fK@A_OKLQu-?2vy*ErFlx1MzlUGA+1*05xhTQ)-yk0nrdy14SBAJB#(Me+#&E z(ooH#!o1yJ1&i^ab*Kf|e7Y)?h1;~l&BKE+N>n_UCnm)Rcbh2wk8ut4e7i=k%<<9e zI}RWC88&2y5Zo6g){77<+G`1u7yH7Ek4T1(MuLUZ!;FFjhKn=+h6pRr<3RXOpLR1W z;fn2nd?<_e(%7}~Yr;3arZ>p7 z=Tln)?Hv(=O20vN)A!+O*SC_WRb_>yUr0BrZ!&`)u5e5y4Y{-~Ge4kbi{CyEPv+|< z66&_KVp}ehTi&y`Os$fI&rI+W7H3}h-ronl{rw$BMV2tSIl#HzT@`|Mqc!nqrg%G} zaBl-s1mU#xh_+K4xV<$aH$->V9{A4O0+@FPKiAxK`{OqEp=BS_9Pni8LfTiE4gS4m zU;QVC^#$Q!omii&a_)TkG2~=iMO5<~+vuqUO_F?-fPPxMz3%jlIzbUVN@@;6AxTgC zk~oDhl5fVAK4JhBadKMK|hUvLj+RB`46xG2dgWd)6={ z$i15GevN-#i2+;F???hN6o4_Ij1dRnKnt`F72RP8v2XpYAg1qc$FVKWQzgRsF8xlqJnbqu&B6}%OnkmP$QYIaS_Sum1rA>4B&hDedUbZ;#RnI zlj3C22G6o98;&rh@=ThV6J3Bpv--1)In<5?t&s5>^w^6iw3X$+FSKA$1R!d^2W9vT zpT$4-e}9>M(wyLytcF5dsQ~#k)CL#SZ$5o-%x@mZ9zAuxDH2A%9^JUnhe(yMF)0;P zSz1Da@m8{>^CV@!`(0mPwfDUlrt4qBwGwf)At*oKV!qeaerf0ULrUFTqo!V&HK*i; zkN2M@UEAx!h0l z-8J|!|GOs35uDZ_$S&eBb@yG{zuRl0=`Hm&2kWd&&3z3R&}E5nr!}8 z3;qP}N1N$9jt!!!XH1*cBRK+9BE97us!V&fiF79nj^$=5fZkmPoWW0s%r$=G{C+># z;*7o?=fZp}wuEn9uZUE7vjR_v1v6}@?@diEf?EjXT5UKG=sNU0JFRd>ho=ed9NBchdCd%V*T0UFS=Gn zB-wVIAbsW=<$Sr$5J8G|x`TIa#1>!4uriG=V~S+nU%3Y&B=az~;EH_~ql&!)9ylFI 
z9y!D@#9%c(lZexP#~@;S#Gmqi;zmK}F#~1mg#nc^B(r3j%v)2JByysVVv)25)w4rF zoM&ZAYE|byVRtPMTd=Y}ZAdmir-Yy0u9hO)8*LH#DQfZaQ_SjTP3tysXpMs$4=z$m z{bKFLp`Fo*K`3~%()7j+6K@v1CW4Eeww%AO>UDhKT7+4=AYb<#;Oj$k;K#w5?ZKpP zZ=+eRgV>l<1|w0N9{_t@50sT{$BbG|BQ%7SaLvBSE!q=)Yc674zW$UcT<^ujswSc^bX}Jq;m+g(M%a%<(uN?yKu6j@hOig5=8{v+VPWImHVH)-XX`##dq9o^eI6&J_!Gk3gKTI!K7dPwxVKjSjigLgVE7~PX=#MOn{)D*lH0bus#K36M^E_4qvne}{+4-4Wo~1TOL4eeogR6#cEica2*N$*k zLlJyUEOvlpg%f2G4c+rE7!n~aED0rY1EewbB}W^k`cr&7pEvv<5xlL7)UrhZgK#Zs zzsw;sMgth9ZY`LjNI%B-u%WzT9w$1FZ?stw&4mL>Y)&0&VpAi<`MGqhWCU$q+Ia_C z1xjh@l)3C8=uzw>OBj+d+2c~=24)r!)B{GJAa)GcL*-VFUeeWvB5u*6~+mwbjGfE#yof>qU9qzCgKEG!}ZlNjiRyY@_wsOa+LWqZw5)8jb z14NliLD0gTDlt#}4Cw_a^O{^!J{UJvK2Rh`Ce4Z)-*4${$AHzAT#vw=!MY(tQ~b}E z1ouO>6AD5$-DY+!NbuY5!BTDIwfGK&ZgfR<33y>f^Pc=>q_TtZbAta?{QYCXcu<3Zcebw?lrZ5gx-;QAk)-PMA=!?2rRjL_lR7M*5p570; z`5vA(B0nL7(t>+G;hZ(_$i{fA8+g z7dY?$K4@7_g_FghV|<-4U0975qbFpCWn}Mu_9WbLXxTG78+||=@6&m4-kkx89PMq4 zn>e`XH@*$z3mG=j{_59xI`fa>INarZ8v+aT#WOuiR+fHTe}bw=%=Ta^)1Yng$rv}W zTxN_!|B|mK9_<%;>&;2Lq0x-*d>S^x7pbkolRIUU3Q&S>Svu@zCG z-;<#^hQA|XPw7AzO}5QRj1TwMLohc>4KF4_Yz#f%iV1ONIJ%P79a_8~yBITci1)?1pVS_fl`VhL<`OZfqz2?KX&#cf^$fm7lW;lRw7qa2!^~Y86uxu4s~u-b|rYA z3@$FG4F1PBTpWhxcncRbGDi>hmi61r5yzX-ckuY`#}W3LqvMUgNWg+yCra?TzKlhy-YY}c&P zuP{nP@1m1?6G6=`M~3J3v$-6dLn?MGq|IE>kZoO8{=F6*syae%LWr$l&ebPmCgpT5 zl;cSzNh}E|_$KZyVfs}PKP#eDnYgiUJ$2M396;V=Runqq5qI9#;a!NKoLHM%#+h|mDLc+vxMZU%viz?kjhB`FkY-S$rqHkR$2nU7 zFD4*Sedm|F)$ezPPCstg&Cw1h5^ME66>Xb#1iEs)GI#5i^xWlF_jptcwXbfLG`mxz z{?%HOOwGXt(c=V>Tt73LkP)^Z%CaNqdZnDnN3C`B$19V-8(xlg{bGXB%$Hf8(j}|B z+08XawXRw5Pdb$wADHp2(O1O6nAvE*$UAGU$);-S)0gJAWh-FBM2H!k?V($@uf5y5dCUsv4fI0 zY4~ph?^%CEiq=-T4P?;zzk|Zg-N`FNW#n%3TceZX75fTBOxg1v0)4KM^YnWQ(9CygsZx?Ob5)d zup6XpY{AY>3- zHVvP+;?HqXFp%=1RY#06MZCUr*m<+~@a?uszD{+6SCjY`FhEU~0bRvOu2qkoHaNeg z`Na?0IZLiY^|6Nvke-o%aPieBrmGqIA7RtSS@+rij0Kxa!>Vc4UFT%}FLZiXDS7ZG z$29%yb)XJK8h#R(pC3Ofh?*D9I;{o0DN%gOqF!OyLEHaReC2B$7g1L?JmhAM9i&6A 
z!k7Y@UEXElz(D-j!rihCIoAEL3LPa>)Xe;AehYs%fFpOqv`kNU<8#D0C2&tCP3r1a4K#r<~>izIJ>DQ z=z(;roKG(KYMj9^3cchEWWk??dFFINe;j}D9REL>t}&_-{_8f`wrjF&V`{QBxhC7L znW=8JYqD+IwmI=;oA2%UulHN6bwAYa9`3WxKHxZD%a+M!j)ya5fk|CL&or4nR|Bn$ zRT>)Q+JENWFJZvCL1<*JHcsYz$(bd`|4>0SsuRaw796XAfpY+QhVuCL)mFlIp9joB z@tFbpkpi&a_A0mEoLHm!JT2g%)``NL)HnTcMq8-qp`l6~CUqH}V}Z|qCDO=odGEm# zElVy97>~xTZixKDKAPSX1(GyIK@6CyXIcBDn6J&w%^ChHzO2RnWQ%fX2A-!@^n%{u z0nB;~3dix4+^K0RNMT|lT$cqMNnp}k)Tp5ngtUtg$2Re)ZEO-Vd722uHN{l}384}h z+!can!o4aT(&lyd;4{rSq@{InypkFN%i)JuwdpVm7N;4;ryT=+UK%Md6Uld)OW$ZJC<2#0Tmo{60y@{*;=K?qa zA(o65tv~wTzdj(VEhf-U4N&=VK^I_B>-n$>>9jX9ffxZkIRSZ-!X#TvKcK;yT@Hdy zCXyWNio5VY!vr+MK9=m0fmsY>98Dg=>uTwmbt?rcOPyj=xj#Iw@rAenunICjH+D?7 zPN&~k@N{hqB^5XNgN9|=oT?zP$md?;@13(C+45z;Q&j*<>rr& z;65^X3bz6h?KNB@k~0!T9L_4kxtn2Jxuz4?adJGqN_1--&VJ*T1C7^T?pBmOmy2Z= zhEKIvLe3EB_ZNRey`K?=2oowAH^94aoBv$Af;cuFmggs~HfaAgVKz8+m}oP0rAJtR z7cx;JdJ4qLHBK!wV>u$+Fj_o8XpDV+zSqBl4uC zl3Ig~mc;PmCcc9Oh|;dAlqhJAEN4!NFsFg1dkB;^l6^vjcEe-LYE9|TD0qROX8bH* zks~-8;{+5{hccZY^`A_+m^u%9K#TcPd<}ADOCVt?Ja;(=FrPXXS}I+KFV~c1&;+ub zO5K47Ox@hF$>3mS>#Rs^=kMXjw&L!4H;SFz*CZMm^4ylsE6e#)gGAH0gE2^t40eq_ zg>@f*W0$>c(MID&Ur)&M51X_NUY~jhP%Xni8O!j~NNc=Y|2bLjXV6#mTZe-ZuEJjr z!a)-D%D%Pi&p*BLkA4p{rry?7^NTS^;QBsgONl8Z(f$dn#2JV?MA20sfvOkWSQZ}& z-(Rt4^s+K=5~K42U!@PvyRiQ&!8Bp-ZvjU2MM@qX=^Edq;m)M|wUK5a{ z)x2skd9iS9f?z4%lYqr3?E=8iC`9ER0I9{@bYG`u={=VXStx)aB5{WfYSk|Is07<&Ua>idMR7xn!?lD4Y6a8?Qb|9@D8f;&=x=^kvl zLe5x92{VCJpgvc%dLXCQ3a$uW9~YNxBAK*)7D3YdyHhxq`}4i&=e%;c+CpzB z7-jRR*{bz>^52aw6_$i}SwHeo#TKli-;4%Yo8@4n}vN~lZx*p4ETiu->wFy$n%)ZsDm*g{ybMM#GddtD(ay9sis zOtbh`C*oe8$aSE+t@0Q8Xvs#mS6*PHgU)kNrh^f<^KU+M9_)~$mjY5ZaRJrJa(`wY z?rGy0P}djKalh5){_a%``crF`{Mue7t8iS#J;_t1hbl1mE_hu#(V&=^3}Tv_Rc|k^ zEBl^t3!MBhC3Nkad8%_8l|(7_X*TH6uR~-KUHBQ&RE`>T3vw%%zJsNIzC5wuj~MB} z9Lu|`cRRc9*G{Ubh|$HfXnP1y^^Hw8M}&2ZbUHb?-g*Dom}!3U(;H$CM_|2DD!L33 z^8Fx(!=8gnu80VFl@fp27E^iWYzb$32<#6ASS7a>K4ELn;H_~ALO~)TACa$2c?!~I1_F(Y zq&8DzaxTHjVXH~^DXuiQ2*vR$@jBEGy;Pku7f=I%!FqeRFnf9VXGRN?wJa*vD7&G9 
z2nzV1VxE#sWxs%d3|KrlEB@>Vx3fS~hjMZun9oVr{j#?qOhYm2W9S|m2&_-JSrl*H z&$O<-Q*5*mDH~1j5JVkM`#yn~cXb6MS+3b3)JF93Eh>_UdYS-pI==CA^sr^LGGkG@f7l8tf z%)&`K;UL21O9;kA6k`yBa6Ts1h7*@g8a910DIeMb)M?#*9p*+_EK=;c$(vz6?*V#%)Hp@tv~5gSNYv&Aza%4FQA=k=+M7_QNxkuK_D ztY5#-Qi>Z#;K1e?z~6HgLT@HR&&?`a6Eu|T{nt8YIaifSiXuoA=eX8dYUWS0##f2u zLJQxkq_M|PCgRY*nLH`>xQWo<)yhCrjwXt1?JZ5dbjcrlXWq(Xnrtl@>d`B%<0q%D zKwXep%Hov#3T7DJ4#zB9&BBI_y#%XMphZl=pOS9*@Zh9;%E0dIe?JhE=_76XFi^=) zh3UjR=VVrqWUtE5A_;&hGVlRPb}nn?Kd-`ZzP7Ks@<+x1GriD)+CQof_|Iwu8=p$J zrTp^bLX$ElmhB()K?FPc&TE3;Un|i<(eYDHUC$iF8UF?(3wlqDXFw!!Um5~b6;vyP z>cDM64pgNcmZI_{SiNw`;8;yTCBNUR_D|PvnHzjY0b^iEAFSHfP3(#xH%Ozlb@JZ7E>PlYA$2@FNLh;{zIg&o6&rOF-tgU#>kC*} z$Gq;1WvE7qL4zq{*4;OBDpdHPqhp@gd6OENg6>_Eab&e`g2VgQmCjK5Pfl0pKF{00 zWyfx}N?<6~TR#5vwY22|3q5QCev-Ye0%%isOv>)5?W{f*U2>Uj4BeVl6pIWD@gy}y z!oaME3N;hXFT(TaY}adsg#`T1Z`YqmQ3deaBR5(aPMQXMuI)|x=6_G5s|v;f`^Z26 zCh&xZs^S|cxyeqMf%I3E81OX$6UpPQAbVZ0Gcl1Mj%=Vkt&vr~LXIR!0Q9TGW)hVZ zf9Iwff7pbRCp%#PYoFEC!hU>XZb$@{Bd(QWS^W$KR8ar>7OhwKHy&>WAI)!_NZ#~Y z(w9CPgl;IN@#VZEL4WSawm!K-m>jOisI+?ulJ~Ty~}-4&)6VN{^`)c zPClrU`%a5+?qk_;|MyAaSAp^kM*8ce6QdvXHpse-#fwfgB!5?fhC(ah zTPaZi)dNm8Mud!xVWDU&9Gx@?jP>zzc;in@g!LaT2ncT+V-TZ#&0scUboMCLos<%! 
zfdTlxhXY<{LTU4J?j6PCa()X!kizQirT49!zhkJ<5qg~;J%O~Wz`Osr3lr1$YZ@=+ zO(kQsG;g<0?Dzy*BEZ69G+jts{!HIuLd$&-(dg*Lj+O4EGHRf``0B$J@&I3Ep!JsE zPUh%XD}W~fD_Wz3iK0CP<~=z6lqId@+=VwA7?-_s^xGpe3>`F8qTcZlwUNrR#MklS z__~q#tutGkIW2Y+gt$@|I|hO?O|#HQQl(2WWdYs4V$SBD#ep6HMD%XuZPiZ@!(aEI@$+37UlxQ{zPj;NjB+JtUdFFom z8zGvFC*3is%qcFfPd;Pg6-X+GjyPZ-%P({w3wn*;XZy9O8U)cn(d~ZJJ#0GG>Mf)m zHYvI`i^9RdAp`~vi&CIb{APoP{0>RL(pb~8vK%pF??4E|n~L!F8y6V#I4~0Ks|$@2 z$@UiI%?XG>C5Nx3h!fF1lxZz#E1OIczSlRpa4sz?Efe2ZJ8A1$({r5^;@4bS-Fm;* z8T+Ll=H8dVcZXV{d;fWGY% z#PzGc7u%Km7up>1MXKA0)FgE>oI1P=*yQ`PQ#|MwPvP#{5p{~GGz7s{!CAhHnb#3t zuSmAuvaS}=yFxGC4y7IkgrC2@Hu*nOzmDUX|0@SA*C;D`uTDSt?l!JD^dxHTtcNr8 zR=6LwZa*=5A-~VPyhBd$Kd;cwAP$i~zM|%Y>HGD{vT!y4+lDqf>NetK)j`x!#;U=K zwe&@_bCP%nLC13yCERn?$cL0r zQ3YQbvWPfKR_(uS>I_gRXB%I@>_TmLK!+AR&RXwxt^BEX^d|P#1Z(RuOj4^0yBj+; zmJncwfrZV^hLMHwrn9`>4>uZ10Z2Y@={of!K0f$g6P%HepJmD+JWs9|8x$t>{bi_7 zL1DlaZN3Revx3u%FBnI56}y3p;nle@C%Za#vRFC2K*dw|>v^w_($T7Ll+c&lSjera zs`{p;?rQ{P8GgHdY!rL!UJ6gZW!pVI?jd%uF9Q1|{b3_w@|^c{vw=XO`&A4F0U_Gh z%L|@;ZZ0J=ZSr8$m=p|Q0}6EZhuu*YjD?;5Ph|Syxkz~*Ysn=MaU50Vlpdd zR&X5UEc5A;w*{bl#K`~@80b{rV9iYmrVa1KPA7S?C^4D}-f1ijPM7K9G{NPRt%rFBBLiHRKeFLQHqhiX`*s7mUI<9%tcu6lWu z)(kFfhj>+tBA}Z~Msv{Pjf`qUAbYPlci2$pMv}W}#~})OLs_=RvZ||HUO*?`hXas= zZN0^Bb*KBCkB8R5$Ov2{SA3|9kAcUoANxypDz{8e9Wi* zCl34&w0nF_zU20Q-TKe>_(4j;7jM&m%S{wtSQruyQhncbM~`FB$%1Ln(0mt#7ZO0| zK}x(*1L0mYwek01GrY{M9nIin(!I7FMc@$Z^`7LNZu8yRe()C32KPUYsGZ)M+LeU^ zARAh>#&0Ew|9vjLj-*Jo-xyaVjzf zIrUgn?B0d=2C0}1iNpkS=#NOS4;FxzD)rLz53}Z7urd;ei^a9)pt( z{W*R>3N#rhs*zXg796J)H+-C9IO(&UdJut;?4Mf7fYo_m06zcDY!JJSt}n49!{XmO zw4?IsXCFVmFF3vj*EzG5IJ%D8oR4o^ueLU;?Ins~WC=_Vh|c^?PJIGV?ugdvWEA4M zgG7#*>NzsciB7C3`qvy3GJ~BhLcfhBso9$uTfln9RoO|3iV7#*1cz9fXx_fbD=Hf8 z79t%oIJZyk58mEl7Cvm@+&JH)WEsS$3UHzw8~~+8txM;6ZcjPP%*}mn;Jw!|-FOJ2 zu=>unp3b{Dyv2*jNl{{*rh8y^+~5CcUfy&)vwP1UIKh4~f4@EA*)5O1szJ$&R`h?Z zYu+EM0y&eE|PwI9^|4YrTKRBJYp4Mu4+YYB!AO)u-KgcZp4;7!Cj}Jspu=qAUHL?4i^$PiM zojMhfuvC}%;?jN}S+qmcb;osDw{?J3dKK8+hs8^XJQSz&a2ye3BMv*_4T+e%v>dPm 
zs7SWFGl~@}g9!s1j^}iQb=WSy2Kk%6vk~p=jcSblWiuxpxdJ<2P{kv+lh)1m42tRJ zkyCU^msnQ{J^V&9AM-SQ?k&P9?$x&69{v*5=QWt*%w!d!3+*MrOlA8{_rBPddsOR5 zb)DFN#}~KO8g0z$70))I&Hs=>j58Cly}1yNuqRR+(xR1(1%BLGbTjSYmTUngaVRIx zdFTV4;7`;$uf3PoX;qySO9we_m+{wwm^UyWGM&rVt&hR&BCW5t7yOtnYFDfZ5R~LQ z{OUd6m-6n%-sGMV1q}Njbopr_KYHbnl@AYR_hRP%6HDW{G6G4t(>j z{e?*Ha98^yL32=;^}^)8y58HmLJZ#jW(^fi5G=LI$PV6)b8Nn!*blDx zzfE{tzGs1s#_LDQ3VU-_w!9*MJlbx?+~7GZ?`lripGyC36~h5!!<8zLMBzrjD81zx zUtq2!vG=ej&vgl)N+nVQnUL$W7)JoX|8nVK@X9;I0my03gH`3(R|5Jhb!F!*-)rBN zFRH=Ebp=G0_fshIKuMM0m!iL(=*av#S7l17paRL^bfnnQaS{L~=U#}vRDJ_XXCEU7 zSqKh>G&CvKsIPf0@Dp9Sc_0S4bX43_K#yQjfPxJ1CfetbT?kv^7+ow#TCYS-1ZBt3 z&kQ0U;U?n3*-`PEHrL}=ikVT)2|)7YpRB+@;d&kVb)G>O_vC1wndalEqaw11*P zCgg&HtOnpEi<`N>!-8?yWDJ}JuY_VZB@~y^Ra|g?o`&)>GWyq=!YU{jghXJ*+K|HS z4d{#Q5oV0KgX5BcwwVk@&AoPuy`;81c7_v7K(s3pY61^XUH~4~P=aKPcd~GlFCWQuCnjR;v6*OgW0zpW(cdcR1w^QwH(5d8`4IRlX~4?mUUk# zC_8d?1yl#VfuzDxhBtDlbl!&h}NVQgg=XlqXVT zahwx|z|eBpu7)Vd>r8;wR!aXws{YN9WMXn~F=CriJ46+cRmVJ7%bkO zZBtGp22v!`XkT|2I@yfVV%KQR>CqDaHQ5@yUGv_!h`=COXD8l-f}bezN=pUx|FQAi zpF)Lx8i)qW!xsN?{1};c=>cL1eLG*R02W*-AHgY;0najsn27rO~$sp|vps|{J7DTjpn%6*!|kN+^Py= zPUkrTJvi+u;Vu0IGVpM=AK!0F$3Kh??wVgVOdXrTs=8eZ!sAxF~|v zoGe0+#Rkn(=Q?#pAXUcN2KVbpiQpu=*zG?R4{Dhsx|MTIv2+GR4E!phcnIJ$QPj*f zz3vd7=uKH0Z7zLBREk(a^FlBmx2-OuMUwx&6M{H2SDJw=45pDcV7*5vp-Gj*ygsfrC{!yc2}lu@Y8$tqC71q z5o%?jGG!bmmGPE_Jq;xho|1K*q7sC-vIwG)5t=-*wF>90GoSbOgPUDT86NXQ) zW+y)L&=91W0OnlC2cdEO79FsU4PJ&l!U#xB!B~&q4_|ziYz)xmvB?xhEE4;X{3*{X;jFv3V)dOFMyeGIuea2;{b5!CkqUN1k>l){w%Ein* zAv=$Gv`k&V(4_q3J?cg5@V3DSkJCW_U25%H{`zi*ulxbsPg?Y>sm;JzOtLl2*>S5C zRk{L}*UYczfl8Bl;k6GLB3Tsm(WxLiLHvw6vVo`~uJ*B*3^p~R*n5qVY@@sTV!p&_ z$Ij}6mp6;Bqg~yJTYs5l~Li9N)}hU*qQX8P&u{ zE?UcOcH}r#)L6*DEz8QVkEvtJx%JDq zsFzqbzG@$<*&1l7wUgiI$~q0<_rQFn0>bd!cW=P5mhe3HB2iT0pi-9P!ya4g;T`ra zH~C^6HO_xe9@1Zhv}=?<2N#S0$T^|8F|-v_075w)W|O{V@3Yk%isbwwCdlLv8?zQq zX$<-K7(?tGR?`%CBQt1tr}rrX78q->LJkYo^E zs9Gc7D?|cJG>q_5aLmDXt>1F5v!Hv|5#stp{}_iIa?&+%UOfv 
zl!C2^h@}JH{Wxk$F2k99Wo>`UCkpELH6&!)6k5$HA49=ivdX7Kj5?P_<*pLKV&8(nbR&X+^!nO+45 z|2R(UbN|~05R2YWd{HYl+BCiAo*IfFI3O&A7X?fT(XSAgEKQ=&(%-zQ!2h^z4Xw=p zA}NwMZlx3`JOr$-Df{TB^&;q&-Iey{g6zAOa??2?s^{(KzUA}zp^b1a(4zToW7La7 z`)WE_$IY+)W${^HS?%Crb(|ZUOvI*~|7sA~6-PArc9)*Q$B|7sY-170H z;9PxCJ{bv;KA;A3;ZvuYwcI$ZC4ipA315@8BdVavkOVz`(ElF4va>iE{jXqhAgYR- zvY(;l@eR3FZis3B0jc%kEq9CrFs@`uR?_R8DNL(g=t@6EMoW>YTou(3ISo1`@m9r+ zSHJ7DP80O18xDxy+;hSagnd0vItIZf@H^URIO3&;7$a@b<$~lgD|u_qB?MkW4hO>Y zB6wtiJ2FnJbl2Ey{&IREiu9LyhWr-FF4VdHnqH;g<=C>!G9JEpjN?^4^+xd}x%`2{1x|`g|HU9QSAr`OCiNVvYoYO@pJdbD@0ZkH zjU-8qumA$oF9~dUqRz7)jDT0CXu>zc7W+Qa-~;y2T>`JnHACcxT5jBZ&YShKmD#`i z?%UT>dK*n{QB<9dV-=6@MDAuwr@wT|t_;t4xB6mkx>mMj;&?UBr$b0coClIjl`iMq z;1lkKW1aF}X>3?*>vCyVyurt8J*tXoQDhR+h?CM5iaPCA9~KDdAs*x|93rAh8Y%<& zYBUb5^IOQus@=kzh$f*I-SYN~S>JAhGMvdapQE@3Oc^LG-knlEEF@OhOTxa{`=)1v?0sWBst@W~cAd#(}@jj&6Ox2AVs~MA7007NGHv zbOI!XZ1E3PU`n+C(AXVEpvMPQGK|${Ia1Jtyq7i6+CgbNgeL@R#9khTX@5w7nYvVH zeS!2kQ<=J;Pxi6$J$p6B^~DaOgsht9-2T|h!~hN%8O6*wtHdF}#PiI;7m%DLLD-QI zy^poKa%}yWikghFi-LL*yFFI8(k^d$Jh8>(gTr#X?0WEwZw4y36_{xIy>%y9!%V5|>Gt$^ zOB=}VPjeh%!%g0L?c$1r%`O00bGM%4La5rNlfly$i5mavAqHVOmcnm*vjNx~=!GG0|-nF8`F2!&6 zG5K(LX1^Y6PJGAFp@rW~)vs>(J}TH|fpA=`Bp#k*Vh4l->KvhylAO!+q9!Tq<4VqB_67yx#w1Yc24wu5jDaA5=6kYNJI`rK#755vXL#1WDtN zMHpu52`fH{EfWD)?Mjm+Kjih!IfjNHJ;h z<+Ll#HHr2{^E-3j61sLS2sAI*@{6=zWLbAVGLjPb;{Wdb;Tl>14uaL#UKhPLLluf3 ze)h~vXC87Xu=kY7 zMhRsHpgfqXLLFdAxI)69vlp1dauEsblOJz3^6-ReCa@9s5(B^wK>EC4CsCMi*AwgM3CNoab3R~Lg zSaRvzl+|};amJrhs|{60O~EP9c7zJx>lFq6OG8Gmpj=bWtoK<1kbeG%pi70-=izkp z|5aCj7wQw^?qTV<7^&BXWhD2x`pN0SUew3e%t?fe{W7j!$B=%T9Wh>js(q8% ze{wk{8`-Zil@)2(jK9`Zze>*ojTyg`3UL!_$FZVCJnJU(<+2UK)1F%Bfrad=tEyyC z?3S$`+1D?^e{GH`xQfe1Dj$VgjF@XRAB=HHXF@*KkDT&5o~=dyy8St^z#)2hjm@Gr z$zWReX792Mx&sMl5@bsn-rr%=+;RWdweO!B5va=kMwm0AXkXTJ=%jyNr;$-aQ~UG< z-o@_qTzlK9shm?5fS_BW#~#C{0kJx zvTSMzw@Tm$_q6WffKvG5urGS2G`tGJaPgN0Y#g6pfF$)l?nos`0T}j;P?5hj$NYL5 zoH&UBILjWDCVY-l%WRtA)*{l5VhxZoB!t+&d~}Kq*dej$kApHR8uku*a%#rU4s$z2 
z!UYE#y70i6>GDR0=GR9d-kdujD?OmFk@HFdXnSDlfV&u(HQVLeFWHIZ$Y1P z)#QeHdk;eY!}5WH=jIo%C4EN-zw3CwzON7og77nXF93xteuaAksLj+t z*Pf}Gi9G$JHpwiMV2uKVj#o^7cLSti@!7Iniy3pGXz8L39eo36#S{f z9Po&c!QlRoPd9}!nuyiaoty40f&vT2&$Tsuwa5GxbC6Ls#mwU_aQ6fX>BLeU|58o% zd$er54b9x3ssCP$)?6<;ZA!KXP|E*qW~$xJk87bvC?OUcWq ze!BHFU3nf7-Yam-gYVHR_9Of5IIYc>bIEC~#Q@(GxNTN80+O8xYI&7|S<2*cxB|m) zgLEa0_9k>WHfNRw1#OHNeZXyNOg-d8+v$b}v0BI2p$%n)VvTts&Hd}C%hUFsH^Lk& z;@^IE|9sCJ7?3`DQ3Iu$0xb8CkOHMFb4R2f>N^aEWH$^sx2w5)1|hBsQzpTjQ5-Hx zqw2>g^aRhePVCyq2uS&hWNn(IQ_hNHGtFLy)N2lBSlk>h?vQf1ILXS0AhCK~t#y|T z#%AF8%a>wh8yrcuQO7i%0qICXY}!=LBy#TfG~2wLPVA($d$TW=2&_v4S(K_~!w3AP zlh7@M7~G-N#qjcL6T7j&>o+T)|GU=lyh zcuriIV6|}GnM_Kihnd3ARFJ|4%c797+g-VNo9wOEGKPbkLj<74baUrMLZx3u8R@X0 zqN}Q=Av2T)NZoxyrLnt>+t3{LbVsjbJ2>#`qCkqR43Uc< zC*(!Ty^{RSm}PoZ`;?=YK5m;zB}{32oT4XhEKqVK{~f*@B^+Fc-R5}&YWW4=SZ4u+ zsWLP>9cJ4CvKN#F)*9SN9`9ZWrmy%1%zXDy9;ak5j4jQrl~*f@g;2JM8(rOeVxPRh;uL&p{WnG^Q@2RJZu`LYHZKtsmO49L0PvXz2=E6 z+z(ZZ?{9lbS(IAx(yo=USa(`2zdY8se5v2-G1Q-@#Zh+C#)kMAyhg2~w&>e+Gg%LE zme#s%1btpkK7u2vf_dA=>;p#&2NU40g(vb!A-WEk;;`gK-W8{tYKo2BLl+dx-os(; zA{3TtUHvSBQoS{&#E!a)Q!P&MXg9fCA;N9PF}YpGC3`wEf2i|3>^U&Nb@sZJ(<9z2 zWB|Zqy2Mo3H$hdxp!6#xcEwX-nT4&gu@cU=<`fPMyh+Oie0EBS-6$vo`MUCo?JuV) zf1sFBopF;00qf~wplK?8#sj&>fwE#Bnxfy1mS;q`qiskjJkOmgbyVWeqM|-Hm+H^X zl_1htC|vH4)UsaP3BBj9rcdz`bl#b^H~3&^R`Y{_h2Ins`jsQ+Q2$Lqhw+YcYmfJm z{METOQIy7~OB7b>QA6d!dD1L1LgpU-FYhdi|4TnX9$M||3qD&Z2B0P(?N0RnSH}-z zUtlAl=pBP50CCu6nu}Vxo*xLNSDnZ z4m5_95E-~|J-GIh@=IZJ4mJ){M|1U|!X+l4s#ww7X7iYmI;#;C3KQE^Ve;CBzt$I} zeBpAl9$ocsUD)Hw0ofe?KXRO*Rw!jl8t!rJgu&miwc2_=`fUR}D~%+m(Y~k7uF4qG zV0}X&5a&GVScblF82i?hGUNK)V*l6-Yf5THj?_Bgha~IIAitB7rtK*I7oowPeosej za{agGD{Nfh=N`T0{cr;SGDXQW6w9D_j8S!Xo!q}#*kwKHk0P}Ifz0M)NPyyQL~X8K?#bu&pLNlxua(A+LuM+3@F#@ok(1O(R)DM?)1 z-rmy9_it-;In=CVMjG{Esh@x*FiPIMcFFvNAkC*Q{@7nBGf9fa#ByPSGQ7<-m|92h z=#W+b4JdMW2Y|Ew@Gw|3H5>9t-sW+zebSc6Bd&1L9mYJB!!?|PTO!Jp-ySm>lko<& zcHneMlBph80hRjk|6{4a+FF^+))6!rnO;U3+S(Y}}#r8h}6oCi!0ue0e3 
zGZ)EK7CLx{73#v7QN%d00&mfYjW|qPw--aS^Xw*fqUAEZVA}YtT8;*9EwExm)NLq8#tVM=s;vGe)e2ox4LwS0=gGgkYP%CblF*RLc+G!>vorhDH@fCPUQ~r!m={?EG>5kLGe%P979|+;8tFLt`gkN&` z2Bbg$tp)VNpJ`ALH1X9H);+P3^~CbNDA%!f=_;+A+5)T)&3rxw6MM| zz|{F~ba6d+U}i{&1V;EgyXHEDBEmYwz;PQ0LdX?}sJV0{pJE3?0g}B&sROE1hHO={ zY336o0io~*P_nMkn`HvL6d6sbeb^0N122}{@P zt|69Xnek+4Yv-^KtY1^kL7+Anv`jvn1rJ$U>RztAaCO7t06~H zo&RWFLS@6Q?YYZGeDpkUst~^gT|sqb>Tl+GJ5@~spgtH1+~G;>&?@@RYI%Yfd*tGl zF#9v?NbujgN@8UE&2;D#NVJ~v;dVM)Vu7W2=G$k=2SdcqzpmK_La!CYtDD$F!{!xb z0!t0MUu5!8Fq}|iU)RCbhAVQ_2RCnO+;}vwPTYe|v>r$sh{H};N>@oswOMJjVi_0X zm4lo1)qO-cG5;Nqos6>7Nj-X%Vi5dXB!D5{P)pE+0INaGDVZ!NzyA(PcA!?KiwFBf zQ_qL7QMi_9_um3Ns<;cI<8w+*@+XCc@<$b0Zy^VIEghS_E*Ru2uTd;qc6NBfY#qu_ zaYIhnX&f_-u{N2!(w8JODN9_6in!HB4W7jGcD5pVj|BFmx0rAbjH9#%8nK(h&b4WFPdUM8&csJXVnaO+4gw2Yx?&-)~I> zE>?@0ddQFRezVGef>fdh(BxuiK;>^SKqHML%Z=74+@T_KP!Q9jRgV{3lg&oh2hA`P zuTr0X#oW|A00JFHK-|%+=W*&?T18GSu6H7SxkU|3a^xOddsF|?PrvSQ_U%1NN!f6{xiV#OH*pu+#ZDGf8G!QxwQR!D7=^qTZ{)Vx$%bZd*+9)+E=0UFKO zH`M;P5jt&E%lTqhsPED-8{FYgZ<})A5HFHxfqXrTUtzv*hjlj_G!_!q|WKM`Kqt0*$rIL2RP5jy z{U0zly0bFnKL{eV#p9@dhOu(wRURU`ElP4#6qnNBfE!f5=!ZLTrf-(}fbc%sm0({t zFeV_7R_e3v-i%%#f;jOOL0X$)@D!Ii*k2#T&o?n`lfHpE~7Vdz%0?IZ3x!(oyY%2L+g@ zco>&lzBXd8c{Qn=hz#S#Jf)}*^lPuj1Q&m4I9EZ^u@~N-QNGWsPiu*Nw-F@EjyxLh zpWO=mGV@6=nY68aMP-AeZ>Aj1LaRicRAueLpMXQ-An|U(?3uU~Kj2ZfkSX--oCs1TE(L8J{xtC^g&f zi9QD!579Aago4yjl^L;^2y59Bf}QrONRb16QryfqcBF4Sr0S}61}!5_TcTOG57id1 zUqG2gMft2@cRqQSApY&1@HtTYvK>dzyu7{9?>eqtv-gGJ7)h^d%Tw-JXzm3Qh=@=t z!4Y(dw<=O>8tARRG$fc ztFB!weZ;R$R~-@Wmn%nFh@CfkT3s|y;N*Q1m8D>kHhN`3=6yj(>4hz0A9a_~`GaAB z_A_!Suga!Jwgqs{15$;UCwgDmI|qtYO-dW_n(%*G-D=~6llFozQQ~wko$q%~#aflj zqX7Y`Qv!~s@^7E;l1)SMU=r|08xBssr{q%uhhT9C8NMm(Q;WQLKnvYfojVv*p~O zoPtk0RM)Fa31diQ`V5&k-ROPslX20GGyI3LP1U)4tc@v7Q6NU8x#wVWP%>5H9ny-7h+fA_!hZ%x*dp?eD>D_q4M_@!*pc zI3UlagZFn_|9-#Sawqp^W|(1rSj)3oAUZoqy@XNU_mj9#HAJAnIpa_EBw$A;l z#)DU_Fa2Z`caY6Kt;I3p|8oI;W|jFn>$=qV;EqB+oV)QPLE^OVERtb!Z?M@j+hkL! 
zS6Csd`A$MtsAr+5;wSg+FHm8y`mN^gr_u?iquWdaWi|~}>Vl~XP5KzKU!f;BQCi3b zTEqX3rf-angz37CCX-}h+cqZV#J0_eZQHhO+qP}nwv*fQy!ZRxYxU}`I#v6ejjBA> zS}RuS*UR=~-A5tAQD~q}^)zT3(xC14a2Q~>-7&!PPww~#G(h=omC*`nV*xdZPz8Iq z-P8X;V%Am9P~La5hF(g|#t`H_Ta-}Sg=Q;})=X+z^VpF6>(%1sW9e-)86JTjA8h_F z>Vu&|UbSA;9xm&I3LGt&-M@y@PB-Po`M-6frbJ7>oGl4{!D5ey8U3%}5$4UJF{CA` z!x{_}g$e>fz&1&7U`+oy!|3eYT4cy>+V`T?9bxMh%rxEuA;KeHN4`kpI}(TgBh8Bw z8pKR_2x*9b`{z%vM~Elk1WgE8&3A)y4^qI2h(rS0lQxafUwj!SEEMLL$Uy& z4LtHyCHmjVlmAiQkTt|^L)1qDZpbY)#t!yXbU-87jE3S0(7+30eWb7(LDYzTn=`R? z@bq*)nucPrEG3YrB$V^@nVFZ~U7rZ;ZUh4=v$5$EX92=0?Z>qJpEgItdb?->ubyma z4uzwY(RY)hTXty%P#51RpEeh^bhre~q*X09_baWQ#bNP`xLW432W0|ICy3NTP={Br zyyF=zv{qq<%5G9@ZjVpX3Q472d6)wqo?{AJh4m{z>`#78D$H=Bg3G&;gIrFWzGLQ* zthA#x6}TU|bq1RMaJp6O;FJZD+i%6X*$}z>4C{E+!=-R>=@`}hQF1dq$#O%Y(q1#g z=Gr{9&62~$4H>I*L4xUMGKsPxb!fcvCOR}(WF30s$(dhMoh7p>`FjubGHM&-!#2C& z;uW~Sm3Rw+1C*DKRpKj${anU~+Ci2)X4M580`TP>m?y$ zbCvUh+F$(bF298A+OaQ|SqF(qwTSIwe{eq;Q2YwdAyTPQLS>rR{H6jyI=k3+f@~FDAVJjd_A_2XPDR)g;P2B4;aF~sB9CZ^illX3mvem&ncW_a+@kd zvfJW(-azC}gzdD&oxmf^YB7gVTNwIrU+t7fX|MvLN2iaSPZ49-w3TEa)AIUDXHd&I z%31Z{5Fny|$El%HjjKmDuA&HncV^jw8PARysvqm!5E_FZ*omkg{-xI7zKl(~>DD+= zS_h~8NP8OfxYy^7e~DuBN0Ih)48v?oNuMENL{T5A{UU;p&+d-33?rGGn9(1t*LN7 zXt+0;69O=(dmT4RcplfQ`7!(ZIQWlM25YV9Jt?;HU9G^;Qj~f13t^L`J6m-!^?>Lw z?PUL2%DC-Y8I&gIaFB)9U-6{_-X$Ure-|!FUuYD>BdclT8LL9DTIdN(So&P_c4}AROVb^=) zZU!E6qt3-LYnCQCi%M_rT^Fgi0TXfvKC;g_=_1}0Z{k@;LX>28UMeXz+3<>cu_%+r zdQ_(NaO1Y41qi#Wq~cn?afdrV&-Jm8zL;kEx5+wkP?$QKRyyr%-*ESt5x{h}k9d~X zva=Ds=IZcAOEIute(;--Cej#XGV0lD?QLOdH?LFZy>dl_yP3L41O$FTK=NQFRRWD4 z$75~PO{h7W={5Dzn_U@Hz_AhO1mKC-0SFD-1kwrOAf+q-FibQgLEh79qqmj{iZMu_ z0i$9VdQwFbBI!w{h;SjT;jjE&^!`M&quw+sdHDb%`@qWzX;^R_R6Ud+n_X|x6mCEpzffnEXqZS*TG(dRzpW%ZlOs~VEg)DhgsM<+}HoW(LCXl;4 z=*2wNwU$ZbJ%L&}S5m_v^0`_$rE3$MF@`4a*BPg9PP!3xJM|Ne$qMn=h zqmL2)N#{e0JM}9tJwL~r_uid9YDV+#ap5FQsK9_6xk^%>Oeda`|N)>WL? 
z=5Ws?4aNrO1Uqi1|5(^y1BVB_q;!?amVU~K{!Fhu(od3AxCkvw!#Y65HvDWLn)4w;xJNNQ zJD$UzEu=R<`dWRlc&B@_JCh>L?$8Miu$GM)EbE@TwmxGY&8BWu_2yPuT>n^5^nZ5r z>ChRMm0)y6B*>EJl2jjycKMrE@!J$Lo9Ujt#$Cp?OQPwP*By&+vpx)?DT4lx*@E=M zy%zwbNKyU$v#$$N4v;Y8Wt$ft0%}+;C&w3h_zE3ROEe-hzLe4()WSHtiza$8f&PeqqIAG$_xSHWL^KpX|)?uAZQ`l0j<62;PfM-KN+Y_7T^LCo1Rk+#v zz5V5h)vBK<`}4O!j=BW;Du47aT}o{O{(U`^QbzG#gpnaDh>i{-Cf18NqTkS0CSAwN zguq;&^^+j3SpgLZan?4}_tBS@ z$PEGTm>D3&?-K_2q^_naQJ8yKc}ZE^>vb78U$1o@82|&#GtHNjC2~{o3$~o?o!|6) z@~X|+DFfaF+|>e||7V12`Q+Tzc^#t$gq^d!0X$^!*cwlcl+AO(8-@|OTuBvkh#nbFUnm%|ce#E7rQv4rl<>1`!pfh2F(VYO#o zm{s6G0N-j?^j=c6I2*XzdP&+rtU`#Zy+8bNEVXitrn!^HZy>Y`cfI^+;X#aQ-XC&qx$@W)8f@ms6mLY`-5&SO zE8Qrcu(5YMy$r*h@X_oiKwJ+yO(e^QefM<3?O*+LWHNV?t+Fr7e;%}P;mz>D#6Ptz zqVa#fw@Y6Kps`w(KH}W(Gz}Vt*ouFb$(}ma+Y;{99n`&wt$~%9=O`S)M#!(XOigxX zlUiH3J{9%=^5rW&mlOMIm-RP8HBpbyY7B;}Lg@qEcXutLs~k~)2Bh9RpEf)6UzeHn z0B76sf#OkKE!8Rz{?4pOQ@9V<&`=1SOMh0ix&(WTR0j6|VH7++HDRgaV>@q31q3h( zybmRq#R^+EmjZqO6mw$G&r-K$aDF9%W~)5591vjSJ$;~nwxX6D2qW!T^!A;MTbTR# zX$}nPM0kJMh$gv+yN%KVaeQUdo9$3p2zvQKAP{NZ_k>zOS|FQVcC=j#?=QtiMMCp3 zHePaBb1jn032tUTIY2HtzjN*{gnQzC&Z9qhu+3-o+Wzu6Y{{1B1gTcU{I#-M^+m1} zbByOx@DQEaaO+Ln8I68uz=iab_dxN9^;{_cPcXoZL!;sK@6O1weJotwfA%_*xdp)X zDo3TaJtdKD)5>xnAhx4Kx;`@6*J2c+2wc|}xsJ~Y=iMZ%?k2)lx}RRJ#owFiD!@QC zJAZ!edEA-5 z`l~-NaNkDzsp7s{S^yKe+lOK7`lUr6pbUp0s@vTAZ?DR728NR09i^h8C7d580Kr4Z zW%NZ4e{=iN;z@XGtLwz%WVItRJV?!SSGvl>_4(DN{Yt0(bHGI`3wu*wAZ-)(0|byE zb|#eO!HedEFaH$xPwomdL^0eHv;=$m31C83T`|r4#|!?Ri3@0eFNy%Vgj|nbyV$SV zSk51t{`c-Sjfj-sZH{1@WfQ!eRkqoN?K|AC#Y}-JoljsH?{wK}c9FO(*MBsBJ!ibQBJ{<)V%xmZFqvk2Cc*Q+wV&XEVf1^5YhnVJNSO00^x+N6 zOz91z+L{@hFmg4@wqL)@kDNT@9@)b|A_i&rks%3?1x53kfH>Fop(nYRKzw4hMCJ>H zf3w8RbM8;kh2$b$Keus*u%g*;Fd}GA)DMz+w>$r;O2f22qac-8x^%LgEvB=6SS?}u ztcV{ZN3$k~jNUi7<+s#{fMYzQ%hJ&lJ>1eDPBzTwx+xUdjS+yuEf@YrEFB%A=|f^y zku3o+o89^VQ0rTDY!&%C#T!zI-1_+=pA&V3XrMkJR;A(IO-;8JtyrG0)Q~3eEo6c$LoV2abe@)^f{3y-Ky}*RiL|_yCk9 zDU6D?0}Vjh>Ac*AiR6DJyBqfZ_o9z>GwUo!vKR;gJ#TZ}*7A|_G#zJiqs56rEj~42 zF%yU%kl|KFDx4s4k1WNTnQo8zh;8>zW9S 
zm@2hjRbgWeO=U_qm4{0{5WbAFd}T3h(-K1{wFt`NjVF^rg=d(kqUHUR4o{3kW{(5D zTF!@32Ca}_KF3_&scaWw(JD+C3*^yCp_#gg6PhXk8#~mq*NXS}f7a!*kPcl5tQh)H z-C1eSr8)13JzhYMsnw$gZ%+ExZ6A%6_ZOD4$b)JVOpjnmQk~(KgTTyY8SYN%X3O^x zuAR$HwwMBd%3Qo`E%0GAz)m6ppw%5_RSQGK?8>S0!GIYaQ2hoFC-*~&+R*fCCzxRF zrfZZdDLmAmF1Ce&`*ZuP|D~Y44~w@E((`RBnHL9(MY7t&HLCaJsFHVR^LgNLhF(uE zDNLJgs#3bRkM6V2mP&alE27%-Q+mU}9=Vyi;*V;v*q{wyA6|#9=`96#;ZN;`)MN*g zmO?4e#+VOYwZ3F_&UtgDc$S0EGu1b_V_f3mB4&$>MXE0E|HEbGMqXn-76{plI8wTe;d#b zHwYL=J|migYuXROxSWu|?KAwmB4dWRIHk;8Xe&zeBA^sPri% z-QL%bb7Kf#{DwMLIYjW0O8>juhKdxb)qbSn$>i+hggHN7F4cm}d2*Bnu+HYsUbPv! zp*RkgQ25n`x%Be}eaY1VrPfKNTI|5<4NtjFlGPU|-S?c`a+s{b+!F%ZiEM)&IsAQt&*i5iqJQuBGk&7Ce)XA;aiSLGP6v)uRwxw_fkJ;5>y}n zBQxVc4?3Rj9xfVZ15}+qfSR(L8Km7eLm7?5pTnqafI-a45Ck_6D@_;`7@)E%MDPV| z73-pki;E-mrox*jEbC1%OwagUsQkrR- zl7E`tI@?zFjzI%_n=9itUC&>A>MDAKx6j|_@(8UJs9v{d+M(I5`w}XR6WqYhThBEi zn#xFcfM}h)kbb=OvqKKMkG1wM47}Hsv&ioS#Y1nj_nq%AJhZTp!Q2y=-O<6#A;9S> z2S|MggsG=(vh2T7+M1{=Gn;&7REJAuu0p}qcH-tXU^&>Q5vY>@ylQ4tEy&kPFyXt| zjwY)>cOSD=!f8LFsexKJAmREeNmT8q83K_HznG*Vr5k7+e0B;H4G zbd+p1_GTb0?WP^c)<<|XD@q8C05E>pB#-2et3ll}AVrK~snY3U4it{eu>vYKd#2QZ zeK?&XDLjN>Fh$>2kHag+85d9zNM%1S(t`U7)Z|xDH9hIr^it>dtrhuQ!epL*s-{|f z)$V@^li@s_Rj`sDc|l<%lex8+gOmD+WIyq9eTZeuQ%OMs=S9-f7~9pF7W`i~ZLD)a zpq&!Y%9YCzlNLhY7!1K^^%sVRhPoz=MYO%VCQ(r1f$%{8u^#_*qa+L&WN6PrJO4V?LW7y!x*&9- z{VQlJ3~DkdN;a`Vd_FKDWwsveYyl37p9-*Ye1RXj#=_VBc5Y)(8WF<2LPS6TGSMI0 zr7rz0_HYErCh$JT-7oAf569n1>k2m&Qf}J-kIyp}ixm(n3u>(U*GQ|%RyFwmE&1wv z-?)fG*lsKp$C``1RkYoCM{?ZDz2pdj>oy@j(mj(z@)2Ekb^MMnDfr=Bt;h7x zg+Pk*U%0b2XQK{MTgKhX_x{v}Mt>11JGLZn0Ox@XuCH8+PmBTS`+(UWHX$^L^&ku{ zz?Ei$LIn$yLkdYCNLrnSA7tLZY1ZV_qG%h4MyFs!xyVPO&FFW46`3~o>qoh_!KT@% zPm69znTgN#&1<^N$Ud$H7kgT-{lc&8Kv2AQ^vjkBa*;a-eV7N9cffM@>!K+_5*V$heb77-Jczp< zLpUvCCn~Wj%7SXJ+D0l#xz<6d?^vV*U)TCW=jJ3$9K^PLz(OMAs8k7ULdcw=oo~bIS^S0&^=_wn%TScQ-F6rgAkIc4DY=w zrz1AtO|h0XfcV*tSaW2s#0aLp?7{H7+;OYeaTHmM!NhK8N+Mh^%E)S{VAfOsj&X=Q z1K$oUn={N{k`hkDpDbe8dN5{R85%^oHyo+auh`n$c^~Pr&be(e#;2E)4mrrevmhFM 
zs*vr2zojlYe2k#B=$WfFWukVt77w3~LqG$of#%rCKn?EZLoFz@qYpkFB`zua1uU;J-)7;KG&D{yI`@;I>T4Q zQuAot2{Kg0g}=-|ERB}MO#Uk-#0%7WfxZrTT-ob-ln3~y=GvmN zNp#f=za7q2mKJa3grkZB(FG#|}|MuY8N9gj#fcA54Wq}DX@8e&|YTmMrnR^JOkG1e^2zom_% z#mL2Nf9*?zZIn*36poPd4%uWyYoaF9(##iZFt`J-`kiB@))cf1ZQm~u2?JbJ?SAn5 zMwPJ#2qYMIc@tC3AA>u@%+$nN#^#@KiQ;t@y4-X7T*4u%`8kwKmx`l$?f^ zjrnRJYI9hRcLJl}q-xLsF_9$;6i7k%Q-d5Bqs)G8zo7Us758o%_!&JAX7X_l7Jyl& z8|qE!B0?R9DZ&-h3KAIvFNwt-o8lW;@X)TTy~NWplqp*$@LEr+JpX5S1OU1A8|&sx zP@t6>J=~cchSJ@&ZuD#esu0)3vu8T>v+SBGbx;x*?{DeoRfy#SbB|D z{=1^u4z_cHDMq1*;9z<@bmbxCc88F4WUJY+T8=E5l^IxRC^&wibk5psN%5q{I7`*g zM#`&$70Jb#0@-nr)ypAVI6F~R$W@Bkh{vHMugUzMj^b3cn@Tg-0OCOBYKi_&k;O;= zxWx*Ytz~DzG73d)da|kU6Ibwq!7)@SI}ahQWjQU!Afg z{k*@|>bObyh5$TUG%K=qHvVN8X?|cM3EsB31t{R*{~TGt23!Gt=abc?V8lq70WLy; z1h>xnGvu~6NpXw&{z*ru^P!<`5nQ#5BN)jek9vLcCoq@^M)|#(Kd?l_`iaPSao`e_ z34G36Y!*a$dWNM&!*t?i0=ZLFi|HL@2?7$yA@V7SDVSXyuUy9~v1|v#d&Q~i=;cK_ zSpGbLEPRTJ%VklsxFTG~uPl*VrLxSkbTHvy{I;?9A1m|3;+O84uRyH#} z9YTofk1r!l2RCtNDR!9xEe2u9BnNiGf%2m?I!%R~;s_X|WK!~$pZ|ZGiFrdB54Ai6 zG?}e=Z;&)&gqmz`mb_uVc7!{Ngn9ucGl8Oq5RvgwVRED5FG@@$vz{e+$1b&S3>q_2 z+HgzvIXd;Ho4969WSxPtUXm?TC4s-t2-RXOD66cF^W-YN-39)OwNi*EWHSh*jRRN#TJ(I^C!-Tffv?fxt|20ByYAH1hSh& zOb?Zr7DStnLqy64gGvm+Ava+oX2+Kp6=7F48BWL`%RoVhy0OARrzq1%#3xCFq z6bjAPZ3x;$+F17ITsp>U4m7sNz%jnCaEAw*BZXC_`<%meYcf@A@Z%T3b9LV`5PCFO z(OzHgxv%n=pxP08SH!|{U%bj{mTy8PcY(GRZy5gS~c+0 z4&u)xA3~6<8&1S1B0R{?l3WuokdnfU13bYBdvl0bOj*-XK8u4<5PUxFHev>$nKE!~ zJ!%jZK{TXxLvUAek$4JlJQl;tjxc+{C5tBxR?-B06!du& zP9;I&Jf2c`i=sX4SZ**=XzIjKS#6zpZPbJtdJQ_-HHwY*(yG!=V$ZneLRuQBA|L9Z z0_6=a1BY_Etb%NC%p)uGDyX2hhF97D?%mp>mqMLapb!WV?qm9Y{en9I;G||`ZuI(} z@={f=fkI~vCYKKBbJz|VrrV13N{(FCPFoB88a`m@K$nYJIl`gQ4PFn9iiPSaiWX#e zpj>!NZjc<94`&4l`o3+V@TV!0dxRd??MYlXohnc-e{x$Cu1U{fkSZh$65Qb~jJLW| zQvw3?wWf=+9LRcvG*&bZNaGf=uxu`z+?D2eo=1bFlyb$zkCaUqg>Q13S@!;SJR>Hy z4kal^j*c=B(RxN#ZDg*tO^sZOYvE@yeGR0092eNwFJXqOA}&thTI~&dn(-nU7E3!l z#WR;o97;EW_@>YNwP(-^RoIr8wOv()mJy@K+Jtz*sxnRO5Q0S4DwDG8MIxwh;5bB9 z-$2N{!+^~nW?@0SL&Aw}wsIg$8+-f&@ 
zxncZ>Y$mGMEMrtkT%tGw8%+Gkf4$3Sa~H{t|A>YRkgnWt@B; zSmJg=U|8kzlGQ*rQr`v-IoE9%;o%i#5He(lDWm;XcSIQOwVP!Lk??U{@DEf44PUkX zn3#4HX_{oU-tsA>fcvh=IC(U?SYcqjQS)SDklMJWT&P+v9fR>1b{Xu@7r*`6#p z`+By@IF8l0DMSANb`&?FAQ6-IRAx1{q9|cSQ)}_^LkpIBMiUo>y=$5=iH89(fdm{j zGy)U-^&~Mv#7)mqMC-(Wgo+OW;R1X1lpiAh!G<1OOp%8WG?Jtk1zx>>j^m!tCF1-RY`SPMub*-*q3n+&`^9mwt zIfJM6@j)rvVF{vaav?*P4cMq2Q?e#?+n3=}_GR92sTX2DWAZW!^hwM7Zys+~i_p*z zHdUv%)<v$NOdb?C1jn1M9Ysb8fIzGa#j%wt}uiB@V19wQ@cj-e+~y)MAZ|Y8uFbt=^6p zd-QOj)X{+>J zdFHT(@U->6l{w~3)JK20B4tw%3=GtTRTy(*O=r!Lk1d;?8q~6G^I|Fw!_YE(8UM&v z7^lG%osr&EQJm8JA~vRqKb&v# zXs&y0t6cyPdxil5z!u-CPw$3_PZh&>jV$e|y3;#vX`SR&iJ&#p7Zr1^IA_C*t2aLe zX;%+@c&N18w*|6V)`hha2e5YxW7n(_Q)c}d%O>^Y9}+U3vTG-2a$C{8lJmwwfKp?S zC{sh^Lg)6)I-bX)ha1eO{{)toMoS7-j{U)^(khoEZSozWf)%%?N8}0o+p8eZ=y$OK(Cnj-C}#Q3mmV88Qcnm&y5f_K z*H>IrR5#TVr`}_J^VRk`F1Ic$`1janE1%R<*r!$Frdk!yoX0c+$KACFp&ge0LK}<% z{|K(M+T+?w5Qkuo1K7tO7i-MfSVyUg{mE<9r+>RY*TvIdR&w+VNJ)!=Fn-iDBgaa} zUYQ{T?D0HwG5FboLc<$`REp2Jr>=9d)PiUP6ee+^nytg|=?8=Xrv$*Zs-bWX;G0}1 zT-CGWYqk|!5LvmLRm=NYWtR{3M@6mit>+*s0-c3|Gv<_1Iqs|{97hiRs2$@d=@l=U z%=<~v$Az-rlb`;mAX_SeosBt?usgeHgi@i;=~GDW%`xfe>JfyrQv&@hpC zLLq(9MB|==TVSQu9`}ATYl_N`8mz?%m@;QBRC6Mxsc|mmoNSm;mz-$+=f6f7-03Q9 z`1*Tx_;xp1D>yK)R}Tl9Djd!m5CQtC;|=w^@qVMOGPtYSywc^#`c=*QfzIPKg$9sA zKY{I~Xg&np9L)Xmu?HLQ1DMFcsm%Km=0xNuC1EWjr;C*SJ|B9Q$_0&m!rqvu9Z20X;sUM^bSXi))hmdAn0Kzc~1v{?z z6|*mOJvlrzb21tDzG&V z>iqBtx$aJ`a!0@c4!h$i_KPfYG%T1kvgT?g&=9S=nrBpWBD(oeRivmNh=zB{`^3ci zJU)SBW=;w)IezE@W)|V8i71KN`x?sW5<~Q$<|qeJ3l1lK0gICi!sN~DiTHl#^Jt~v zW(Ti5K>6g+$z5j{w2{L#K^3XxjXjmZeJ3d_e-6Ag zxY_j{Yg#0kq0u&a0N3r<_YmV>*(7=G=V(Q2X0gjfwo* zL?BI;>!J1DZ{7P6I$v9W{Q|sG{dF||V(s1RSXo}XoWERti}ro$0R;d4k>!pzl>K!` zhGnYbG@)>t#*~$D2- zPSOb|(R^8c%iwiD@xJW(0|BDz_m>Ua+Wa-T9}Pabza2;bM4c1YO;5hdU2O19$uV|N z_WNq`{-6jRyPXDI>&5xYOt-ebhV>`IzkOey{RqbOTtc?j?0v7~vO(}3ow4oK0}96# z#Z5T}a_opUobc*|iCyv@p=kZ6C(Swp&l zg?nLTpu+`8rQEXF#GndbIa6LG72OJn%Wmo@q3IiJEdxO9bdhHL!(BFDAry^+)r3&- zv-l+=DR6!ttl7(#u<^Hk45ZubNgDE<0$D}!#imxK3@3Wc91DKwvTv;|sKHK^ose+I 
z%cX`SYM5jf?~U9%z0Mre9NupU)ELAjo8lqUv9?VDDT;0IuL*aSx-#%q|5Rv2i}2^t+Xomn=x!Koxt;?KIw6G^Rjw)s{ZTYHqIrJR?~ z$QBhCGASO_GlVeoe2nUdrYYue6HlA!?2R%pTuLm$p9IxXwe#OzCX5TAvH~#YY;cZ{ zG0!N=43V}?HTChxZv1{@@1|9#oD1? zzfQ09o6{#1PVar5zN}l1R1IEy05ey}9_y}m0T|!$iwk70r%Ag0@F*Tck?tLc0Qj53 zY7ab}uEY127k1X)qJ?EpE5$bMJcq@5B15jn+Y6L7?6(2Ny9WT;IbX*G43_f(-{XD> zZ+E=e0}suj^GEZhmkiM-&%4FQ07^Q`RE0_Bv*3dp^Va*fW{Q^kj;{#TGSE)5*Jpy{ z!QDT;@Z&Z+bKOmMf7qEjU|Q$i@?)P@C-D0-T4l%c`twJ}&a22nFC(K%xNHX)~u_4{iZg ztU(tiO)I2zrWV_r!b4A&Qoa%>{{oTenU(a)6mm)Vn^p4LXZito_m-VFVYMSAdW+E` z^(@q|qknnvel%bcrMRHf@*Rx7+7wg@%p9wN>A{wY>pu~K5b=q^!?M*@Q)2sUAY2pd zJ+?_#D^(C;1`D1ql};*a5^U|aE^eqH=hcvn3{vkQEh+|Fh_x<;jwiXNiMl?=3~`>I zju7eu_9mFShqUh7UHh-&gCJsTt6B+7)E@sRk%@ocGX1P{8Mu*+&9aE;a7qEx(kbKr%!CLLdB%XX30`r+r3JSJ# zfRul2t^9UbgRXUf>g3=N!h#x=BLRX>g&qNvO7Q=&=d^Ze1QU}qy16#b8cM+LSM|BJ zZbkE@^qg3sPbQLQoj|(ZpDZw3IL9Z^ZKM|)?8_}(uJh1a7#I`xDm^IM_=^XvgD)4=k>=npIHd9f$@fTPbs-{3Hxq@NV;;*GR4AJ4 zUo3YMavP9-qxzlXN0qkppOv*ixa(~VViqdsM;9SFof*a z)21_M+1QsBbjqdT3XpCt);BG{Hr>|3ru!YKUiGgP#17vf!fVGxv-q@gy4>-99wY;> z5Nt;zGNV$*?IM%$l*B^sOH}kyjUDOHENdgs0@Se6frb}ySMJ=56TQlI|Z zEVJLL>0i5MZ+xoH?nK=!_S!SQ$)9$yaQwh^ZU@u3Z=oBE=J~93nREUk)qZb#RzA-D z^4AG9{wl8CdSc0*JZXd7zG-|0jTsaIvN;%G?D~jRd93Q3Mq4IKoZhg3ju-2@n**up ze6ni!nEPe(YJ{fCmAaFU*9pAbdHcP4pUoTP-1V+=i=y*s|1#|Sb)ku%p#5TA-EW`$ zEFK{Ys%ihYc{`}%fFYfYyKi~@LeF#4E2C#=>4*0{P1ldMaUSLJkl^G-{MX}M!Rwdz z6WX`W{S>EMv{hRw>Z z_4b28%XlW;TCCI0rC~#1bx2+Ba7_^3o~?n~ea|i@Q`-R0pJumq%fR`wK;z>*p-5D! zYL%>vw6w6cJA5>4&=#;{GF1nX4=^L#?COMvs5cr_zC-7Mc{zw zrB}ig&+xIFpy`4A@7DXoK+2G7N0tnQYJ@1K9Xe_%<-Npqrka#y1StbKuS#z6hJJ?k zGqzuO! 
zAW?^Ruh;MJ1%xd10%~le{4Nl(}2RmSo6&Wxl(A96{!JwFc1y?5X~mYVrgd143557 zqH!$R5!hf*Z1%bcji^k&XLjjK^~=jBsEO$LVikAqJ~%w}0h0xuuP2er5Sy19#wZ-# zz}vJy0xm~0l>9(njzq!+UB?v(F+{b(5`v;b#79%z1pES$?^)U%Vx z`lcCHQC?a=5MfvZ{2wt3;)?;b4sLANdpEmA8*Ud4s0Rt5EAY%VohQgD`zy2JDa zAQ=b-h!9{-a1#;P-o4q%!?ax|5MO6)#=Cdpw5rct?_0-EAB&FDeFAu|I=87 z(k@5!U#!}%cX(S%EZO5PlW3g?%^P-g98bL3FNR#V>39uS+`+IkyZ@@>U&&!ryBuzx z-s-#*^7hAPz36W2K8Z9}b{caA^}}{Q?-hdpY2S`@|76++eCLb-)~=OvCpzzUhjkw- z?-wwe+XLVAM`d$XpUl?-)lFV<2js9!#ZGbdyZ0>?oyXmTo%hjeb)V967c$*jUN6k#*6FXe)XR0a6iGy{+vM*G4yR(ytmy8xD>W>ytg6oK%^Q_!cU0WF zk?h`MUTXyPW?Q~s%B_#44 zuSVEhY!C!X2%V}cB5E7h_|Z&Po521Ki6a4f{=NY0%e$aw8fs{U6AtY5#|A1Y`&$W# z@S;|q52uTQ^_7x{QltTwzjD`331%cux(L`VAd4~B+0rBYryNEdD)}#ncg#3vhSw7d znnEx->i0Eo+F%gWax8XZuN~FVe{d36lAf5o+Y35i$z9XM^@>2`npjI$At)Hyp7P}$ zo2^W*Wk^{;AW@QK9V3%=SXVi&G?(P;>Noku!h#{JH(EFrkrEW>E|H_ugy^L0_L3FP zYD=e!~gJvD;rv~jo^z&L9C=FJT(*T+s5KQM3_WDK}1de^LYk8bG=ut9t)3Anl~ zd(O^Ujtl5$XeO9Tui9WGq#R-s7i}e*nxTdi$vWw5Qon|edglBxcQ1S@E2SSibv(5* zU~GS*OAGECf&+fMLI5do?!n5K!C#nc5g_7?=r>n*JwIiQ$I#7QGk#$9BM-sOu?z}M z$q{}uyFPI9b~MP;Um}IM1;_DD)eoVvZx`5G3G2DyAB0ag(zn7O$>NG2p)YdH0&Rj; z7iU-UpKYw1wy>6=Q1QXEr^Jz^E#q4~hDiAJaRmj0j|wEwWV-gKrj=`z9Y6nUkU_R?EP4T=fG648$F>Smv2EWD2nb zA}JY-vdY(2TfDR9gU!>ea`=jRIuYgwdDmPd8OxszLm zO0G1~p7camu6t5Z0TXgO(@-GqHWNicyD!}wk`fz13YhatG3}T&jvw+#oNK26V-Z}U zJ60iplJY)g`3m!|#B~2(5t1jI;xzPcvpXgGiI+2ea`&m06{6m? 
zJc1;bnPoqSfa`=1y(zSo4mU!ufhk0=$3wG}^GVd?Nx`G%jkNP)`B zpE}V?!<-Om4G|zLu=Io4VN^BBoo7by@?C2iexH51n)cI!AN8-fFgC~YNPRG1!_p&) zbh62mQyDn+J(?vq31Qz}xVOmqoUy3lXvgF{b5_S|o$w`?;LAH762!M&YN{|4W^|n+!T(KD^lbAuE)k>!Jgv4LV&-G-EOBXO3Xst{L zW^OJ0nI7h(nphoo{#kg5h(Pn)p#6VZ0AW)BCxc>3qs&s1&Ovsv&*RHEjyR*dgbCC) zhk~~C%80=^aCYO(Z8@O^gyM~=`{;1V7ziti#>&i138#h)L!?+Yx1T<>O)S2`6qE*a zHS`VR4n9VH!0DohdakA?ZVBgVTA7_13^hOD?+f|xYro?Oh09~TnaAboJ^N`hdVm1Ul!aty{A+rBTJ;@7qo3}0y-!U$>49~Q zAE^zUEG5YVLuUqf2bo;X+j|&3TdM*RN@X?z0^NOv1YgBCTfS$ z9}oSKuC+nT=p=59q1iWHhV#(d{F6?Edv&#ADS0TBQ*$ zOPY1ME&eLkFag$-^RSh|FX@bc^l;X(Ll7eI1Ink7kCm`|^RjG|EwSsQAAs(DG#B)} zd6ZBzY~OXVl`I(ynPJ#RAm=FB;J-+N!UH-dDazA)->V2=hWS-M?M%Xb`3a>p+>Boz8@ zsjSN;EFN^0!zMGc#gV!0bL^S&v=$<{DkCf!7Gk+5K%>@nBV-$|i<}qUMR~d&G(~Az z744Xp^^GOcT?l2tC$-eCKS!q{%M^?du#R)-F}PA7qqzI|EcXi6^lLc5vsNm$GLH)A z;~cPBVG5CXl--Ta;91s@qDhcSeVf4OirJ4@R5fRwH z{-gZ~OJmAky9qVWvo|M7p77UNW!Q~HSPGW`v5dGW|4Jzzc1m_2hZS{2qhtR{P^U9s z4}(~XVQQ-HkC>e29@k=`p$JzA zaHAudKYemrT|X0Lfk;^YXO_FBJ-#RhI)X$-5Y} zM)hwioaV)|k_p|$-k;iDry7mCG{1(Li&YV%T^}&7Nzb{8d4M1%yl&SQK%r% z1Wa9Wos4e`WR1E*9mciWDF#Da zu{HL;7C${c-(TDXYJ_UEC!CZ?F=th$n0nih!lm3mJwh(0TbUejAcgMtqK!AfA~TH4 zzmPJ6R6M_94)55};%Q3U@I_*$!J~A;`8f{=-Gq3QhV_P;h&?K|NQ}7xm50?ZchuYw zGKho`Wm~&>0acr7c}38R-RTyCqCD;k>TxZl3;J6sPassF4wY}kMI+sck6u=V%`ZTsplXO~3wN;@a}G?YFsd21YZS9`UvuB;DTK zTL^iS7mKY`)jnSh`fRdw;XL9WMINA^M1ebY1CjA%_u$D}9{uHQbneW; z%ngU%LuN_d3xMXqM#OG^pUaUZ%WIYGiOXgx2-OGfo-m z@9IDV*fE|xDHG0O)q-?0C&;(X)M9ZJP{PfyduE}f^Bt>LDAFos#Uuy3xUuQkHMvA~ zA3!fjm(;Z_t7;{WXjl)ll(I|=my5|uR8i3s$*t##w)?La!owUXWCB?@(nQQ0ModLM zF}8qZ_E1ZkZiJ3Fl+2w#gXk=GnTx$F>U#10@<3X^xq;5)yEa0t^oy4ZW2(O@hd(Fn z?e%e{jK$P@DUW}7ITpP~@Du~zYOysD`$)@LR`8Q|*R)MCJa&m+aj@*RYQ!Hn=%z5# z)*NH`_2*hFp!W>-BhCFd(u5=*aedC6Rhh=#7p?(bhq4o;87`qZMXMb~~$ zRdFWPi|U`APEfhMNf>4m(wY82Zm&=MmLqE@m#faHStk>%2qz98a^R!|u7Q43l6_X3 zhzH4T>0mIAGGWO*+o!!I$H3@5S5}tZ(G=Ao^}r|D#+j1gp&`~1&5pv0KnHUU-flzjA z;~g@_mK{{V$JTxCbBz4AH#>XX-|_#YX3sm*PXhanS`r!yC#QeymGcz4Pmx#<&um-> 
zQgQSSo?Fw)KVj6l9VE4dFGwU)zV4*y0v=jI$D40DJtf{dpH8MXf*m=D|M_23e9LQ?cHjkDREMSaJRSs7!rT!*!%?K?Q6if#4)gT6XK4 zYE4_GA}POFbEeV7IqBzDZy1rqA81Kd5>aFeltQ_btsz*I-;@9b$bt}05%h1om=1sF z(aZE(e-VSk@i!RbAQo_P_N7)FpUMpjD{SwU!-Jx`!RQj2y9HQF8907Y*D~BTRszf zd^lSY(F5l&mWy~vx}*$P)j`}Tnr{=~?%X<{8P~h?aXzHS@V|1#p5G%&r)|OufOkFJ z58zdNhe{F)G`Qiv(ifl{Cr6Ytt!jpa-Cu?EBSXku|8Q@|ZHk2>F|e#XQ&tU+Rr%{8 zvN2X?amq%kQgoN%mKDsHr%ZRojGLF}7rXeoRCPyH1?-)iuS~zSu3Yxl3Zs03CI%+H zl2YVSXz8lAqBsj_yCjO{qtx+6EswHVTKi=ZM#$;=*N0+aW}nO`XT~XOB4a;x@blvT zkx)OM+gOvau#m!<&^i}$o9lex=i8RxR?V?=_HYHf70g;2C1YeWw_D^?AimSLMmjDp z%G95aT9p(A=89%Z+TcIj7g~{c2%xSYv^*bSbed|i2c>#B4r0Cg*tb2KMd)!xW;+OK zcXr<%>PG)_0**6Ph%?%?2Cm2L4=e726yG?oTKFHzFM}Pt-=G{nZ7#zKq)?2!tVF8) z&enxur2H0dJ<3Z1750j0wxcVJ%!%dOf#9cfF9-qIu2diVH6Szo+bqU8EV~HQJ{U;8 z@Q>nwN`*XFeN71=X%NpA`&wfR0}{+D%(L?kr@`HmP>FvK3%0GmFLbrC;Xf4yo?N0= zOtR@hQ5r|KFR>ZE)6|~Ij@Z#E*V4cP6$JV+5xf}RC~G4GApKR zUbn@SPonkOU5H%asj)c6=vIki{yCBwG?#DqUkUqdTsc#l6U*ihl1rvM=% z=CC!XFkM#710?wjzcV)`By4{>0ISXts4y_EnhaJr3@Q0M0V01HO)(}V2AVY#FWj%w5q;B~B|W{>Z`pG|nB?#8cvO)MP-rZx0~2KZ zEy|!oPdLgx1S3U$Fah^fML=5>c1!!We}^2d1Xt;evYwHY>&;)6bQ%m*c_B#g@NwQUlgN>okHh&*!j6+#O-(NqyFm4QE`F2|iri1ZDuhQFEL(v>0o#qX5R z#60jC*|!NI3@aq8ixBYNXdw=WZQ5rz1}mn2l)0%*v?Ffj5LP7+(q5luw6 zI-T<yV}7JS%f1#Mk7T#_JPd=_7;b!g|13( z*n|oF6kJrBKy7ttgV^iEnjZeq@Y>p;fQgW(!OWhXt((6b%}qvx%al?tJYW8H`?0f7 z>Vu8p;FY_qV`q1S#c7G~-vQUPjq}&BibD6AL1YSmpzYs3*`#VbSEdt~;RXsOhhuSs zlXT@6WHyFOQPK4+D@@Pu;)|y}RmQggTi})1XxQ;%7OK;9h=k_g*z3Ix zieUeEHhA&XR2LV4R4V$Kn`y{|(e@|pbNtmim*0ECmH$E5vj1HHmu;g=pnlIRIG4?L z?f=|esRh4N9Ya1RJVJXzf~}oq0N1TZ4TO&x!L%SB64D6;Qd+pQXBnEt|QYF3h2>QL@sT2dgfcN(pBQj_7`@YlnUo<3wz^g}b| zEo0mKdk}rnQcnLBvtPAlw^0_4rqaCb)NLOt$_?_3blj`Un0-t4_TJwRWCH9I_%$_o zB4-GX`Dpqj>L#y79=?PHYbJ(Q7sVizyyWJ@ZK8 z@9I_6{}cY1tg$1yxUyn?qYJItL`D9&iCe!qe|ztCob_SBKeDkYyuy#V!Wc4gh**%l zM`%Y$V(FvEeWEMIN31(JnUy3_1wn83O^FYqj0^S8FC69($nG)T4n?~wwfrgmL4mO= zg-&`|r>nd^{YdmpDB2gLKy+Bo#Yw=g(uXezn1uFAAr7RVvfFv138ya7?c*Z=loln+=oj~ zT761oYEmWx{ 
z8>88Il-u0t6iC!Rd;5}~4hD#hXf*9(6gjtx)wU0=DA)5Ma*s@&A`b#>{H$ACmoEQ$@k7?BqanVFY@}}%Jd{y5lmY7cPA%cZB zRrV{4u>vozt7?pkhWh~ohNnD==!4LaErX3E9mbkTz!HIyDd9+iOHZwf3h~g=i+(ek zue6w;K3EzBPNz0Y@=S|H8#XDq)PG^VBE$zFSbF)#E+@25vk$muj2AVWfO#X!(t~{5 z`sjyVr}?=}UkhM}M%tRx@Gpur1$((UcinZfdFB;s3@G^W>6B337d?Paana|Cwh@ID zUn;18_YemsF^*oyl5ayNWVO=2_~4b@a6Y~cb8BkKlo*HY!y5(+iGAem+T;9Vs>r}b z_rxAT5@9(u`PURwRlDvvReK%asUrI_Z0Nrp6v=}o%pi<<*vcJ1MzO2IuzN?adXiL; zn2O%YF720l%0zC1|F?{v!C+xO7eMu<=;T|TtzC?yz&9EKv)anxF_(U``h1EHTv5zMJi*O28dSujuQBIL$`3iv zN;WBH{W6E0oys>FOG}w5O?Pk(pa6K(MtIE}RXlc3302my`W@+{r@~F#TZl)Um07HR zvJ%`eqDH%N0=$BH5Bcn6F>x&3mW&mX+Z=*LgnCttEYKcMz?e6lc!>wfbaG& zm;RK`_G9Gf`{tFm6Y8;UPwJ#rgL^J4xSgdFbm?axNF&II8)xh!g4mhQZ^bJw-*2sg z`4!-K^^%_{oldPoLhXu@RLO_L(x*B#57Z_LAH{M_sxus|LdHtLd|9CS$3lZHm27Q1cfNOihR$;HwhgLv$xFJL zs7T5dv~pWC(ew^2=9+3qw1#$`HxPFQ>KmvvvYfAC1Sa!`R|)bB837bN&l`D;?0wfI z*_URhGvR}0drlnSZ1!0%tp2uWovq?P5AkkCU+^>5^hbOF*I+&b%Uf6Wi?3Yo_d<4U zG0UAFer}n|Tko8WR^59a%S)yp6!6-(;W{4)#uD3>yPLfOz>REG+hb94tKI7tvadSY zc>6HjH#oTQ%Z43Kd*zJF%R&#ypFY;sr9!?Zy4PaUPyKA$Gd)fFYp_(TQeCYIbdnd~syuv{SIo~K{&ymQT5|lSD1+wZwMhba z-``oNn0fmj#<7rqP&V~b4bJ>NjIK=edlY8i^shohRt*i$6*6WtWpU9+GqVmZEJpP) zw5hIq(!8kS;OzXR$1onvDeYzYgJy!^F;dp4x~Sa&7P2;$KXHgCt+#^eDH0B#eWv|X zGrzvd!3=F@Zp`LA2otp21@N{hNvCbN0C_NF*INjQW3{}1)G0fG!^c-5W*{>l5E&+z zIieMHl9h;#rDilMRt2Rlu2tZJ61c? 
zPLt7R+EX;ocMicr=>N0M(4(cV?}F@+Iis{#X@Hr|i9T<+a1RX#BpRv^vSZ-~XRCBj zP54&1cfcmWRy=_{Kj-6n{?h>v^upEE&HG@E(gnn`TKDgNuj(Q|re`{SU0h@__!z!g zQN!zgg$+>c4A_CHIxi~xCO;hT)?2OCebPGZL&?~6?gI*ad}i4IX5|m~RXxkRZ7_Y5 z8oVA*3y9BScAjm1MwNHn4TEAVx-h$6&H^GyoU75GGh8 zoRfKPY;3J~%(9vUIf#6XcFiq(GH&p6P0Q^|A7$Le(0r6#VVZ1KzG8C(B?t9J*LOIN z(R(j-*aIj@n|cj8U!LchWoN*Xjs->P6RTEqk1D z1V7M?kZtf8E5X!{S*~E!rub=SEDxPYIXR)l77~?c4yk8WUNik|ImiBqb}XC#=6RM- z**5HY_WEk5E4aO^{ejm5rHiM2QkZ1v3_%ghI{)lE%4)CL9)oJy+Lm;+4D|^6_;yfB z$_bSNv>31dT;!N8N8!E%oXa=;$zxMW8FJ%m3>93+1$=LjC*(tj)T**e;w|IKNNS9a zg0&9{-E(KX^Up_F08){WApw~lnSWb5Mav`$%vPN>5TC%NCnQYpY>{RTmuhCoDM;UA z{v?X{PXAPZGr1DsVorCGRklpS*9aDHJJs!u{mY_5W?fGHeNJC5$dn)hCr15a&AXc2 z;zEIKFuQL4H?M=j1H1>HgV?9m}${Mvvx~+A} zAM^QJRfq^&Lqx<|co9&My}>x1{@d%Y9}Q#2bxoI{ZuZXV^z(k})#s?iXFjdo<7@%! zb)%un{r?#MKVVUKAJ-N*3f}SqknB4fNhr8z)-o*PL2M+wEn28sOF4X3yGZGR~L zH)_K$!_Ud({j05KWpL?w-Dmis0iJIExS9F^-4yqEeZRajl4$N100!mrZtFiiE?)!o zN(>A_2fLsCl6#(O`j6t-nHt?@r0V=VGXZh^M|{#V#+5ymC{`=Tw6hZJJM~#(*cCD` zF$?LeE1+v;3tH?hjAq%8AhjEu{u5LmYdS${{ADB{s4p{2(^1Zn>D*3*Ny`gc#Yp{^ zvsO9a)=1sJs^oe>VrB+q!TA2jekmIwb=Hj^QXH?yW8MSH{ZBCp$LLn1t4S4vy_Fo4XKD!7!fQQ^sZG2|6?-O+Iu7NK%_47mL?Igdug!duk z%5z0NkG$qRBZkW$=KR46GrbjBuoe;x?)*m@wv_gY$`;!%-T3^W#Qt%D&98u%eQJQ_ zFmIAVWMHKc^D#3%a?R1-pj`gepxv5mJec!=$W+40_FuxP%dEa*w^Y)RbrYNmNab6{I^+8v0)z&dtHm(b<@b+4&R4<#UJjho^m4 zHa44}SQAJf|4ky)rPA0*{*C0FUexh_YumQ-I#~3JUDL!_mD7Pit-+j0LC>W4eJIoE zX2BYs<|i(48*1x@Bx1OJ9yibI?AR$T4GS`{-hwnaae29E4tMLGD8bJXsZf^FU&&pU z@QfY(WmDM;JDavWIYd2}TNTET_n6ebcrjcPuuF>m_3PzS#C1f7Q(>&qh?`KTYhqUw!Uw55o%G;k^y8k%R}sTJPS1IXTbE=`M7pxBF%F;p&dz3pXc$8jg)Ku;4rX zb7Y@(cGmFiP-u_k^8@Gltoy~TWq8wJyB(-r?T_PsjTi81+V8T3_>8yD;bYB1{4|yU z%yN7|@tX0aX$F^*J5u?e6{PCcd7|mz`k%gxd3OvbdF_6WE$fs7X+aMiT^}gBVUc+PYGu{M6z!`!Bv3n?>NVu9!NmT4^r?VS!-J2c)hcyCgi}M zxAPR4T36$c(U{1>OaP0*xR+*1UH)%k*j^wMYCKvMMm*=6#j@mrHtx}+t?JB70m1c2 zMz&)0RApVr0Z)*xjXczvlAI|*(szqzKWn{h)6TF2DZRT{^Xh`0+z z09KVzN&>Ap1-Bd&8O|VihpJ+$+BUYyf@Up}7~0w#4`S0KmK@En3RUriZm;#eVJJsO 
zscmqpo1|I$6~yTnFcmz(psB2*sm0AzP_L|^wQTjYckuUtZ}D04sm%5e=XU*(bH^44j!)*i1HH7MMi4aDwljLcUs-Ch!T~J;Mc29moJ|x$tr_?< zo}H<9RbU^_0R+V$faq0%P|M|Z0If>j-$ulp4W1Um_=^4T8%BvUtO%iw#vxZ7d36z5 z#sPlSJM#%nws7F?+FAq&gfxXjr{cPSZJ)YghmzFG)jc_t=Pdq;0!2^iiykH?_QUMf zqoCHDVXdQ88qc8~q5jnpFoJiU)BQP3Bg!Axo`p2&pP*d3TmOT(N-y_U%GjV+bK7ZJ zSr5#V9Mc~nj3hxk*09nH>C-eRtu>23*nbjj54@ZOmVsirQ&iVC74mu2wlQ=nSJl`OEffRgj$R9l0z6J}bl}kqXyze0XcS@j@$$d}pf3^|& zt%o?2{Wh)+!}#}$b-|EVgV%hgi}%YYrnXbo|MdIdUM{TL>lXI9n&j2CItKW*u)HsV z(lQL-UAk6aMQbi}%s zV8%7uRblvKo`^YOWy(ixtx6%)bD|T5*ukhz-sYyYLl@K^AaHhzlqMr|(DfWI!r;( zz3MZ}lA_>d-i&EyY$UV>G66djT<5E!XG|1xDvN&MA|Q~*EK_L$RNT( z#f0&YdCT%7ZLjowTE3>GOR5(xe3Y>K$55&s$ z?7ool0F{XRdI;&%DLf_YFE*H?MAy9Rmjp9}2S&FQ2=`?<3<RJ8q7(9jy$rx8FM?^UtN}zFHLUSebtGpe(Xv(>oU+1!1=|29hZL4Nrjnr`pG_6YMe7@6rc zU+5RL&|x#}IvX1}HsW`{7N(K5M|3p*4==@@`L5SQzS#xgot&ZnJPy@<_wjp9hL4aN zj{7VE{%=oK9XE?t8`oR^!M_IY!;1O%el#_F8I;bEt`ha>?rU&0;NN9II{UR_24=)0 z9Tf9JeO#{K1Z^Hlx6hJ&;Ez}cnAz8S(=)k@RgB&R@Bh{>Cr~RLed>v3A-_Lw^)27P zX?zT(9({&UxKY(Tu3Rsnto{#hT=&V$ejB<+=sY?8D z;2v+t26}hochNSQ`8X-Ue%D)hvaS?g6M;yo;P;##8QRs$gIC};^DXQrQo}T>42etN z&rZoNKxP(6Dl@kYrfv6cPep#EPnjYH+X`~@CiD4rS0c}S64$$QBVp5UvL;Z`2F;gQ z(&O<=8;JYFP;5iq1;#hOAbus9;=6)KJKES3A3=Wcl1dZXsYBxS^@N8-p~qf4w*`C5 zay$+ou(4m-^G=`e0D!)S^*Q)R44J*@RsAEwm%iMx%(7&`kUUwX0Uvu(Mno&woFSjv zsQ@%qZmtI2^z2KrI%Z%4n&)NB{&d#z z*VSvD)b7>i1J8Fyo_=uh+$-vSWbZiU>cU9hI&pW|yanq=BfGmUwZA*ULr;HIFr< z^U@ErxE3}Uo}bf}s*69LaQqu$G(B{aG8>uF^1e}`$3+-b7_Fp)Axl4b6a*1{U}G1#zjkolS)@%P1W%(V7%e7K)>28SsuO4K3n#QfaE^0B|=4dC{Y%mMEkQ@FK1O5 zo04mhjG7j}K2{(`EZ$Sh+3!;$W{U<7S4cP=kh53M#5~rExAR>e zg&i|Xk<&#X*6X_o3~5{p0eQxZQmDI=Ao9k9y6Nt%ftIp zc^_IG|Jh&&K40>$L5jY}TpI}mxO%R$XnO7^7uVO}{$Kvnjymp!hI_OQ0vRLVw(p)` zch0&W{J|Z#V9c_?qruy}kYPN5kPqUpgFq|-BX>wNlOW2no}Z@gb3xU&Kgy&v3jb9W zp1sq42>$0%#NlTKpMo8r>QB7?fM}Erhx)taG7-J9`4>g z8c35NFGH})0v1ZMp(TQCp__x?bnFF0Vj;%qa!*PKsb<)Cc3d%L$G7Hv?s@oq#!JZC z5R!sxV`EwoOT9B7O$qtUEkr~LH#SUNHU&G+{u#>kAIiE4d$3OedU|RcICBV#< ziEoQjHI51nlqf_0JpoS9w!DO6_OAysJ$}n|OC8!GjJ}6mtqHBJv>HyOVhBc@P1yBV 
z=(Io8B45rJ>OLl&h|Ndtr27gyn@7t+8j(Z24uGV$1f~4$#`&CI7AEO3BJVcFL|Q z=dt*Ci5Px=H`j{GSScKrR;{$}W08t8ySCYo(U8!sN8ztg@|kaOaA*wZn>Fw^&S$1x z=b+kF?)1GQ8>4rHyfb`FJyoNQ!CMOzz_Y@ypq?k$Quz zXroe4Cncd-z>%^bJXzK(Xp$0a0Isd!{#WeVhVVNOWgm|lp=Ns6I^RPGb!Gm44;&cW zB~g4DdcAU2eGtIL4tuH#-$F2anDM!ASA`7pi;ZUD4RY}Bg91$|dhXbBQP#*Xv#DgE zjhc5e!3|TeqH^0XgMC4W##?#9|M`rhz)5+s%M(Av_44-QpSIdCF90~NPEQI6MVWAR zDlaq>!Pis8P$YSjlQ!bO?|PBA*Lf`#N;ql#g|9c*3D`xX8ez{0-0V+WqQ`CX?`>ujVV6A*Fd@OfXO$)(hbu{)}!#A81RBr9~#i)Nu!Z>eYuDs zI;51|rvx7h)=hGdC>YgTAI=rlB_u@64FBC#VsNxt{uXi0gZVe#&QA=^#?O%Dtq8}2 z>(h4)s=RWk>Fh}L)xa!f12}MAp9k<*Q^i>+hzR@!-4x;{IF1B;G|by2dYGYf)%MT= z-F#aY?wlJ1lY_z7m5&i=_L-2~CSC0?NU^7=abbdSY*{|QlWdCaUyZ40{;e#^StWK2 zYVoYJZLO28m^6T-(akG;DYQWC9a(+(B_RTRZB~?YtrmdP?`}Y(O2^WQ8v6@l$Z|dB zaf(cS_o#vgcu-7DOQL-Hti`2A#vt1|b;2~|fF7_iJP?wtr2LNM(B@XD4J#_Ds=~Ib z#MeS2w`fRWkSLdu%Q{+TB#u2b*Zs5Q^{jQyH88q?=|A`*P?+?;7l@xFw2;4g7dAWp zcfgk9g+?6_@WPy}_(-!x_jmP4-Yb6|SsPC~N6CRuVplGefN7)XjiZsZf;QGDuaJQe z4f(aEU5Te}Fo|lvxqakCe_O3ngb?a#2snw%87K|pU47lp7Ex-Yr4T5WGM z7}zryAslGbmwi}%>hhkIvY8*)oA5!wInB{<`Jw3vf^BGL8T zr_c8i;N|Ikn6V^b{^Mt(Mg`fSw^j1(V39>Bc8fH@A;4v-(<*v%+)q5VMViWCD(@xG z(eL&1d^?2-L4#b`CC#EcZ?XFXLUGw)Y8^mT$|v9CYeMwVzG zqJ1Gi5^&PL_pc1J*j2e_;C-AQJ9Ln$pEEI-s;aZ3w^JhhfVf~TNAO16T@gu(^u2vf za*awg)n`f+otM0A`j_@>o`hBK9ow{=^>8P{AIS*A2mB+a8PkdXi@(5&K~Mhh5lXVw z|3cCT$B2Nwr04b|Z>-|Ub(p9OP8bViEI0`$qwBl{PjpKqT~+p-tWYh45zBCcHMbG9 zpL@r7E2~ghqXYN5%W0k=7V)x!2uC*V7rk|6mlf;_Q$Lxn8~9(;-O1{ZQkMv{A%j;N4n7&?~bUgBr<^EhC3aY7AZd`* zpuM|ZN`;6;B-Q>+a3a^L4ozy{RyAvj&ORn@LtF=k{Mn8RJb-q*VGw8nys{;N8W<6ayRbpt^cp!2-?y z%a{)gb9yIHK_3X<13ip^_fnw>wgWl*F`#0+Ta{IYHg^Ykqz!pE3}w><=IN0V?~V{@Y92 zx!+hale7w-_S>tl=W zqKDv!f(Mg>;3V1f2kRT0ZyjFrnu)T2Z=NCs)va2L%afccvajos z;MK22A9c&?l&dyrw*L8!)=rrb7i+ova1|kTO(Y{JbXW@JMBePL86(d3aL@wuRNy=Y zxq?wHDawGcIJAM=lwmDouZ8myNU`wLP(OKYJ%M0PZNacf_Bbl zTJ5pR@1A${=(}NGA$9vcuv(dG+IY7vG|pw@k5*t@i@^?Po^k2)lX1`nHyYX2zZ^_% zi*g*Eet*awvpw5Aal#{|NU~LNn%w99DZ2B8-Uqwoao>XkWNt5S21CUzvXP6Mz?5KX==GiqP=#yV-r 
zU+1xww3iCXJ|dzeM)BfCGbzv7WXEs?;{b+HTi^;^h$XnxgNSvAYYM^o%(2D0=jT|CV)LUL)g!* z^Ck=QKF=I@e38(jA8lD)P3Z^FU(c;Au=W>_SpGx-rdM-_}i}6-Vk$>Dw8*gME17V9d4`O*zT* zJ@*TFAr!}V<@6r%_Os!AY zntK|E=CK~9wMF`_iArghPe|A6uHM?p0flU$`AZ*nAX1Hk1S2At_F0K-)O7SVN8*kS zGc~pN;~p_ks+OMFkxc;wW2;E38f_2`DR65-->UeBSu(Dw zL~@ka!Y|biRPWx%ZRH+j3nE*$mR5N?U51$uDqc#J*F*ri*k3Bd@PI_uLYEC6Si&%>Zn1BIh4v#7LfT$t zYRrJWFqx%EO@ns%(Y~ESoC^EhY0WQC&WQJDl?6WoYWE-P1IydvhidmHW&27}J@oq1 z;MwO=*D<9-A9&-YV!QG)y&m^Z_>Swp>$@+CzTV)SA8fIJL;`ho=HnJl`~XlVH>^os z0t;d6PXjgszI7Z)2ZA=9IgY`hFyY_vsf#QcQ{Kjd4<;ooi86cj{tTw}g8DeOM22+i z4F=XRd=Ls3rhCXu&IjI;Nc&`kudz9?mVH_3W2f>PUv|Btr3cjLG)kIQBQav4nXqN5 zyvTZX`gYs8;F!u`#uv>vXCSzmw06!Ja~hl$3LoL56aa847`shL2@XlZn?}vX^(m>t z(Hot5nM=@wrPo`1m^i_KuEFJT&2+I@`*lsG0#+IX1OfXW`ci{N8; zU=caTd4mj8FxigO3oH1(^zeM(Z{RA9>$;xa?8S|r*SKvc$f1mooTc>M#XUG6F`}Ha zM@t))EXd{qi+vm>#!x+wl|X9TRk8~)qq_$PQTMkkG(<7eRRrRJ9T`q<|jtS@|8 z8jjP;!m2{f6?9uwzhCwHo?YdB=JdPB+eCaPMDvEPt?t<>AZB?;+G-zWf7TL?H~Nj1 ztgpX&uh(;8S-^Y!)N`i4deFx3eaMdPQ?GBZxf|7^br`FCGe#h=_jfsVWwCL0v>w=w z%o-`p7zpv}Eq5-l=m&~zOs}I)x~61-@~+LazwJl~A1J~KRqqbToj_{T-lW;dm79=* z-?vphuGdqR1h3shCv^B+H4h9K;l>Y3?^Aq(9j7AKSGDIT!9f2Yk>^+~JA>e%_34W9 z{Sv1)4a<#1kcRYkV8&HoXnP%))<7=$W7!0rG50oz?0E4W_ppA6lh&^8n5(df6()vB znEU?`_0~~seL>eS1xibCcMER8-QA&Ri@Up9f#U8~+`YKFI|=SqG&n_y%bVZxzR&lq zmA|s?UAeh4=j@q1bM|<)UWm1fh?a=R&3)3uL?eVQv^HutmrqD{F8Niwjs*YA+G3Z`E#FrDFhPHEiur zFyhVEeY3jVacbGdv8s!I-*4f=fDHs0LA^9B4HqhM;>pYf9>*%PNb>uHM)FI2v$Y!^ z_0#&(w|XdT#^>X8?=i``_i&X=WH9Fr?Y}@%?A6z=_MXmY8$^~D{LWNUvj4PUAue+CqQD+RbppD=b#o&yk3Nrl_&-SwPy z9=+y$-{Hw#0?1aIz2`jr2hr@?KKt$;VRZey&utB6&WvNc@FBQxxu0xpj;r+^F#XG= z;x*N>RKNLfF)Bh*`|yXl8lkvWkuF|%A)b^8(w&Z65A6;rKUW_2UDO1j8l zKs8ce68xqqAtWPS=^=)D&1}kfTi?Be2vO?Wnw|sTI^qs7XE$+)dD~(_LuYH)K2g59|3qyCT^6%SWE3JUP1s#@?o%?`QAwa2c7}%XZ z{pNV}LpOUUhQMy^@C%+C1ObB_#lcytiOkRDvtJZA z$qtqpt)%S1-h)>K5}#P*urz|mBP-QO2{Go5I0{c0b4}C1)uTnrT`!!ZIqCzESoZvz zPd6M#{7hteTVqk{K{cm`*PXCjK_mub##w#RE1m#6BTqbf$ZSoF^q>%h%POLquOI_# 
zAnV$UTpqA5Aq7}XNw1u+VXPb-pD@?bf04{Tyt6w}#u=VYactYbkrxVFz_C=(m{e-d z2kTHJN@lM}4Wp*cz)4jzDSKnk)Hymj?=!He)CWyeD6y)kc*xRHSSTHH7HAgO#-@6e z@X=lYN+elGlh!v#_{E%L+yP0`fC^f@!UL**-$11YI!HrS07{Z&wXoZ7cFLeL1{KAL zkdU(#4Rk#rE1KZ;4X6l)P+6hivRp8-u0UeSm%a<}Hi{O+Koum-f9=-ZG?qNd>YT)= zkX+GEEuWqbE;XQ4d|`Bqo}(VaHrs#iBP=iADcc&qvGm;rfo_?x`p07Wh8%4tg=0Lq)_?uz#I_PWHBZ_05Hwf>&lO<;QkhE`Lz)B)< z(yOai3V0(Ko7qgkjJ~3hAIEy)5$>8H<0J%a@_ATuMd}<60AV58HSV!Ft`%nd@JW3e zR-N@>ZWqT-BBWi;S+XDIEQm%gh%BhE@9O)gF}E`&G;u(Gzq1DaAc? zX>3)3yT+m(&XQjkrypsbLz1Qq-M5ao8Jk}d&-}yBQz|~q%I7FH&qNPBg$k}r-zq=( zns}-!w~hv}!qvnx?R5|6tA?`E>wAJ^%?8b|3|jv&iJwt>A!vtZPm|9S)ST$ z-PfcBnFSv(K@_zHlO%ItFY}$7LO5Q|@~$f*G-^?f>XplUGX$ z8YNrOVh7~Z#wLEpcm9V2vr1KviT_}^pcHZYq2hcg$a{&F#c7Eg!G&f(5}GR}%z{?V zn{8*w-~#<(nww)i9pL!XER62!-{MYV{K&@5Q4=SrB%uWc@|nTAbH_|@SlzSSh2LZu zWB4(z>7G4xK^I0w?lUN*Y~6vsBtG@KSSY=O;wQH{jsv?uq+_Kg zVgb}GS4eYT$>HoeSB1@>;7*zJJhJ>Z|ag3~957F`-&+{SIz1O^+pSags1*_mgtWaHl^%)48witqD8*#-hUE zP^~X>opA@2+1G6p>ip?IS>=sFf|=qcSs|Dr40}DxgZmYavUV^11jc>A2(Bgq159m_2A;RLdomNE?Wj2yJ5gy-7#(z1o4|4<81oK9Gxf)W`z_;JIus`Zy;vwsbvLC5;kVls?m=DXXj6WwJ@*e6(;1}pv29K*g9fwyZOlbYv_ zI^ig_<N)qHsYxv&~Kv`6qNWaqB896vKaJCY-~!5075eR;Z@i zSvgf!%0R5IoRd72`0eWR{RnJBT{i!gDh3f=6w#E z-ypvb%$DAev`GOOCb(y?$ARnb_IL-4d*skz5jUrM#vhQodpI&Ei)en!L?7X+@}HAf zIEa+bu#Q-FME%XxeA>XQow}ctD?7#5E^$hbglMVOPHTNMijw1M84lmsW68iXdqso! 
zysj?{ZzW*3Upd`vVYeVH#d~7;@$fST@qhme28M|VXy@f$#7PV#Q+-)gZsTPsI(S$W z?1rYE`2kD6t&Bw_k^iIaDppEC0^PENL^+Hv9a72=Qg_{hm;u7q=FaRMngcU2Py-{Qm2u@RY`vW|Bhrpaa#7&T`k-sM$IiVO1) zVj_JZVFQb~9-~F!ik&R3m}_$5b+wztH8weAj$jX>*+ zwtXx2WI__Sbi9;TJ|2u2Sy2P~^$VI5y)xlu(f0w@mnMd)C=X_q&C{OBe)vz!hH`bqvIdX4 zB}m?sl~~0`79ba9O=L&v+;UFBiU^rvCQRY3mLmI&+pv8fl6<$S&97BmJP=>W&ypN(WnxOR!M)~!AU$65Ms=z zzP1<%BO#8g_RZSyWL1(`x#EdoH)=Owkbc-TkE%KDvd;4_=tCN|=wi0`+Bu0cOm=yL zbIGk)&Gk<}{ju*ay;xuweL?Quwx{mB@rz%|q}jCVI9ZhsQlrIH6Dc0@w`nZ~Rnw?i za=#{w3-2bj>_Gab@W5`%_B;^{38tj>IghGuzg*Szo_i{2U)meLG}5R&`|(1uEG|45 zq1~RMBUZ+oH<_yMsc#h|68#tHAb~Cjcyvzdc3tJ zlHnks7qr!qeu#~kh$alJ-X*v*2{Um0oQqBSxjCD&ITn#c$3Oer2ZNin0llc;p-MWE z751xv4j?A_uS8`Px2{dV=C8z8m6~`v9?_yU3GR+Hosf65!^&IY<1CH7!5W?R3C-=j z_o}P1YwhpV}Xcsg{a-T$ml7LVr$^swg|_SzI_1!D2{tlA;y+dXXHz|x+P)tH-Y(;vlMHC_en$C9&IO%lE_R+AV?gw1Fm%E@YiORofU!SKd z^msy?!2<})lg(U)@@WI%A$WKc5tqH2)7S{Phj8)+BWz zx@?TQnxhWcXm57+D|tOB^PY|QtS{eLPS&AJ>726Lew~ul!wX?36E|^JbHzBU*0K)# zS-Jg)W2?XW(*~EyLmzlhk{gU@Z>bsI8(+c{hBR-YPI*Eo7IoiJCUAC`l~#cS`5L_? 
zcJHmIx(XuCKv!}HONnj8D5N^37*k-F17zmDvCVMS2_r15)zx=PIbyJM zjgwUhkuw+O@Ytu6j$LG(FNLD@%CL@#o}FfA+z6IEuRu?-lK){-!46tnTqLoQBS%M% zfuKuCb`*98hK8<+_ovP?3d|&RM|#iUNXd6WYyT^R4oK&wdUrmdr|~D<@dnII<=;Nj zk*JqDY}y@5As)0kT@^Ocq1>$BpU^;6&@&Q~>{vtCvmV_oP0*|x59Q{h`(@~?lu;s{mW4~=QdLQ)TGs8#yXT=>mbmWHcIxOz2G2-+#M$tlIaGon zaJAAebGu=QQ*(xY3tj%bsw29L;o!GljkcX(f%HzW={AiP$3?0o4t3ncXns)vp1oDg`+{My)bTfe~W!&jsQqBEcIEk5uv3E#KLB4Xp_iZ zF0I~5ya#rtTE4Q@$0`;pa-dG2cHBzDYr594TT}ex?6ol^qakk}6G%VPD}Pz6`%qScBK*!B2zeJ{5|uDtFY*Z;BF;~Y*XGywk$@3Ru9Z$Wf@?CL;V zy$DCsM2Dk6eB>jJ*N3RjD+Wkf&XTcJ&LJ+l=rr1BGL`6NrdMAQ?g&qJd)VdoOrbDI zZ$S717<^DuGocET;f_O?}VZGRe!7U1!N+DvP1SqfllrRmxeX zn`jZ0YbVB7cMHA06GvxOaZH!J05yo+toRU3`bc}rDi(>C*m)+;TzGuA)n4Z%Y)78p zhsB#(qwBzkzwmzlhoNe4huYzA_x-OhuI@DT%G&fKQXtBI4H`~jPycH756E15aJi?qsUOC(W<+MbSuk_J) zJ6_@0_)@oO78HP8bk*2zJ%fPS^5nG%8Cgl1vurE(V-V_=@wdd-G3}{iMF(`3x?gKz z>A5}!-lpdx2xhevDVI4n(t(9wp0!Ys<9Ni+78jDcWe(8^+dCkq zOVlkkq5zMlp=LJd2pjm1cZk0VuJAe3w5EIoOTUIatFa1Tc0j<-f=|+tPY7hGeWV}V zT_dU?-_iIiF$mN9>_wsR*E8V_oes}wnPW-|9bUOe<-O)FDO$G*Vi)n#yjn&#vG(PV z*{x<;65fM17waO?drhpUGh)KTkL51ED)X4$ z_~eMLHNrELQfsjA?(~7l@N-d&Ibpa!zpzt|Cscj~R*5n}+LM2V3p?zQH(U`b=9#WF z^E_bJY9{$4B)=wtfV>FVYj`DEJ2Sto%y^RZ_r1)oL)F) z#Hj(PbUoIaOz)8!yxhL38fk!7uW=_zaM+#|8BedN*hDO-HZLq{2s20P~E5I^8JIUAo=cz{1LZ71cEiUs@iyNb|6= zZ*JCQTO0WBDO;yMgK_PPvX!e?zLa=~=;s7@pz#+(M2Z_(m*gzpWP#j*u-C4Dv+gCI zCDKZd9QEcZaK-k$KUhf9x3>GP(Q~oF=g#qcsqxICeS*W^HhC(FBNG2p$3v-2HXTec z&b9u>KgqUN%kYsbAAe~A#)r@1w3ITksK7Mc^wJHlvP+Sbe4fJFi@aj-Nk&)C*Eq^A zwnosIehanbieUXOWQX6m9CGN)xmk2@lg$uYINJ7E`p$Z~`iBwhCK(Y_zRv!^loB5M zqt^9akl6}{Q^6sHYK@SlOZ-W34v_*LCN0fY!{xXx35i0fpwi21?3R17GtK#K4{SpR zV2`)~5*v&kj7hlajhDpn<)!L^kS3x3EvWwelk{AV!<^D?u$v_I=$}R^9)%+f~Srpcvh9k6^d3v-FeT>}dZWyXK7W z6A7u<-0$E#7&+Y>#CJJ}-7F9BEowAy_3{o#D$`z|Mr zAgkRmtX2!Z%v{PoWO}^{zxTv4#M)vas}d?p6ii1@AmE|MoS^{e*xEGS7Bil|a3NqX z&DzOvG?{sk>Oi=tL$C|RL#Mcs%lCI%iJGl>Q~!F>_4Q#g)`0399o+|6p=^h zlHAE>xf4OKTd!v^BsIn^Dvvx z8p{O zt1*CE%SS}NQ4KPgAgN0Jn**D(9NJh3DQsb$Iz?|fb#tC$&7vF 
z_Wb0M@Z4qRS2Fu?3vRb45_9xRQS=iP555*aCS)aL;%th`4FM@RMK?Iw!d_1qg)WH> zd*gtzCoU4AQowbCz=Vl>ckqNo@=Rdq+Mva)^S&h`~1G&W;NPwu<;rq`M@>*$A zp5}K3%YOi~?v{e-RxOgzc#Ix?+Pem{1*YxHQ8<|Ys|zr^8hC(g0Ob}MVBgN^`D`oHTi#6sp0Ije=vFp#=3fmGAC z;@d3sFSZ8Z4UrE&hoTzmV0~5ZTYYR^@W*bQu)1|Mc{>kjM16p}xVvuOExpF$`kI@9 zNzW8odf_I+jKTJ zAGkW2b*r`_c1!K$yDq8LYQ0fjg%E}aeKf2_C$k&%BtUmjCP{K*k#UtV~s+#dLJly4m^zHKg@&U=m`9j51UftNy{KX*2+ zWLZ>`q0p3*(dVHT0Z{%6pp05gj$iF8b44sv=(ATlscI-*_xi;D2SiMm^8w4CL&_$X zn^pq*YNJ3qiTLncqjP|&E>pl4$Yw7!ny&Kn+UO(|n#LDjsr@MBiCUyi0#py;D?cz~ z^lbz3;Td|W&UdXDJdkJm2J9S)x5%|TX`2s9WrY}=5a}%p?URPzr1V%;p#U|Pd)+Jj zXZG0z76@=yYZ{u@u?)UC&`R#h0UCVQoYC29nShJGYOI23@We9#rqLJg1{4OPBND1%P8;+vN zkQ=%L1Xi`xC?oMe7OW@5lu_&V&nb-qG6-m8H)KCWL@l@L69pjq`*9nT*5@Z<@uUDy0la}MFD3DVMNKH7hZyptiwaDVnCC{*&>~n z+t7y1_d<=vR!gqe-88)kM5T|J`fGm)6rZsit9N0K!s0+?!eQ;}v>J@NoBoxuEL83Z z)Z5g^dBu~?IeTh1uYdYl@8A`fPhC+lY;RvB@N^xhJ!fqh>*6PQi0i7o7sGBo-tL)P z9zD&>#lrcM)zfOFKtRNq|8h&<9}2L4!6fOXtKYm2;NQvK zT%Y%4t2wL4rK8+TZ1DXMz>-tyTCP6t?{dM%H5Ks?`YI;`zbP48&O=QB}}+ zlZxGP)$)tZ>7KA{G#D9pC}b69@tyjXouoT%X+j>@C{;}#efV914AmZ}zMqwNcp$<8 zIJf?k98QA=U7Q^nTe}d5#ROB>Z{(5Ry16Mbh|XuJh-i8l!YFclU5!Fp_sY6NvYZ4;E9*CZx- zerl@atPBx1r^jKPRJ|j~Jc5%hT*aAi(e$_9&KN%fuoJ5!_X*}v!xFqrDwL_ymCFKU zKU2W`9UB}(!N{($@>mJD6NZi?7OVqNqLE3}^5jX!@u%uN`5ClM;p4$P2*4~yjk%T* zBT=|2FdzRA?-w|L8h?8fwODB%?*_ zd?>OxJwf3>6+vIT$GMBP(r3-$b(O0$&f-Wh)A3%ihMoXlFhvzS+DYVeyfF9D@$Y@R ztrY65h^0|=d`0wYW9LaC{Bcb~-b#6iGsZAizW5l6ST?1l#x10p5q5ED+U83Cm|KYg zd=tb$2Hug%L|7!GH!51*;{+ni6pFYVmaAt78w2Gn(nmi$n8NTxjkT%>;3HjPC-GT6 z;JxwA-9DM)O1R)3Mq(#7;U&9d8Kn~GF9=`Bc|T?sMu2Epl^SIHCn&P&DiHSCj%BI| zB%&gF_DK&=xOYs%2la|Dms_1JkiOl`Ql}mpXPR=#F*LaMTt|0?jVb5n@Q;I^u&9q` zL(@vVxi-vGM2D1R%)qf6A0zx6fKi;)Z@Vb;)Z^YgxC-TJ$;=8IW)JNW&{jc#dH;#8 z^+;j(dWEBb#t3OY&dg^bdq7Ty6(7pMm*ui+-&(lv;2xSHy2K>GSstt*Q*h0tj3(50 z;)Kv3$6h3?o3z`2Y}xN6EUYktnR_Wbi^>|Dr=5%PCn4e`I6}~StskA;Q&BaDvHEAO zF4<|LE=LD8h@Vf11coz^MDLjMk8DD#L8@ImY!R9*=FoS%AcRdGlsX(_0@Z+u55+G; 
z3i+YF=*P1yL%9ULXri%!k`yOXY(ck6#!p3J52$NiCdhbi+1Qt~Z6~ZJQSo=M&&p0eYZIox|m8aa5O!aMuwB+KG8e~=E24sGV#kZpjRxer&hF?ccBy_y_ZvM zV<&=YOrQ2RgHeqUhNDKAoM(bfhgzubu3{Q~{L>9^$%qg%U+ahAY)5C$W^124P1O!@ z#ByoEhy}L4FP<%{tWnbR-^%GaKS5>fyxp)decVeiRU_9cmG*a8T(c5<4I^C#qZRxm zCYC4IrSb$N8kBYX*Xw{(o0%bGzOu(PoH~bxAC;a_!B+L_6!BF{Nf%Sy;&N#*qcl{> z4~J9C1+Z~LBgsjxQn@%VC-RIsjZxJRrra~-WgFbOtZm3WMTU;Mwfu4B6+1s@K(jTf zPre4pZpyvQ=VJki%`h+Ub4fA1bb!IjJ}hx=kXr0<6hG1LeQ{a!jkiaE@D^k0^wr&} zchEOfd)I$B;e-)pcV4$ErV{Jfes^yO01B>g$N}sh5x6!@Nq;Fx49vkhuFJPP5Z3Cpf7+N_XFxpkHSj%+^G@)I(X8L#T4iz0tv9_A|zYe-~#4`xeqJ z6(z}SmNO{w-l(TcoN+vV5Q}Z%TH!{ApuB>D?cf65^UV^>Z=D;{$CW>GuHfEuY4X6k}H`_-iV#`e7 z-%}>S&hbgtAEeXEzd34*#{j`9#!1FJ%SE+y-?{x}e-?K+eHG3F9m2;lbcP_Ig3Loq zNU3IFJ3X()jZ+e`a4BZNIu(2t9O7yT_FpX?~ zzaQW(1~;3~@nasT*Vrnn>Tq%2#jS1p;0hwx6DT`|yNdLu6$XmBEE)eT@Q)l$hRzFL zj*lB=V}ShuMx5@;GNlzn$9&JKjFT3GoftlwT72CCR#M=UL`^DZXNy-z8DmgWOvX?) zntMT2#WiN!8a7)v$86hiST@k1`Ips}27b3C000F)xLFbN^2n3B@3O5s}~b z45`*i7vb42MG8%9Fb^R*iYyWLIa%rpq-6>d_S*;QDD6xjv&l@3Q!}&|Y|%s!DG;~! 
zt{cmcY0}%67iKndfrd%M=v)IH%ZQ{2)<0eh+)J8x%Fp9Z2Hie!;z#xKT98%Q$9yy%#CzkM77o(M>9SUj5ma`tS4m z?Bj_-jq+-vk>L9qk6n70EoMM^^q6`X2{MI1EEF9(vTGs|q@mV4t?y}Js{`$k25|S> zGWN6;M97jD{H>lQT01N~b?h%1jpIQF**Tvj?$D&u&h0nkJea^ZV*P)R++K#*E;H#i z+ou%^>~AyXblx6Ys;?-`6XIoR6a%NeMQ9_Fgqu_-!NH+?I%R*I9ssfR;Y z1)#Oa^Jgu&6v(Ekt*)|w${-_G;8FD$8lARA7y?#>UGFgg=e$C$a&8s_SCR6>;T@m9 z+Bi7NI8tIpq=HQCJAT7;-5Ta14_LKbYzKY}-gFpUFhpE9zbae26aJDD3TM*{Ox{08(~Nws#r*b$D0R#$2SF)boAtpCWX}=|)dwV3zoB zYm+j+VZFe1hb-V(ta>8v`i|RYDYfqo80dtio00sbY1S%U~i00T;g(^stdTzP z=PIMb`z7Z~W?8*xH*w+pPNdGZY;_l`SKE~_g-yVfoXY^z^``aLo#Iq#qf}5U*O2^nqtp5+Y9wk|6BduJJf2=&2du3R{VTG$< z(Q;00piqtcJbB1+_I&9@`pYuxLqbHCgk+DI%g)f>O|ipl!pJB1>)QfzTtA#RW9f9a z*fj)y;A}!j$*Fvj@}&vtVY0Z|MGWEY(s~mwa1ZYg=uYz`R=K{`U^kY6Mj&15VA8m% ze4iGjVZ24j@_e?Eh5}a;UZtIHWaD&aPAZnL!w{CIUUlq#IPXpCj#AVqH>++?O1dMD z-8DK=xRspk86?k|X&Yzd14yR&4rwFzwO4#kW^HRj8tYi7*jKZ(A)XWbSIU%GOGP4D zjhXCL=%~8}n#7>@qa95_yQU&lV%zcuev zf*Mp}l;GR7CTo-8^{$Q+0mVF9Xi;CZ_#T&AO=_PzuvEv*qi*SUfdhZeZCu5G~FDT zdSiO(ms`7L?EkKy4}Q8rJ+0a<*ohYT6q)3ojNe%-XrDZ6j6&a&^90Y7+sN)57}Cw) za*mGavfRsOkQWo}>Z6Ml`%sRFf+N`pnU z^G&WTOgSfj$S-d4Kx49FUmfw1oT#}d4P*4>H-U<4F9Fc>?a1 z3eI!i0hxLhiFjRJP@KG05Q!Ki6`B?0Y#c1&DrNM6Eo022=1xw}L-~USvq1&e<~#KI zoM9U_o~ESX;+&H4{iJE!_C%}^C0M44)7^GE!j9O#d)_n0Kl`K^T!-1hJd$l_5*?eb zu?!k6Q1-=KNz5#miyRqAXCk%y;k?#<%D%KzO;4q3l}&q+n>AX&S9X8~wA#wlw8z-? 
z)T^f!i2fpqC7Qf&RQE@$(|S6T7Nl5J$RpW(G=@48BR8 zXo*|m+@33ScC)_RXh0P1Wy2IT;eSnQu`_euQ1>GBRl#g907RIueqeZ8hEDMfzPHe1 zmf8vvL`NoH*k#1iD|#1Mgl2L(yTlpUuv#SkP`kK0z0vsRE3x=Ek)^+D9m7r*&Ex&c zK`-eT)5Y>-OkOCAFAPSOkzF^Oqp+XOgyhJ&Y*-(_y&hs6Y$6fIvmC)y3E!yD!&Jz# zgl#aNG>It&4NAvt$v*1kWGlS&ZMDY&9OO zSeRHVGE`4e`V}?m>wEq)j6|=ebpmPGu>j!A6PX$ThbIMh%A}35Au%XClDt-`(YCg7@?C0WsOkZy^YjN{sW6 zn=<9(7o)NKg|aeMIa3!vZx+Ht_NZ(paDGebwcS%4tAYpAcY0?qzw|7aii)12FIlX`mEPR^ubqG{b72r@>f zXo)HCr!#np$Nf4S(Z66JQ>CdmR%v1$GIA8;rL0=7yCggD0efQ#{C$VJlHZuicNdLH?6F#&~kSkqjJh`Z*4q|jPD{!RD*0{r6d%4o)&&ytb0+1ZsU z^3>7H8s?E`bY}qG`|2BFhAks?r`@)5*YWoFZ7RrE(oN9uNN=f$qT+G=aPOc61p!%b ze~E<)YB9vDJM6Kbdx*+U%eomJ329J0>R)rL&PaTYs7{X6-}`VF^fbL}>XEC^_ih*m z+{A61#8=a!_=I+2>-MnmP$>P*uIjT%YVf|ca~KYBtt`wizw8n6I&|&vuHLXgH8f^e>cgx&%4SYbrC8w|sd)DZ(?7-n$KQ^~_KYxV_9u`= zMUrHNB)TQ7Wx@!Hr-h85=y@Ea9OoY(5u!c{jK@zH-q-j~H#7U2jlAErn+* zqktCL*=%mQ8`@1gVyi{3;6*yD)Cle$C z0yFbwI_l|OyJ?o=P5VhYrrC1KaE~#wzQKCEBgZ*eKk2EC2)o3At1aN0TP_r!qvyu4 zHkvx&>i!1pB=vZEz;{uMLsZRx0vgsb(G3>s4d}#YBBC6fl4B^BWS^E6rovGGqnyXD ze)@0gVxb+Qv+qPwAk`d(@js*_%Q2Ia7Wcq(pJ4Fhzfo^VPq6+Qu=U`v;Wz3hv93Q= z5oM8i`51VKzgD_@zEc+PH~nv)UpP^ORfpc)-Th*v@@)vMa1AtQ4sQDJLi}@GYQId% z%y{hsMgw!kETfL|NP@9_7tBf8;`{=~2fUgjnZGRGUFBQG1UQ4hjLL%3$0rv1rJIBR z=6S;!tw{WJ1*`Zf@CrwkA4!82O3u%Y7 z8`3xiw#ggFJV~SO4(GXGefzKtM0sy|mlIMwM1$oJXm(Hb;@r^&!n#aeO$y6xR$rL= zsEKoG%Y_gDY_Yt%Of81W05AGPa&vbyBYbqU)M(anFZ@W@>hT4dm{aBq9DS2CTju32 zftJ*G+%E*UoLE}4GKPN;NQIbzN|H+C+C91UH%3Lfiv>jF#2Edk zEULMh+o%@IdYw(qo|H_H5Iwp^-T28&=Mbw3&2(mhJhNyWx~=!_cH$*o5<|)t&!okJ zNU!(A)oiDu`DVs83J=>(X(80UF;hxv*#ZmrdQ+>L8ZJEq!3wp@gHI<RD#hEs$B zb=gmTzD1j3f7|+tn8L$T1dWd4;0@HAni_|vtghAJX)-G30L)u!-+lVX0Nkdnd}wDX zM&>W2!B-e(9GwPvmcpOq91AHg$yzI|%jea~xg@=Y2})uiQwxAnr3-s=_X8_=Kr;=A zD~kj)GeW$FiSqGOj`gG+zop+=*r$4DN9mReMuN%a>y9cO*~b4A0T!OaWV+O;S@f`X zC#kaZaF9xWT8unW&1K(v3)=qQqO*KLXa#LvBj=Y{@!kbs}wu^j3Ua>U1AfEcDn9{?KzJWB)$0eYWU2@G$R`!vGQ- zWfHx6I~`m>eWi>A`KdCHT{OFjj5L`INlF!qnPR>Ob*HA4kpnkYVfs=WCfyplhF2b% 
z*4jE%hy;`uZJ+KNx1cmSxq(*}*w|N|Wc~1A*PG2lVWrgW)@+>5xC!98|$^iXtBM-3|oAX9a zX_kGTL4~)rjfryF+DFTd=5-ZbbgE1*xG3GjSmC7St6eu(daLzSg4^!MXipXJ(>nqB1zrzvs#35#Z;Gljy1^>=OJ ziG=IjtFZ!%fNbE-nY~FE&y*`Z`u%;UG@QUqUAME{T~t-y<#s;5x1jzk-Lq8=x!QI@ zdfsVjA%)0DWosOm4xGluC5rZDg&DWn5AVNr`-p+|6Cg^{iy>~#&+V-0o?@Lx*sK_cn3`09>j{N z2?CTPJ)n%axJB%62_ckSK4UTtPtg7&blC;F{R|R`8AKBlY&x&mob+0)@~;dmAJck# zOZVsLxwd_CuWo_z(2h^rj>9*-Pn~}oMY@7o-v>*)9{y5d#W^+TxgIn>c;daIZ{1&@ zq1gK_tv+83I0pE`sU{NaKErG<0eTq$&!ztnEf>GvS2P_TWJ<>w#|hR<9X4PjW#VW#62kuk&}VwnW+dW=pVi zGFAWD388YHLG_})b>v7jfzg~}OZ0~y@{(J007z^H+hq-OhuB*7Z#2XQ(obheoHV)0 z{o*Y`LT^?zOBI~bDC=A&(d>ZGTmZyzkJWnTJrrM9P&|i@d{A80& zShn7_ea9f0P%e%4p2Fvmr-Q2oUzoIYJB`Yx^j5Wnm6_qn?%Bg!eZ<1s;MaEeI2W}Yzs{V^1D|?c1?T_ z8FR`Rp1OrQHc2~jfKPJlKZ;^HO6cW^IIlu`KlM4nJUC-`w^zQI!aY-&>DD#r4emD# zO0!_FGi%`FmCwVC{BJLSAXLqJ$MI!VR(#6?Pn|^cX z^wzpHUJqWZ7FC_i+rHW8XspS`@dV#ZWZ)H&O}%3mz1lM6hK&LbQqHW_n0L8nn!*rO z0~w-&BWoLSW#;s5=G0^M{7%}( zaCtUzEH3}!pI+F94;YWkFrPG<(*_+|E=e)it!?(V=G%rg8)l_G@aQXftL0`XELg7J zc{&HEcGz{(^>Zas@AV@Wasy!wxN*%&tz&`GyJmt^2lR3&+2NSU6mJd1s=Mzm6lKxk zW*P1@{Iw(YSjvHNEt^$FvCO+zUgOHuopnye9WJpH6ds4TsYdc@k=rPb`^3V0XwvDN zay$rlP#RC@k$Z8W{ijkAXXLSm?~%K2GehflTpebn%R*C6fmw&vdf#b>-!%@W0ZS>DUNKE3xg55fh*%QU43%## z6=iRpgx<=_^IAA>C<`sg1GWt~dNG`5sRR0J--WvU(<1ajUSw7u{2iO)S)^R`;Qv$u zu0>$F6g8nByB#t`6&($wk^UovK`v*BGR~mX<=sj~)SVNwA9ni{)=-DldzpHFsYjHO zq3K`#asF+GE8x!d;gRh5K*>H}QmJ(>Ez4n)=xtvK9YgR9(Q?ox_cPRk==@H++GVeju!hXHBC%`z+}P9)PKJ~} z3c5GP3>tdjhm(2XqiwyTlluHI7JLW|cfK8~SBkaL-)fE_dnOY(x+i&;z9kO*7rYJ$ zD5}gEuROieCQ;aUs~;sDK2Em%Xl(1(+~_#v{mA=N*L#{uL5TK0QQ^D3q(NzAIN=5l z#d?@`|d(1+MCgb2r-Mdvd?-Gq}0mce=cd(GkT4D3DXuwGMty zrDEpMC;nYJ^t=2-huAtK-bcX|jUn5cL4&EUvyxvX2i}5542AI*TBa}X@o5unet44G z=fZdEZ1M~AwfOMX<+)Ut{VeC|co?`pYG!`Z6^4quG<*J9{UXGEgKkbJ@H0OhLTX!BfosRAvPXxc;2hAcKPYr9fW!5mjloBr*)Q5Q=hrtf_Vgug4pQf4mv%c+Z41P4_baAcIttYvZq z;fe$08hu1|$Nj5@ZY^h$ztKGi+o5JFD^Us05HKI>>R?!Cb1CaH0PWr5vuxhSI}pV1FVA?Q?E`Fp%#r|YzxYd4F1`LspJM2!AO 
z0VK*o>xH=#2X?yBd2YxIKr!GOZV;k3h-U~0E)XvuAk>WzTm+=fk7QY`X2X=sw2u%-XDOYpY)hnST zx3}!)nQ-7f*G|}NkKY?7^Sia^%~m_Py_gc*yFFo7=0=+?-!G<`HKnGg85` zECgZmU5!oHFKlxnVz-s{hikD%ry9yqDjgz)ucTp{v{yW{O=9aEevos2XNarMq==}o+$z*7*rb$yAmz4TE!0b z1dB0itLf-PZvQNKyUSKyKH|tbGv}rI@oP>1g_9qZeBj7P&{m{BohZ1kuue=!aXcGDN?Hu=eBy&qK7P zSZQhUp)$7Pi}wk09$viH7aUe;l_-;Ni6Q$m^v~^N)$U@4`IwC{qzYP}eTp%YWBRCgFtgW#u#qC;`jQqS>U;6ok3IQ z%6l*<4w@>r!6kC>HJDwIg$>Gb3I4cbrZLDsUg~_(ASnqWZ`tjUciw}@79?QJxrkZfK0BoLFjRXlna$Upv`X zj?XnP@ND!wKc5~VlkR!dM3rf=vu@Sf$L@U<#JSzn=gX=qGAqhc`^>c_wW`>AGBZ@A z&9qZ|1xL_*sH!}yFi9#!otoOFdh-3{+V;0iENLej)BBLhr4N26qpCx*jW~-@(p1i< zkvp5q#{N~@rbieyH!_u%mdZuVN+f3 zF6uYp0tZ(dTO@s&3JfE`btHV4nCyzRHT|D8HCyh>FP6{p-zF7rNp#_C%!1}#(ms&4 z6o4yV3tIo`X4q!hf{qBZ){*Nv^16X`2A_XGn-;9h<>0d3@%WUwQDK+g9x=HQW#1je zAN{3noBe%r>mL3^(sIwM8_Ca}8F`74jJW924FdR~$+OE}L88mJ;ccHkCArKTG?>tt ze6jnHXGY$~D~f;UhU(o^TX&RGJw^LM*GqD<#MbWX%x21(`C$4@7Ijcw@>hQQzv#6@ zkZfCP6~nCB_nG&Mod@&1np!K#!LunM?#>4K`cEthEVvVZDxY%D9hHPkhunS-=bY2C zxaRfDS_RQLHA@FM8^7yFbeh#Rh0i0qCpNY-cYg;Fc(5%duP-zD5$rE%UB(Y}d~!t* zEH3SXcZ|Ffr!nT}Gy)f(D{PP$2Q8<@xEICP6@kWrpUw4x$%kIR5RyfmP;woRiqL5K zO9d1fr+8I;GNIl#rNJ;z{$-@v)((D#{qv1Wq?c^S90Kg0xpYb1<&*>lZElM;s{Ez! 
z<@3%{IS);x>Z8hpLw)E=lLXj>-V72nm%KCy<{RwBo1asc;56Ut$ih!iqAW~Hng@C3 zk-priw0k@C*6qj1KFS+c?8b4~0`K2XZ!Sy#9+;#wQs*kAh?nr)ID-B5Y=JvYq82%+ zHH{~C+3*{&pB~r(5?xrdk@*=PwAW@nG~sO8^NN}%oQkG>Ow5`Sis#9?Nmo5@bYrSO z^AJp8sG@m;gUPTs)i(S^McFW6( zABJIZT4@~XYr1xq zlDI?_`T!c&FJ)6xa)x!gTaQoH{p|i(!n3sW>m-&?m2!fY@vJ)el{yj!v$Y~WdQTO& zAQditnMd8#vnIn4pP1fMHxbwC!kT%Hao>{F!rvz9mcJlyOv_7hcuujkOxvL}{*$jd z{*+7Bo+?dOjd8QhtYc}UXCqx_q1{!|nQR|QZX#kWcCj}dN`(AQV&~*3=t1Uh=q2qV z-}M(iyB|*;x=_M)qNo#~%!Yl!`=muD}R_e^4jl+Rr|8<9ZNz*~?~PhwR`#v=!m zXiGHzy{Tm_GYbeYGg<9EO3MT6-z|!0)&(*2f>WdlY8=F7DfB ztqH#>iM9;~rl6;;uS@NTxr@yNBbf}-%_gtw$}Q}TSaZJq%#@Yr_2h^fj3C55-B;kF zl|Z8rqI%wX*|0Wi*PeUN3Av&iOoQ?pO1yeiaTG;;L#5-intg?6zH$O;PCSreV+Dr1 zBQQkKmUh+7H?7RhNH(_p`UEpgcf7&1a@S=cUQr&CSK5p^%o#g?xJA321x4_#Ytt|7~(e1>4`V)nac= zZLGJOSiLZ~JTR)5&8E_p*a%exLC}{9z~?E}%MtZI?keaFiR`*RX`#H<<;p8ER{UNF z`K}ko7`79w*+RcPAk6WaMeoKd@jH2W@C!GbCwYIDjnHe+{!nCE6U2FM#IlSblW)A? zLDV{^@DqG;Sz0|Me!}=Q?OpJjFw?H@JV~eAf48H|{I(NyPWPsgXBYN4>D%#FY;#`d z(RS!y7?qR;9S_xXF7$o99nghIO-ho@VBfh6k{UB!fqz#_brb{e^!wf5dc#Xv&4o%o zKyb?7vpNyS@-%vx0OxmI0~_j~xV#&E2$243tJLtq(C}QsD{flBJE%h}m<4|9s;EV6c~BdF5GtfOb(E;W zRaaGF7;H@xj7ZQZW4MSL?=En3DlkB;fMMcgn3lLLjS$TCH}2a*?E-J=G@76N9=F9`d3+d0-Loh*E&A6 z$oZ!p<=xjuhT3u*tQ~i7y;3wz2abBNf`7*d91x_tM;7aTkUN=k;|pTPoQmU}GIop1g zLSKt0NX`Ov%%I&}0Y*1fMs;q6&~C?#hG~Y8i4=~#OS}v_!OF=YWT{b1JW{=-3*hQ5#Qi98FkddMN^|;JRC-t8+L>EQM^DzZVX;`3II) zxEK?u(s2WN!0$L!1g}sR13Y@E;U?$Pft^t;PhhU ztDqFN%~%wM7AE^E&R6=R$6L?R@|e)^!KP6!Wy%(ZkD`;udqpSD-WFNI^=>$L(j3nD z$gGqq>q$=2hNail*b+G&Q&rWYN-S?PmX0@5{h2(wYabJ85679g2OqAKDJ~C-F6?N$ zH-A#k|CI*aVSDSTkJI^*os>u8NdVUgQJfDNF0Iv`bdaN!&1C^%F#`9?{RF7A;fL!C zP8dGqM(;u7@xMmBi9;rSw>1(f*DK~Q3em)S*cNk`;b6EJ^l76tkWm2g3e*VL&FJp= z@Zovc;&vI37t;5%YQwd(^J58b!{*RvtQyC!Aks3e)Y8<{l=i9~T`Y=~oSkjR|1IAW zr}0p{lMAVbFJ7Rm{*Dhk4-J9>8i`BoT4Nj9+*D_GHB853)48{{e7(2{itk7^vq3q+ z0DFG<85*BUQ08gJh#TpXr!`$wp;c$2nq6RG!SD*xfY-ok{$f+j>!FZ2D9Pz-=Qos9 zImXx8r@`UcAsxa`^Ys~iG$YF!C31-fmP`hU$1>E_J~ZnH4Qhy7?tgq!{nK>oe4vfl 
zS7w*y>0?%qgX61RX}@^7A+zFp)F46_-0|#1=mU|1RxLbZGT6j~;)XZw=rZDgl8^0G zJoEUC=UZ3pb8Cszrr!~e!L=#=-Q!yvnxYF47HrR-i-VveO7O?GG&o3_PmXW}|NfAP z?tOu7a}rge^dn7r`y{HUU_#?g+#l9U-nB$I%Wd9LCq8!fE`QkaEIfxs8%tB9D!f&} z;}_0MhGM>yb2P7Ph1I9jI+n6+x4)cfqw3|??DOi^oDx$!9O9SOj`6R!_r`=uc)}LJ zc6R8E4-&kc+bihDfiQ$r0PZKwHAZ?NW zgl=s>%tj-FZ|TT;cVg1KW#)1boQeWM#Vw@JNzn3sj~97}Vr%AGe~0EBm%rmwsii7J zO%5}ca9)*v2HbiZq!U{I%wDvpJ*@guc2qNNE-r}zydJWPiRd{(Y)pRaHN1i$j^pl% z>%`SJH}uZ2oB2m6U~M)oSec8C6#F%M{evntE<|77Av{r=E4zK89R+*;CJ6D!AhV6T zRH*AGSlCo4^i_S>!k8ta>9Zt{_4nkD&et}+wQo)jf{BT977R^1Ch{-KH$C-?YZrG- z=!R~Z?#e667D*>qQrtwrs_z$M~t%22nkoLxdth$z|%a2lCmO z+oDdVobjAh^^o-`FFPsq*l;y!iXv)oFJK~s_xFRsyHa|mmy?j=>Eg#dm{$SeWgOoF5F|+@RFWL*7(9 z$IGIN_T5TGR1L~~(8l9Z*imyLo#2)2vBI}{s8X1CWla7s$9sg{SacCp84`tvsF~5s z5Mz(-+k9B#)s8G03g7SJKjN{E$&zspj4_?y73cL=H4jsn9b;UZ_V=sDJ2L5sw@ywH zk-nyJzzv9t=&SGY)o&;9k{#YV$7Ousu21FJk#y;UmI0Ir&(ZlsMAlHZ^n%ZeGA%0} z_C#EECcP4xNjcbC1(bwQ0kO9;F#c%m_%6FDnJ<%(s{g+4!syneckzzk@wQA`&@MRG z%42*q%?C5hLv%pk5S{<>&cXHod2^`&GZpB0=O^Aw@xr0HyegLsi(Az2+k2tL^R~;7 zG5#@OJ4j-9)A~}iw0Lqib86fYj=yRRdO_QxR zwc{JTVrb(PN=2_D^ZT1RE;1FeehuPDppkZEgJ9y|LkgqJZ;Wy3azi~jlEHFT6>*=w z8I_9Mp0-#4;A3SglRKe#_7or4u5A8$FB1;zL0v(gp4Y5zZq(mCcp~0s3S?jrwnktd zihoiz!zh)(K|3llu=T0ZuEO_gCReBHOoa;#Rcv-nbZmU4buEdOZCDIH%_L9~lyExU zuEC3&r>idf^iZedJfX63husga3~3r(B^1H~YQ|lvgx3k~bSO0}*|{7yKLnUgPl_T) zuO^5Qvv2(Q1Qt#Q*Z=~rgK}Y{9I#=B<2zyz;>Dx8l1?D}@1&rlF%+Vq)zr~in>z!R zEl+TSEIhFVwbv~Lk$K~&rH-+z=f$($*oe)AVPXNmZvBj({Eh% z>o-6nDvswK?(a}7cF6=WZtA8{Ph{=J^~zlwWGsWasjG((y>7==a50{YpqQ^YT2X2& zxVId`eWNMFvF(>+%J7s{6S5jCA;W^k#PObacEPBqZlW~dAH%Q|yA)_4{2j3+#a|W1 z7_d>P>a%;6qQY5Bg5MO3(a%ODoGAEk;13e-U~_yPJ7P=MoNkJO3{Qar1#li*UFOQll(b2M zz8p37^h82D&w279YjlO3gFRz@;{}?biK-EVbPN_zoO%&+&sp^#KI7)U+U$eom{e?sFE~xl5}+*G6jd) znk+lglsXD@w+xup<|13OY9=%C8EX0%wAI_D@C62W{wi~sm?qS=JFDF4ycPh4DLj$? 
zlK?|{^qF9SEqCoB;6}t)_~d9<%WClPB6Q~vq2w`n=|$dLfcD6SjX0UL^=eR!B)FQ_ zYXb)ed&w=xD`$a&K9En*r67?VV~lYBzgmEeut<0|?$G#tX4f8|mt#p47w3abQ_$*ejSfv)Bp1gE?2%r%NTE zyE6C$K?v&aRe27Xs4oVMkf;S~&M%AijW33~bzUZHOTu^XXR7ED0Z!peO8 z04@>}whw%)5xHxpzSk|P8g$thJ?f}_Kp&`IO72FH`i~Po2tY8TmR)eA(Eb-=|MSXo zE$3IyT2g^y_utlZ!!XiXEw_Q1PiD~kp^15@qEOYWd+}AcF{KMS2yH67nU(c`Z z5am&ByThE-R)(hCUzy{z%J$94wdqCp{J*6eZNx^RxR>1s(D=#67ewNqG{ST!5BQ^d zJKS>B|Lq+}tq`!Fh<6oo+2^;D8OK#LpFQ{>iOdc#uK7}KrLPM9aA^h6T~|7FSsj)T zo~Xw?DL%zl#Z(@gifZ<-OTlqS4Y#z;A5R6unrO#A>JGZcYAGq$Iev3iUF3SI*NDWV zluR~r0F1}Pz-hX~o~pM|LQ;7Sn1WvfsR_kDsYHh1dm3UP_DR$TQ$iJss%|e1rQGd0 z=S5!{s)oP|HmlLKu_h+=q59hOo;S=`-2O2|ZBT(CkuWw!sxMmf%}ss$8Fs#SNU~v- z@^3GDdqdc_eSDx0d?`cge1`9;VviacLdV&R`{*pGJBKv>hV_1`Pg%~ni$%NGpOy2) zOwjHygO-M4;G9K81(%L`L~Jwk{za`BD#G+QmF`w8f+m~XvK3T(;;yXuFwQ_|wTP6m z*@6bV673*?mhkit_2?9Sb8Uvo#n!NyCi=Rf|Fg+qr(W}_6L-y{(fdW%*jI;t#_TuiT<#tLA)oDR+TqL3yAhhG#i1#^d&cH5JdEMuac(Yuu zJy)?92gA5($7Du`frB(BCl4Mr&1_&%oHoVqH%NTv=uh1cb#VPqpwu>7E0(_U`X6N$ zM#bV?#_j7=^EkD?c>|}(wf@%vG={vS2a>5AnT-3npgT^GS0Vg-$8+%cq|S9|Iz#wi z{Sw7pT-tRj(4FwOy#&q*!Nz$r*XzF@e;m-e@tmE`1Csre)W5Ye3{`Q8bGiM~qVyw| zJqrJre`Gims!IiiWDXwUfoY-R>K{H*e=$9-=a}qsF!-A3X{9d2sb-xHQ$$PPB6P}9 zldLMIL7-$25|)^MH4*Aty|Mfx^`E=awRHxlc#>Rgzd)jLGorUouw}>XNwub!SpT zmu?Nx%T=L3a=n%NOa`Q<1;aU61wM)gw<8{-S~*0sFb7pkJ1ts?u2&hrF*@5qvO2qa z9RNV&BNVXJo|eJK1Rb}=WyQ1hY)YptKY2fPKu`=cd=DC6H+0Vq?b=Xa4sy`!`|e9= z-N{-T?aJt&XP%P(?c}rJJE8>}jvxh<&8I6`S=MJt@`CaE1LM?JQ$xJO%~!72l8>eZ zq=M*WjNIx8PEK}#*$o;>g7GPm)vB2oZtmYyUGU0~PgL8oK9=|=!_v!LJs80$(S7L&eI8;7^i!S70!j6t#k}kfI54yLO zlLY}WFyOTAHFZT)E6s&A*TX?qgdnf+HRjC~IBa6v^!0FS0AlGv-!e$uazh>%imNQ76oe6=QhvCjpfiexji8O%JW;il+3L) zqD*Gqct<%J^l9SOucV;lK<<;4jkNjV-BEKaTAAA@gz+3q0G#VgK(z!GwWFB!>z zUJl=ThN6PQM?o;u7V7++jtbu=&Z86OSdFp!;oIU93(aR2B3Zyn88uWK#i8t$N= z=3j82`Z^-z-3T?LJzHTvIpPD$cnXxv5!5uY^(x*6b=*71!)XTY*!3fGb~&cp(iaptr8oe2FakKa?pJ>97n@j zhT$U)HDwJ4Nae`bodq*ESD-;r#}OVYPJTP!|_6>fI zFY8N30*krd;R|R>9cG=Sqa@09qjY`4=n3d2S}vAuPoSw0g&Pma#)`l-5tfa;fRkV| 
z>yx7|qsLehU|a>E0P#IEprZ&&X+--EeM&@5cW%ZiSL4qEivsJjA4dI*GSs_snE?K2 zCyP4Fgp{+q_P8f2qvJmrT4Ln@*)AY&^5OyGw1A}QT?U-L+%3nF@bp9=Taken2cN-^ zH^0~;wTSOwP;@ z`Axr*EP&tx32)6@r4n@*J9L>@G+a;CWRm$^zhW$_Ijp6B45$(~^m!a+^iRcL0=lB$ z=PeB$b2_S3uVwHlL{F4QOR*$@ae(PzQe77xC1trU86T?JMEAvjjj+IjMsqQNr(56A zMxZ8!nFzh@x=sgq6eYvNNMv^So0GCq2~za3{47y>2#!C~D^8%(7^Vt{%&pmb8MN-b z!zrZLd+OpaUB@Z>T08e*8Fe>aN3+}iA0<)AtkjekuQ{ptyfhvunR9+<#17<&*N+*J zGPVB?OS$vAvm**jKA?)sISS7va7D{a3Ln&>Ixjc{>hZfX#tDuRmIBSsk5Z@4)3;y# zK3wGBH2vq_*Qy2_rGR-O|9s|W&F*YcfEW+FmXzyt;3VX9jun>1FY2Ec1avBXMo#%h z(FyaI#Wo7xBttG6**A%c8OQ+yy-Vw2j2uGcc17d0N;^Cagknj>-xVGIlkt-5D;(x; z3U54jDI~fnV7S8k+PROP-PG#>1pT;X^jdl#TW(K6(VCsfQDm9FOw`iR@^p<-I#0!2 zEYKYHk2)Eh=aGPB$Z(N&ukxlxG~N$0*tlaU^L^s(h7IjQZO=>vxyr-xvt$Bdw4cT2 z5j_4%K4{cLQ9ON%2~jql3!0m-l@WfXCMadR316R z_yOpQqI8~zRKby!%CQ6A;;JR;PbVMMWxD9U;(zmr{3rOYu^Ii z&rJLj6jQS+a^1;&CFsE~QXMp%SZ4ap%mbIe=^r1uZFk04(z4=gx4*^s&ckC2>1C16 zP>oG{G6=#`C}uX$|Fxe#vcs>B$$8O%STIF#8h%NwDWEA3{(PEyoG~upvD3Yd)_n8- zh&Wsw+g5d{(R3TKsWNQ|EcFEdYPyGD`7$ygv9Qk8;nK|41FsLSp^Oy%|kuhFLdr?thFT3 zz24-c{i<|I#QGTkssZ3+eNg`ZaTH8pMLLrK9a`{brO0nH56>RfSQ%q&ITb(uKgGtH zwE3O{~3s%JWg)Hg59RoHTX072UnBKC;K4a z`z5gRSwWC!w8%b9ufK+dhTX{;I_O;ndXyn=2uF|Ff11oXXSccU8-jf(_}kt#)0}}c z6xi+|vaJ{F`bRXA?d*QFJWU2|BP3LoV;}l|{+=2zE1|l^kpzjw-uxg&S+n+bNJ(J* zVQs;-X3!YfOTp{c{}gE>2G$%N&7`!{MfdTffEOfeKhU8Oo0ucRlg&sBQeM&mwj#=pR?D_ zK2A_2REVu^Q+w}BF9Xz_)+6T*CZ|eB6Dev){$n%yoSIbi;%7my%F`G*J;aX2;D>|* zE6MEc?Ch@!9J>dtR?dE0f(ZJAgpsX(8kP0=pz$zOT$L~dbaWr^J`ojyYVgjP!gUSp zp!V{B#gAZg7Z~67{eR$H>TojF4TsYdfH*AplWSK12Y#!f|KSh{OxZ0@W6>TbsWksJ zy855>K6gWmVS3(D`sW96h4L+{NhSRP=AbO>z@B;+*i3)qWg7FmTnx?(7haj|m*9y@ zA0>Pv!}LfLsgU!Wt5Dtii2WAmXb@E$2bvgSLdE~v{^+$gUrbSwzd6VM;TNT-$2n>N z>njKp@UjUxs|oL6xD2o;Kn~<$&UAt)ED*BsgksYZmH&*4QYH$hxn2c2jcxa)hVOR5 zo(4Xg#n_}Y<<(>7bJyOjvn@dJ@pe!29B@TF5xIANU?YL%>|$4IBs+HciT`P`V%)e-3(E1TI({ zF?@B}13*EVYHNM(L{U-EN=K5lsUSTPFm>eLAEQ`%Z+$F5Nb3`NOFldNBtL6fDgw}z zMUUDSO;y&z0VpD>Vk$qCdfz*qf9@1-gd(l^+_q-Omj#=DFCJo(wF}t=Fz!6g 
z&;>Tq(Q$Jlh~v3O2OhtB(K5&j4C*+UDf6$MhgnQZsT$M>7#9GEV@qcIe<*pqRJSV@ zY7kCUpoJ(0q>aN-`LUw|*b6n1t-^HOqd`r~TAT4_VEs?aN0{M3km^8KNnkjvFoMb& zv?Z~&gT(1|>co%~O@@`f_VnGjy2CbY(H3AL2x0ZXtkGIlZ^i1j2(w_;B}b`8R@1Dm z4pmaOZokd#)nL8902FzUn|%1r4p1W}5XQK@8sUTewUMT-Zi<9j8(ZzGDq#NMMaXKo_QFD7*#%#wwj zMv6ay3P5h?XW-Ev)+VpV)=ug)8rRK1(2*gYmu%%%)3y&1U_`?wg-^Yj@5BG|-J1L- zUC%wL+(fUzXpjX%VF$&0Z`ekkS;MAh91kTX=+`8w6=W*+Jry0h^;@zqv>~l*9p+#ETxEzay$o=PXnQgyqvMRoJuR37 z(c|5X@9Npv${O86QGk7el)o2kjEHLuBlFF=7Baz&HQk>_%4SL?^z{i^% z0B#c}h6GC9aeHT3wii{;bD0jc7%q{hJpO4!hpm*j=*e)wsh}Hme)swoid!?E{}A*= zB@jS$Ho;DEfQzVOp`J}RJpk44W! zKIOeE#{8r*7$QH^J2r5A_+_3!qi*uHruhG_)@)DOugI5Eahr_7VWxku51M7Zixa zgwdD8XbUP#Wul(NHEw>gwEP+SI}HsJ)0dMoO0@szpZ01mUmbTI4LCO<%|o*9-MRr{ z`x(5mD2DZrZFQ&Nin+dCwRiJdP$6toutMlp&VN5L1kGEcBC^6!amBnJaRBCo`VKW{ z7xK_k-C%^Vyw7i*paWV`(pYfAi@=SS(#>LUdi01ZvD!8lZ1@U83F-9zyr`dLD!t56 z>ZNYLc;)yB3abr3{SjUN2Pq0b2VnRuY`qgH{H{+AA1Sy@I;O59B0?!X9Q`k-D>GA{ zR6h>$g1I|Ea2gPRvh*f~{P+o|!k4E@?h&C={ilHYJW4MR)vPk#L)-jc;*EJ8Lfi=5g@SBNRBgDvVcEK9stz}kApMStv`u@2A;}ku?hT7EqMLmD?zwT)Q?dHI9iD2CKEeAvgeu(bjYG@w>j^;k`i~nD4yxr z*>NPx@#^BAf|QZgHF7Lm7dtQ24C^^~JZ%Z*C4Nr&h*7wp6Y7EquZtXV+cuLD8!q}s z&Bfy~2F^mjzky@{U+0J3`kuSzxu7%TlN_8 zmRv2}9wqFGi7Yek03+Lc{_}9GK!FRu?s-MjL)f6$W4w9Im>W3|<{*73dI8^{o2v~m zw146~*|@{5!Did?N;abD9lzVzbDiVX%lFYQA(zpjyn^II`HVgP^9LWq!FFw-lK|qz zl;be~L+39kslYK0c6ScOjL{#M(*q!qiH@(n(_R#7zI#&Y9Av~UPONMBMVn`8cM$y5 zS!1v9av__Q70m}d#W1Sx8u8`{P3_wR`ceB+n21v9mWas#qHbEON#J_Uq3})TqQ`Qk zS3r{YU)C;89R@R>D(ozqQpf2-x4mu&t2vV9W=|K9NUz2`w6bVS5a^xN&zP9)TH;M} zm8%rOho6q`#9_-l&tm;&5@@IWmr?Y*c6mI{x&wa{qJlu6b2Sx}^s+K}>+foQ9U*j5lh#5yAA8tO$eHET!tY7s~6`8JNWEL#Lc#xj`o< z?7ppEl!50%y2Xis6(#9Nu*_TkT)QFqHQE$P)uA_g!JER7U3JRkK6ihr=@r27KQGhR z9>(aD`iASAELKnMfY(>y%uH)fK_I-Mj1}5`*E6w1zK2{}RbFYqnwQP5EuW%vYeeX2 zvL<*k6ruBNHsUS}3mrC6rajG=>Ouy-In2h!ruysEud);S#*>-e8_#VUaPCj(8G5q> z;Zy_by1Q?`JzwtRDAL6Ba(b1|vAGBI@rGVA`ol^`q8OS@4^9X3EDJJ&e0cNTB|{za zOO=?kkpN<1f`Tv*O?!NeS3Q^*D3pB9O4aL}q4#u?^mV+Fxi6cKcx7^>?d5;IASTW~ 
zIu>AMq(Y{n2edRO4$Cj7p)yf87BD@=pA0L5TJf-jJbVF;O@X{opAd3@fhE*L#=V_g9Mm zi%QjYxGk)+Hxst=!ag!9>4f?kEbb18>1BWm*O^XJ%bhRQD&-rhcE`5FG&!R^lF!D?i0lQnEG6%LZhFN>7TE{SAc&ZLvVUH8OF<4=< zqS&DTw&G(J-p8XJ2d>qD_ekFKfZ5K0NnMrtZ8z+`>gwOh-bsXWW_$#+7Hv?gASw#q z^Jw_i?ZV$gjf@%l?Wjkh_D!cgIy;V&dW7E9z*FsaUkeD}H_ zc#?Ui!iZRzTZ2&u9z*R<8eHCO-j&DTT`yQN(6kHP8)oCaaX-Q{h1-DlU z@t6j2NoWmQNaUDsTm%4VEyjd|gshyLqd{UCTkRUDlXXt|;Q^e{XN{KEqR69EB~=f! zWC8i*9k{V)WmyxzZAqm?3DSj-GP{HJ__jd(xqxOfqKtbbxqY`e?^u%#u(6J>!z=!7 zm%h#w=HoqyIWXGoEx-a6@s)}2zw8tqn?;GnjfssksIzOEJ$T}(LFzA@+!SSG@_DW3 z|KSw7MNv<0FIYu|gKfKd5jI|6(~zN%1aEvWBgClwDa(rC=6F*?OxP4NWlo+O@2^8| z)>BCUko~l)UQ~IR=Q&+A;UwhZ56v5_1%Y;9}~3{%m8Lg;MsTg z^(dpz0Kh-g1;(x})GU>t_B{Cp)7z<8_)KG#l7;cvbN%>dn#*Z>_(STD4|!>Pz#}vI zR-wG9U()w@XVb}L5@PgDT!hKEO!J@=b!JE zv?OYFc9EiYS4fDv-WA)?qO9{M3^}>UH0Q~62R?@4Pk%=Nnmwa9VjUBz=D(Gal}r{a z%w9f{K9-{}n|IK>*)psp{1EruVS~`KFhrhc=n3c@(5jfmc6NYzD7n*KT_rQ}8Nh1X zj@noB)4*a64BMalp&xJyTu+I}YGHPZfawO-}h*F+O_^9M$2MS?t9M><+#8@0L?p^VqyT#Z_Y8X)SuMbYXco* zD((fkv%;OXE+P6?61V_}E&!h62`mwUIO6av>6zNv0r@<~tH~Jq~MpVKH zqk=+8N3CnGB5(0ES@BH)t@UJ>=QP_i-EiI;l6jAcI|>zX`+${k_;yX2{p!sLwIxjR z`de9&;dqV?U;!va85t7IudY8YJ{+ZNa3&M)cM{17!U3;Vz#kj%!hXPszzx;+;xnC< z#^~G}5j&6R(#!MxM&FUqQM!w*Y=$R5=yBbM{3xDZZ^|a%85v*YYK->lDsR?C!@0d$ z8>DwP$q6ws<76)~eC|GO&=-HTB#Hy#2!-06D~=8gXuV-F(ZE{M|ODgDVcz^Ou(T&>>%Y zF-2O&sP`$<#KYLo&@`|KiQ8rA%R09eYxuER5`k_PgDz>p_$^T11FA0N%?k?pVv3kU zVep4)-{~*l-W+!x5@MmWc~qxiNG*fg#U+u*D6z=O2Aq@s-b;+I)^;+=yk z6N`J4d(|7F5={%(Nra$VdEXGI1s0Rm`iI+Zs9c4qTpLo^g&Oc4{ZOdx_?KXMWLcz} zlik7d^J=~P!opW0opLW^)0$bdVQ#Gzoe#3_x}~2#B7@?HXVixex1ij+bH z4xIx#Q|ZxwOr4enI=2FCXq!{+&daLD8;~0X0B}e^#)CX>u1lNHuFQ)IwuEniDFVIy6)J=0kQipegSj z!!&M4`WHEWR#qQvA9gnN!l8_I%nH+Ei6UL%H`+ZT%I?p$+#B-mqxRK*o4RONFcjSN4U_SlC#TZi$?p^m5{o zg9F_aQg{}m1;HcSGRp*;`j$A2b9}oph_aU_i-t{C`wEqo;~Ccek8zYY0K_~NlX-bH z((O`S{!JwuBYjY^F=8w4Cl-XNF6>TAF`2Qw(d{iNJC(c-pAzt|Vbdw+|w zGu0H$#l;2I!avSNH8RX$i~dLU5^qU@O=AF6MJxM9+#=0V9ZX`*u}2nJ&(|ed6RVl- z3;)#NyAUAf))-7xCvhdWpqG@8;7C$P5wOk(NubHkZ?mnF_!h^WAM5Bd@? 
zwmVVOmddVG$MP%j{;hqYaW6^vI#s&O@*pc95b3HfuWP`+vQO&UgvqgXF0-30mRFFq z8eAe}W#!E4oZcn1v5(YKA(zw$JPdOh=!%i0_Rxjk#5oq5mzMV$hcDg-soxQ~(*3&K zT=>8Dt3|TB^+TDp{`a9jAmLu z9BfirLpo>Hyu24(==l-Bh^{p^FGRo@@{t2GFt2vYu`K!doz1vqk)a7>H^JV|UJXa=@ zK0nA{uy8yT#P(TCi5(rgR(j-GBfOvO^5&l1Z1J_K2gd&1%HmDN;-Llv;_lS7`|HA$ zay&;Ni9HnhMK!^P=g!&C@TR*0Fzv}He9O-j?}A~FypfT-DhXWXv0rh$J8Yy5M&kF$ z)vMYpWbnsGM4frhz7T%4u`F!YS)g^l3;*t*n8>T8kZ3&7{0@NMfP9G&@~C3=E=~`T z>GogCX#24cSXH57%$Sb$eh8I}l&iAQw`OPi?(S}t=sgM}LqpcLZ_i?)MuUkV+sw8e}Hvq6y`O{vLV#zxld(})-52__w%{JUq- z#v%O|MpulQ1(@_sF+YjSVB-38LD zHA-ic!K}69y-qYhbrD{8%OIpRVDmk(XV)x7ZybLoo583oM%(YkL)6IFkd=;3F5z=R z4_rQrZ_tVZ2oU=EYJT8@=3dsKy5*(Cd+%JJ6f z|D*1$!`kYec3~>ifjTKgO0iN3lw!qeNYFx|IJBf_aCa$13L!vncXxMEN(sf?y+{ad z!R71?ecp4P-}PSSI_F&9KVSYRbZ70gX3g9)bIC)o7zqmm)j{Tav(-V zm!aFoBQtSS8G3xE`|BXuv@5}2I1$P(eh~mEoi<8C@yXx@8VCx%b$QR1eEHIv9C2qG zZ~K+B#i0BRU-E(ctU`y6PkggDjh9-rU|#o?3Xq>Bym85kF(EEJ{PJb)snYt=X{EFw z{hK z-7tCwd_Ca@jVrWSugW_BR>Sw?uJusShJ*jf_<^UhX7S@cSR{J#CMP`N&dxpnbJVAb zWEnaEW?Tdy_#fHxl#BC~S`F47w`y6Ptm% zy-RLGuhSjT>TApn$e`x#0SQ}5=d&wqi~#)2CP&iLN9%9d+gCy_dtE%QeXHa8>56JU z^nsH%_LX;4-kxB@I-22gQmC{Fa5SRwgX-VceK#t9R9e1w^5jV)`e3;6E zs=oRJsJr3?YlF9ZlIZ|q8CVv4Nlq*ZP?a|J%e^@({T%BU)eLBlWQuO8(dL`<0W7n` z=7IP<6+UjQWpW^E-uRd>rd;ZL%Q6X}`~*&_GUS1}zxy?o@L@|obLHYjMHK2Iqt?@u zw=AkrY%tHXCr-{TLzBk+;bXMRiJf0br3U^mdNfUdX)AHnW74SN*s|D0xYL4LX} z=f*Z?2ff_)+$g?eJL+98(DWeSu*QVD(+X(LMs~CJ1V@DAB9<&mn&Ios>0R~L=tji* zd*ljpXrmY-QXj7YbIL`P6s|ga-T%E`ef>I%y{&TL^*4u{;Qb;T0(2oX^8I;mcv))4{ft-V%cC0BT?1slTHNmw~<$0It1q;v976qN3Wg z^>{P#%~>D8BO-^*v^YHG(B`;Gs9`;1GP$SjP^zpyYsS9;_Gq*rggIAhrNRk`-V5Kg zco_*?BM>9Ew*-Eai@Ot5$WINXUp}vW?QV#^QP-umniD^goRZDk>JVT+r+2<95RM3v z@1KqLVHhI(b;XYtxD?>HH4FTBWsm^&DqOQpc^bh@rvHCmEvK8gjnE=K-Qi8mzk8tu z{g*(|OyakP2nFz)nBcxS@Z(WQXA%IV9|~Y716=gp|Mu#;o}{YTRUlXr=v^G`t`_M@ zKlq~ouoHsL@~$utkr^J3K)tG^uz9HI^#Y;IbvKa}M1kCOfzvlUKmtYJs+92m)l~_* zyB70Zz)GE;{%yT$1^wOs-PZ6I;gB@Y+^^hUpLQf)Wp|#*o|Y;YLka4J=(I{EASigF zc?ulL)56x2sO+1X!LYGxqAa+hKYq1<%M*wRd;>}}f=M#ts}*aQC%~`&fNJ4PSIpVU 
zrvecCy5ErJ01Q%nBf{I@~zy}fAo*@L^nFiwKKbQG`xH@{<{Hh3>*S}{!wWTW@fU+EA1G(mC z7AO=M_rKQ$?qu}Ul2-Ze-~A5-{FMw`?cIN__CMdF{tjB4mg?{B=X(G>O_KeGh7)l; zM`n4TKY5=!g$99^$6qjPffh0)`tPp-_&G1zngBh8kMF zKdb$pT=k54!{YX2t}`7p%ewH{JfV8_|7Cz5Qq-i~^T3<`<&qw!@#7!oe)dmL{J+0C zl^P)N$cKkx0i50O?>uyolw(voPk~FW5L3V*IsTg*2LBrcCH|Ge{;#f@tqr}>3<0+WO5~m|iy$JaA>^0gV)p!pC&_AyqDQAJ?pZ`Ca zJqw=y{Qp(+CS8@Q(sPV0t+s^0W5%?ND$(x!9CUWcER+fOW?2HgF9mW5=;FN{3g+<2gXxB?;rj$aPuAvp(v*bt)atb9xgCv zq$TUfj_V{P3!~-~oR8%9jvm5|^t0iYfO$sSAw6>41V$riJE&e+IhDI*SHxAQ^=pq; zIBUdVqRWO$)c7zJ22)wDdR(P zHVnk$e#=g9aaeMok6^2uDjiBNcq=rSo6gBFhv*kh85sD=U7^BOP%c5xNyg)Tw^TG` z*}H_}Ln)|<3f#rF2Y5CHv@IJTJ>m(qj{ePg=X^9ZHK=jdp(cvXHSiquJ88P025zOu z|4w-^_(HDx9W;rqL{g41infLpM-A<`V+*|h3ih!=wWR=s3@Q$KBkE3H?+EokQI__z zh|3XyBFI5tmC(pX`q{}8chT=9q`sm6>i#X6r+;`NNFIy}WC_7nDj+a>rn`m_k1`}s zEg6|&K+B!7u-`d+Neh(m-E&N`1n;}tq_vLFI-Bd;W_Zg}{?)ZrEsf`?Y z*854vZzxj3s|@L#D=Z{X`(~9Yt|mP2{*PG{8KADMAj_O&_n?pOmK|AeTJYt?CKeD} z-j`tr&F%=)F=K`ms^z=L_v8^eb)y_+aciKDN$~0!1g0WUDc}77^#Y|PUCbpG$&BOu z3dR%fu;g!Q2sR2@b!yzZzRy_}{*77v6uenZWy>K0C21<9%ki!BJk71`vLe>V7e!IO zA^zfAxdW+0iwcFGW4Mfz(*A_B;2TjM`_ouLmE)1eA(s~%uXVLt^H8tNT?BRKDlcbe zIj;mA5L?g)bNIrkpIMzN0M0#Zg-eK@V-AUkNdlMnZIFn_HY611GU(a28ZLK^;mXm> z@>?7*m@TAJ+1_+KTHidM!>FP>aPqAWr6c|{zdy7WPY>?y#RFKRc;%~ZJ5*#Zj*`+} z1#2Z&1+G!yRT#yoD56vPqVQy;C8y-+Q2A@RhXW>iD(F-tm&3yMEn&}kHCtR11&*!r zRl4ygQTI@}D9f^v(sq+*kXWcni2Y76Z`mxmt72&UpiQ?D zPm!#?EhKm3wVHtx0KV(Aw(TSHfx?8-Mya6P>;tD09A9BwdjBs8y0ND?veHw2`&J7v z^g3bsEs2kgv&hF%&t)rb&lS7;{Tmbs+0i=d%*!dWa2}SZh8x;uJS>+1a;-GCO8%cWpT>G!P zg>p(x{4DH%2}}#hJ=C6d5XaEq0wU+QT8whKbk&k&MJ0m=7JVfI@ay=4JY0dQ&iszB zkO=$HL#UT3+~vCoNTy#cKY$U3Z3QHgDK^*)V@>@c4rKsDFduvLb?B8tnJm zBldSgPJ|y?N6_Fn;6^#^bYO~1e(3>(4*}Y?kY4WY>aEsi6dY!S#L+LI50r=4@@PU0 zpQqczImpXQ@GwO(cPm19n^g{^&x?bKO4LF`q;|6S(sx&DxZ89UVB6pOQ+U#+=G!Y( zSbmSKJ|c74+UV(emM-)d_XTbQJ-aIth=HM7K(>O1r^RejV z#8xjqb;6HlbxEGcb>HeArZZy!nI+4e%>Z9E9agA}SThlK<04*vX8tPg2Ew;5TRSRT zP-y&o3Z4CIVAa;>g)+VA{gS}cP-x_roEnDLr`kax*dCx(LO7_qtGCBW2L>6#^nX)c 
zrcKRZ6cXJf=$4ROBIjlmGVc8`nwDHe?o66rwzGcCLLs7<|ceh&;5|W6!2N`>S zXsO#88+D^(kn-pw6srtxxg$>ojL!F9qnGJEpV(SIwM#vT-nHV`u=}*kJ$4_DYhey1lRou|b z>`P9c7pq`~S8iM?5nRzL>SJPOm#{x=J_jh~3rx5UiZawvtehu@&$8>+bzOtbl>@rm z{EG$s3q=EQef8XGi9q_Hkpf(W1HPPkF$5qfu9q^$sYzjyOi&r|VL(oG60)QZX%mm* zCN%SOQ=Y&Xq}7{lz7D}oZ*W5R2%EoVZkRX3gaRuiD?tFl2l72lbj zUHzD+k}yOXlT4`Ta$A2m428_^XMw&4>5QK1!aX37TZU|TCL4n)!AS0>5%ZWC#Kd(4 zI36~;SaqONpS)MOZH(%Wa075e0DbpbzF7t8r39al`gA%4!1KbM+#NUVO@%4O*z}NF z&5tv=DbO`y@NlaGy0pcp9Zg@3Wk%?9c8T`Yr>72}ix`qg5G;b0^IWF1DMj*NH!it+ z(JO9lId4B-=~%P3icHKns9k?JotLn*su;oMPFs`p{2Zx^y{B}=(tRSK$@E|MLm!VjF1!W-6%t1H zQ;HGAF{;8Rf15om#j_aEZZjQ1MXRd$zk zfsedD(I8?kA zr|)g0Qzvn)^i<0Yu?*}{%A>C5#P6ScklqZ%=j6O*BDrXJ(uZBF!BP@&&kB1WS+3FN zpZa_-TWS!{S1-xoox|^2jtaAv>~t~E)#l$VS{v!GY!O0|l!XJ7_7!|N>*`rF`-Esh zZIvc}mY#O8V!? z>O7VFp$!D)`Ct0nH%-kZHxI1#5hK02gT_;-(O(cvGJlts^#Um`-I1c4eP4l2MUK_6 zl*LTPZ-ll{uGug`72r{>ru8-tU?Q}IAT=p(wuHi>FA+z+gjP|QOMY$9hw$Q;(%AE= z-zFg5bJoxb7$DZ^&ouE06COmXzQoa=qUZuR%-D-ql^T=bbXzC=Nc*D`Mu3M*rK-UY zW;bqvNM8S*S(H0^eE0ymoQd4)K8&=lcW*Wtq3$oK@Dvhwi#5xEec>GHA zg3>lkSZP# ztd5#{k_GLd4eos&vz<2-h$OA4gM3(a(FMl6>Lx;E8VP9eQ-ao5=+1JvEp9MaN>%JD z9pfxfJ_Q^JVK@a^a=f0#a&WJw@fk?7ZII#+b*@nus0*nebKKHU{3L2$J_|xz~~!} zRD*+}Kj365-&w;#FO^ zKj}2|3$9mn=_>CJ@NBgD)>AMoDCk`VJF6UWpFcbW>2`!PY`O#Ov)r**XUorf{0BZO zVZpDur3RBccsBslm9CejA<(y(8cW6Mn#(pzIOvl`0ej+6Xcd)tcF%ica?5QsuzeyI z%%+1#o>Iu;ZZk?T!>R{<^BL9uBU}_55i`wU>B^Qm+#U)H(<6Uu)L`zDtf9cVP4+^~ z-Fkx6`5xzOBVNm{SkahCj$lTd=Jy=1&p_nHMlbcbJ)VjW|H4`Y;YQQZ8YU!AuRm`I zYqkEK3j#0$$N*s+E&5Bp**EGvUcA37Wuc1e4C)}_c64X+)N}=gkWn|%cS3@gapq|S zuvA_R5ekGL{=D`VPBSvzAxIBj7g$$6nvJ2(aOm@`@w_qc3OoH=R-(da1dcY-eMyu8 zt)xFy{3E<%;9HsT1P4|>UURM6&1Pjsjd2;F%e=fqL;;p^U%__!t7})nECn^?H2Qq& zw|U=<;HmCU_>cug-)FX3yBZYZS*>*rRJ|%2W=1S>g+t_~Kq)Z~j+|3JbdiGt11b8D zc#1BA=a?Ds{j{DzfDQ*VPD_~zuY}FX0E`ofz69+K31M9V>>Gb8<32zkibE|wmwczp z!$?{$O~{g5mVBw&X0FOdMDZDsVV%naY9Qx2ZApf`*?jEfJMa7pvgxI)b~CVE4{Nys zOTfLSsL^NG_4yuIkGsd*o7M|E@|WLnc8~Ggm{}{k0SqXQ0t#Y>x^PumsT^Lj4jTUf 
zXxOns6dVlf(axd$_wy{P?Tn+gd5thRKq_Tp+D+>a>g=)Mp|pDn9d>AK8n&D0Vsp@V zTzx!q!QM0##(In_vG#vA0Pug;UM++^lYT<7QG4ZpkfNAms=K_Hjnzd;|J7}2~%E2ob-uSE(E`g_T&;<_?)92IEex#4xk-LmO-#Zn7?f7 zjtk7_O4F1-s&__8R9>LQ6iLFf~n_7p$3s7;_fyR zG9>CkZDxmndf$6d)^Kj*ud~^WulhRoUQmq7dzG>I^Kk6~QqmT<(NW)-!f89Da=N=G z#*+d17^%R{YGFtQRg9Hon8!1$4pja@lbe{16!%y*30S~3H4-M=zP4{;B8{~#7#Zz&D#4EAtvys zE%f`!TzzP&KTzRNGDdqx9{}z90l^C~p4;3Qc|KmSZ@lsau`ZDrx*^@s+TEqASvWhP zT5NopuQ8CugJ-+@cLb~sIN36A6(?16e<~03!${K=G}6NPnH0#`@f)U#Ck*uEcY%p$ zW%~joN*XLQBQ-Be^Yi_YLh?F90s(Ny%+TUxitX$MFDYXMT7SZ9wZ1pk!X_=@Dh6Wm zUyi&)tACI=umf?5Rw-`s9kGz9s(uADC9KJ>2OD-9?WK7VrM+9MQzq3P>e!@cbaY13 zw^hnKQ10W(heBWoVga058g*PU?9OS7MPYA3b22r^Iqef8%M7a8N{;Jyd=4ZMuGbzb z$xN^@E$!AeMw77>kH0U$4Jx=>j|}MRIlx+T&!S~h0o}~0yP-4hTtW_t4oRuLtNuQ) z*pnP#lLakOYh1T#aKW`pbi9AAB%Aga>w*tljIxFyJgIDpd*1Uw4;acpHkOQ>j$v7` z7IS334_cDvr}TF;>%J_BCe|@omSfyuMYd*VH0g6=V~m4G<<^2G_MowOa%@Kt08$!t zV;pE>H5_f4ZDxxSLNGNYdp1)XAv5f2fQDvY&T4$Q5ZVDv&8ySAl|OBAv`X!?+uc)AyIL5B1uQY; zuR>OdtsCA6{{VNIuwC0b8rEN}kM{Hg9F(>aq=K}eY^f#57cw=?Yv?=truaReX8n`CO8SJkD~B{L zv0LgPMWgDhRX2e2-pY1cpPPp!gCkHNGCU%4V6s%323m3Y>eXB4TEpKE)M%M1p&AuASTH{D(&8?*A@PV+@BHi&jE4J~; zIL=voWO>C zR?Uy6P?Z;}s`tk49xEla2|D5!Yw&2VpGf}*OZ~wgjzIgm*CuT&#?zV`^YX+WFbYB0 zVA_I*vD2leX~He(g8VugLW@Uo^PVMHRtLpB^0FFpFUJ!^O(<--TGJQI+=&J3naYeV zrzIE&fl0r-V=llK=9<`ntm?z1CNN`ky(msrlDP4sCu6s*`6E-E0BW`%ubSDiIQ*ea zwZw|-EJt`lVBNscY?Gvp{7U>h9)z0JRi1YHGl3t`3I86-x?M@o#rDrb=g!%>lBP4NlB-zfrjCBb8Ow z@Qp~=PHT8~depXHedZDK+ds@eZR?8BDNk)^A5k>!fXRUMn>Q3jPnj?LC037d`kylQ?Q+z|dp66eO+)sox> zqQ~Dlao{s~wRW0}q~z?(3+e|qvUl2?^qs*HrZAGjikwxYK;A}E(5?mDQ|$GPFG&Ga z)dNPUL6wqm;Eydj0I?wsp;G!=e_T#i)54#hGH-hK&nmhTR+Klou^LysjnHt}aLeD} z`-8aN2miemKJb7<{ov)LT^x93W;9Et?>f-`RE!j=k>=*pSH_4wKoC|xyoy{Cd zYovz$ST-A%xKZdjeQ2$2KmSX@IQs*IaVOB9HKn%P2Osl=ZHg@{b9C0iJHq+nt-M%x zXJ24*?$hD2Y&5$hNG3Eadd4dplJtjxMo19Tjg(bW(D(S7hW7T%3) z0KKdo6>l|b4t$Q)D&Os>n;8$<0Z(GoyHj1Io^PR(}) zwf7NME#Y43AF}yNEfbJ=tF!T&1Z%F-j>NcC`W+&T$?S9*R==SVNgL zb{|#;Ndo&HVE7={M5l_O+fM}l=th+o-s!jvWBKVzaC$stWx71eS|e=VLoK;eBH@72 
z!eDTHRmhIvkM0hog?SC!)SVxDvr<&<$OU|CE~ZQg9m~={2q$TTbgT}{z*iMTJ_e~c z<)*5C8qHKE1;j0hy9W$Z%LwXeur{0TSxnM5W{Rge5Z|r#D|CCeIFzjky7D!S2Ajvk!ja!}`Ep5XUB^HfM(QSGlCV z>XK=)%3r(y3|zDJW=wPSM68#sRWtlzcKF^1Ic~=Seb74Z&FWeXz*F-I&9#a&3{OAy z1V!;{?{1BGZx%+Cb^@HRF`Ja+5)+VVSfCqw z-Cy`)!$-MMh$VVe`@@{%ITEl&$KOh2@Mj6W?N=I8iJNgbRxOj_%fVE@(j*mkoKGgk zof<_IQe4PSMsKRmji@>s0Aor}|zj&)d>IJ90a z?(KOsm-NoPMR9GUk}w2fgK`=vD`b7PY4wC3u~ppaba;8ha&84?nf1 zzdl^Ui@j*)=$?^3IJ|znI5w;!p7*9|d;>7uyX4}6vEUrFAEGXm4cD&yX_6M$Ff`Xc zIlf}h$Eu{h)V5)#$!@pCM_{?c?W0O%JX=;0BcChhr<7<;9M(!A0#0#_Mo~&5L5mJO z!Ee{&B(pZb>Sd|SI>ZsKE^_I)*>z`#t zmIwyAUv^F|ln(Qcf!FQ$ulYRI1?f?0^dz{Ik~+dq9dS{<9G6}A?EdKGUJ5g>n|0F2 zGgoNrh}RP$zXiM)uNuN@QT8YadxNJRJhz)IH1xC9mtQ(6K8>J4cmuDyBDp{Fo-C}# z=^}Q9C(qx!cT3uwl87orwl%Q60&}e}jZ&@lYY!vG@LN(~x~rdFmmiiV0)w$-vqCdG ztH8f&o2`dJ<7wpzz{Yh3CVsjb@op}}7dXB&5fBjRz}pFUHQsZp>=Xuc(fn17Q?tUn zE;#Rf!AtX|o~`%Izz@^CZmT5P9ibpu`-QID?Dxhwmc9)3(sWLG1%K&C|Bs|~uP(i3If!Sd zKVW349Y(_*PB=!|bUF8P(~M(%;3lbE_Z06z1&_Dhl(|&^-};O^sE#!g#HH#9o+%D$ z-sea;&4}dRDApf3AKJSAR1;`tB5<2e-F32)MV9S_qm{c%cXQ=m{M9sKl(VAIMO#x` z?tGGcDUAR#r{-oy|JV-yNV^Ho-Ll#sQc`;&uRGHvUM!#~e|&X&885wEH}lIDt@$KN zPo_c~*Fieq3jbzppH)9R3! zr*577O0@+es9M@IHO{zo+m|uX?;4t^8v^~AHCLYa`SP@rt{(YPCSkP*3HPkW(%s*! 
zj0n$+$0)aRe>i~Fc?R)h(RoR4~*&m>B`!qn-I zO0xR42X4Hvm->EseN7Y@bT8cPot?I?pQuu!=pcY*_!-9 z1Ea6m6}$7BLI9B_P(kEE7fx&*eFvr#gThodQ)uae!|B5iTO1R17E#J6{zj0SWz^l7* zk)UyRm<5NXAved zMscJRvx8-1nY7(8Zrb|YdEX39KZB4rW3)X%U?gH+mbGy=homeK8*X<|F@GWp zi5#p?uB+wry{!CN*=j?%?%vbE{;rTWnRD+8T6@$A5T7zK&|zAn*70_X%xI_jV!I z8Tjz=xDsv)T!;&7r=MtPqJVjT+@Ha{Yt`yYCqgq_CF!GEu1n*zQTg;b*RvS*z$W*J zbCY|yM-}*~QJeUE)xsm26x4bhpj~fop`rWE(5q(hc?yjz!D+q0UqrU`L>F*(M{M1F zqt@g){L__qzF{YpI)W1fjIcTCFQewT$74(KVl@HPJU6Vnk6^3reY~04DRFF0v?_C0 z@aZJL5cNmKoPQx+^CUGuvuPbUARh!`LX6=0c`b9|SZ~3Zu!c?5;<&!!Bbf|~*EDhc z*EkvIYjU%SCo0WQGap$OnT9ap- zkj#O@$7~fnSN;)t$7SPN&raZ|Zqw;X`nsw?jpRH_n_q*xEE&uvSVolguHD0JOere+ zGt`tRIH-)`^QTobT?XsTateR8Ot2OE|BXeiV?39WXnr0QmY2P$a`f=g<*Gi}S?UZh z;IuVbvu!2}D|6}qjl8{H<=m8$?28$M=Rk zij?t3+{ks(N}|N6*|v@co7NxZaWk|cctaVL1^u{{FcaH@z zuhvATS(_e;>6|K}WZ9m%3Jh!2f_*Hmdt}|I1?$x288=7zw52>arS9j33t2zmE6XnPQ-1y0lI*1?ApV?BiQ^=6#qm(M(Ms1@(6uH(^)OUd z_WLMy_dqe`RB^V3aDGrHYzjlEWiQL4uA8Q4EhhmC0|N6w_=vE zarc{>iP=`CbKGW&gqGSfAPK&#_1WJ`1kn4dfxPVckn=~-VQvSQ_c=G%0pBp2$Fyhs z)3kAyCa)U08MR`HD8mVcUuQk=HF`!P;3r!%OllVcM4E}f+Xyy~s<&qWpByIn%#;>u z`&#C;jD$d2dhD_oRJ_=4pk_^Lc-t(u=v0|@%L0wN8x=uAYnx?+&5Z9~ItpFm#(XJ{ z0m0{8&H(Ykd{1|(s#r+nyI%bXFqg=-;bMuN$$;*+0nTSFiLevdE$3rtEq{?&9|i^t zd#0kpzNC_v>E1QMb~e_{M(1BL>=+(Q+)}T5BVYCO&LZ#)h5n=l<^aZSG4ffTx6!5Y z9xb~LyAi5g5&1hK9EQM+U7cPZ#6)R0u*+C4Oj-F|yT{a}{abO%X`NE;1InVop91;m zr)#d|-Wn5nM(u9m(&E;iMgCLNCYDm9$2rBvb9+gjBy(T3_87(hFvphEY2KDAsT|;> zbX@2B$(5rs5=mFOe)U3S_ipoIy3JGrVKXyY4t1NSShvdP*|rh~0Yf6mt>Z@e5uUKa z**xJwf2xWB>ngP~!gh{j5Mt3Y>`skQ;W38%lcgci|QA3h%Q(&|sT zQMG}eiskVq^4G6tH`Eq?O5{z(jd_6_X$0esuHhmBCNXa;i`rH=HiB0W8t&oK9{>SaaA-~8MIXZ zNfFsGkXg-heuC0Ly>%$y)>XOYTA*cF=4x8dQp?ewujAm*=T3|$Mw89zCZ(P-(278X)tSzM7`PZ zH2&O=y`Xp0@9LNrp?QzVt1~^r$;o+R_ZC1TEi_{G!OUVU4Rp@G9WU%sG;BKrgK}R) z7D=(R{O+2$4a9JO2=So1Qub7y2nin?5k492urFR#HJm8M6yS8!CRlDn7JOB~vp!oJ zmL}t>KzT~#ZjIOz1_lPUw=*v;ziAn32NnFzr*HMg)p+aex_qguik%ALT-tp2qWzrT zUMJh}tEhH0hY=@2jh$H=q0c7sI*BApZTDIn5A_}PWz@w1qDZJwmHzFxvYRoPR~^hj 
zrp$ylOxri#oQ&rGga=88*pnsMmoP9=w{vM^9TNg&PT`NH!`XfGrfp*x1$;}mr*^XW zq48#h$WH3#Af^Yqeoh~nvO5lnK6UGk?i`|RcW1c|?bS`l7dAP56qtfxJMhO%%Q>uE z)#SF+9^Ag&q{~=2)M)e}(-UvS%YIf%=VcJS+FMm8h07WpEXgW<*(ZWAD78uc(L$Gl z)nr<_K@USA8ZaVUmBc{Yr7koeC;Cwjo~m3;(}Elsi#GBebk7ZRE#L(ObJQ7=uc>=V zJ}UouL=huO*n zKV=$PJ)0dvTN&dITD*MGFsSAJBQ9N2Adc**e3`>usJ_3PN4!y^cR5|QiZbSsebfw)NN$$6lr7INGm#eQ4U-~$1@;VNA~hU}I+~PDQy^wNwe#BtHplf?i=usH zD>9CYk8-ap&LXR5 zXQ2UbRb?|EF!BRM)Bx|Ib2O~%P!QHCh^BuAhOiVjqsv>v!WO<;iN0x0b^QuLJeU#u zgV$r%Sy{HMKu*cLVn4_xX!o1%o$xn4%%XZPgy~6Tk}vkX)1GV%=}lJ{;5r`r zHr4uo^UCif+dSnR$4vRWrlHmIc_cCKjy(OGnwLM>LRL#EYhJBZtZX0Pcn@9B8v-uJ zBIvM{vZ(zCw$!x=XVC1)y#>$U44oVYN`AxmUCS=2i-aM-Ik0U{W1UwcUWN|~&#gG` z-_uyY2TtUM-F5L9&pD}E|9zo!T|_FX$7VwYDB8QY1anv6*&5I9xB{()4CTCY)CyVJ z4F^)na_PWd?G#+zmT^`sc#bvYHJyr}SvsvtUnz$wJn+7hsY{ioaB|+0buhAIM}4pc zuGzZpNN}Cr$so?={mn7awuC*uZHNA;5w7l&kjq8KXqC2MAc%&U&%Qvz__w+r7CTO6 z0Dt!~4y;Fp1}3mmVG~c@9}7uSv~kx@uy#7cx)cd*Vu%YITD#B1uSYzzKV98bdsT4n zzIO-D=eD0ir6yapFHWPxrLe#B6wO&q5X?l{3U_amO|h36+5LxB6y(9E^v1sP#n}eN z$D2d^y~1e%$ww)g-P9xUdV89jTlz@h6wU)bzWn2&+T!hQ9~h7u*veUF^n1BC6-RFLk-2m#DZU~nhW;iTtHwf2GBJ?e%;g) zqKy`I6tqU6&Sfr$MJ>+q)64;UR_R5+;$SEs#y4ZN2>i)rqvQPGr1|!(x5tL2=WH`A zSXt0>A|v7Jwve8xI{-q5Fj0s2OB%KgH>vv!2yRk2e64q|{?gaA&LFePspv9?MAk9Ml`%&o4w z%tdNr=d6H)J_|9~o9u~pnJX9O0|JWaCmTpXVsN3g||i9HX-5VtsF++;AYYO7(Ep$YIjus zwJ*+&(J)3G0+jTVlg3`6J}RaY78K-BW7L}mQ2BQ+3q+H|ynQ{`H7zI?J9FMMj34rE zN~GRc)+e=Zhp_ixJwO~J_vSxaT>TLlJ*$&`jV^-ltlQ@s*0t|#m#Exc~8y35~~Y} zV~&@@G%Y^3nUhSE1`1sptVZkakpMt3ATAxr8)h z&wHUe6)f8d=^9|!LbA=l$~M7R8i=Yd%ntcs#DkgVwqgVsWkaySq=Xc7Zn;s#bYnL# zI^pHyA-fIU2SA0`gHJmUSs-(s`w-SO?~~=jm{q8a4aMIuILTMnOJSQM{yXWPz)j^h zOs?)c3^}SCVcsz=<*4_{!9YuOmElI&b!~!nquo;sd~}Sl_yMWU?${?4Wzoj?e-Ir4 z{G;`w`)PR@!On(tUAGMvtd=pGk(-0S!UbE`ffKH3l4nF@h)0S=H&%I1za5H!=r|8| zlq5Gtg3+FBC0Sk1la0Q4+3_?G{ff9o-psR$^}Kgj@!8{GDEOQiTjSp64Y8_#%e$?! 
zmZyVu{Rn}w+0#g^AvDC-mpZ0Ud(7WrkhHXqgp|P8Em>{zMuHm}kyf@O0nR z2)2SB1XY8GTTV^C#cX(z3Tg0`*NQ}jj~C93_b~c`gR~`b>4B4c`s9&J#cnGu79u3{ z%=lt;y<#>UbPEpjQL!e@2Ups7AO)Kw{j9NyH*gno0gk6E$U1N*kwA_hMieCAa@Kz5 ze_9ZW2!AUwY^U8RVx(~fT2z2nTPNfU@((M3dp{pF24x}W`Tgu>$1QL&;ESb;AB0d} zuCG@rG7VLKLJXNV=RFnt>jT&eR}Jd|o+P110?d80i1PzWffs&@$rN38GDh&s|J~mU z-~q5JrFFp`%nNnbr5PADk#R?K?{ndF&zq_TFn;4X8gROXj?$)C$U#*mHgO@#97)ATUf0cY$Co&3KnXd!b+px!d2rRVXj2qn*N()kZjyb&etck~&e}h0m$4Ma> z8bUb24OU%hXbo4fPv8Ek7S}aqyjI2P6&MX!wPrb|i}5~r=^^+W6K%`mV76ic!hX2Y&CVrqub3!OVE2wljooJ;!8Uo|`527qa`BK~B(x=0rIXVZXt#cfL&d*H#^8~Fa7i(8|df* z-%{I8i@}LtzHR^ssjsN!Lr^F2r>`xHr=3pRCQF13Yb>m9XCfb9W(@(-xH4`_cCaL2 z936pJ4F47KmjkI-6Az@;h-Ui0iqX^ZycZDr$Fc-2+jtFo$ecSd<31(IjL;33?lm8_{ISer94P1RLME5nb99>HZ4Eg3S@su!DJn9bWZGYY zZM_=a`SrxT;7C-fciAuy`EFI2UhC|F1TEgm1+n`0$E!)3svn1DZjJu>S}k1kcW0@mH-8AmenNBaKQs> zg-*&o64ZSLfMH5q^AY25@WJ^{RGv zo%4zgb~MMNGVdP1#$EtvXZG$m3BNG{YQcJ@{O=omGv*?ff0RCs<1Hrr{7`X^AqjX~ zWO^~KX7j}ZTq)k>ZbXA!F18E|=-#$4#MKKL1pGX(u3HX}p&|iF|5#7lm+^3FL$&>y z54P!Sn9?py5X&>qV6CrTM0EsNU;u*upleweNr5yKDv+C7i=_Z;+>SetAYaR8n+tEz zKSkBm;8g(pQV{5;{edF_Mk+Li|)#EbXarqP91Y3o4BWUAs}2`=Q?) 
zg$Wlno}&fDr;D0x(J9kb?zqsitfi1SFoRFH0~UGLqEs{PQxtf8R#&}4QP8O0?1c%B z{d*0L?s_J{lbKn_7`)C){OU|QT1l(jWa$nn1nM|Iw zM4m4$@a@ZVp*}gbec_i^-9MWxo*EN1ux{tCSj~BYc!9ArV?PTPdyWR?=klMyZ?5I4 zXRB3w8n&cr1=@mg;iKX?okZy8g}Qt|1;#6-Ou(O7^%k_%uefI|l~)F@M4OPJlZQAh zDY!x+@nq#uN>>9y?IT$aYU(P5En-rWFYG)7;%|5;2)2ummcpm!CEQe({s3L=HS;|G zileUn75a}q5BXvIJzjWf8k#ZvX01tTn53ug8HyO+htrc@4=3TDv`8xq6s z{Oy)W&2NBYji=V=ARa7#JoT^J<`REQI!DqX z`!2?o$d_j}DezxVmA_kI7a8GRNF%in^m3d7GB4n{ICT(>db6} z8W^Zf3H+@TIY3>)rku(6zpMhU?A)n~YfTUaG{ zewt(xL0Q79+%)E#l8qRVsqXyuqp7PtDX6%sMA2^FkcR%zW(Y|`kZ)`SOLwD}9}yAr zT<0N&8n=1PrE+|7I-S0u$2H)3K?V22mxOq0)T?^ssr<$(5?jHqi2$N`QOUvL;H)>e zn|lHDoy<)~YF7a=NdPSWymPgHZ%FYzz);Bz;jw9Tk$^^+dih(x>LZms%LezZmDlE0 z#(Ax5olZc|l__@S_4sU487WXUkd+}{^0zL*X=I1!MEb2{-<%Sy>jws(XjyTh^FG-C zsvEa){|$wxf9T7%N!=KYU=k+5xpm0kc*F7OyS9~Yfd0UYVTY4JRxK*> zke(v*((LPtGiKv*N2Agon!;3|$91B;lskGk#4UKa4Y2L}k zn(mcvXQCH`TME`x!CYw>MIyzHuSoR`%cM}5(3{Hp(=e4dEwS!uRe873b!uLE{>i0z;U$=^Q!7+7T9swY4$VjYm=#_B@9TwStH4!z2*0d-{X^> z)HNZKLj4<;0{w4JMrQAP|Embk?tj@PPT39AtCa5PSrUpuYl&=j%SbrX48#7B?8y>Z zi)Elp^Uu|SOiMYm6q8CfSw3M+Z92%JC7wEG1mwHXlU3KoiW+>KUd55`M5m3+G6V|g zayD?IynAWV8cUR>Q4Yn6#T%{a(1DQc5aZlV@oH z$H)BPJlx`~OQ*WEE>4_$%wE!*^~!%S#Fmk;^Ad(frOo)OM2F>SHK)5e4+2=~*jF-*d<`aWRPG(Wd4P{BAI( zpqCTX4ESg30k-%}hjlrTY8G#E6DKDIiBJu)*PT{Q=0G{2%!J3xX3TZxYpKG|aW ze_01pPUDNcJE2~B`Fn(+yU^R32dSk4-`;n&S1LsH9VvJAy*Fut);b{Lm1J;#!vg#5xiOwS8y$J@vjnNR~DL>7G*&Ok}2cY=J>v;{%_9hzSEfmGi zG9*2F20!EB)iCn!#Pm?zWyJESzVgfgrnjb+Xr_PC@V~}caMi`FvBQ8qMMelk{8}%e z&z_Pb#MLt7wNa~W*efs$Ah*B7%tvtzxNcl({jFA3th=z*FOD7n&TVZ&g-5<)u4fio zmpr@>B-TgHBnTs8g|5kX4oYAC4SGsAn^v!!v4COiL;Mut#7uucm(TH7WJFGU2}9fc zIZnBQ{Si_i#D!(juYNcV{^8l5i{%FGOst_rDaWeuS4c_2Jl=O0Em-M-v50T6d!4jT zU~5ZT?pSKi$d0r-prJAgsK=qxo&+d0GL_17^5&%Z9daXg1^*PWWv@RAo4&q(zgYX! 
zW+dNGEsiJ!qeNPwifR*0o1ktv0DdFn6f`G5L`w7?wgTSP}@6_4MHE zI>7!)^-sTQC%+n!Q9A4<{e<|aASUlQTa>q$QxJ0m5q9 + + + + + +Network Visualization + + +ptb_embed_2 + +ptb_embed_2 +FullyConnected +num-hidden=256 + + +ptb_lstm_2_i2h + +ptb_lstm_2_i2h +FullyConnected +num-hidden=1024 + + +ptb_lstm_2_i2h->ptb_embed_2 + + + + +ptb_embed_1 + +ptb_embed_1 +FullyConnected +num-hidden=256 + + +ptb_lstm_1_i2h + +ptb_lstm_1_i2h +FullyConnected +num-hidden=1024 + + +ptb_lstm_1_i2h->ptb_embed_1 + + + + +ptb_lstm_1_h2h + +ptb_lstm_1_h2h +FullyConnected +num-hidden=1024 + + +_plus0 + +_plus0 +_Plus + + +_plus0->ptb_lstm_1_i2h + + + + +_plus0->ptb_lstm_1_h2h + + + + +ptb_lstm_1_gates + +ptb_lstm_1_gates +SliceChannel + + +ptb_lstm_1_gates->_plus0 + + + + +activation3 + +activation3 +Activation +act-type=sigmoid + + +activation3->ptb_lstm_1_gates + + + + +activation2 + +activation2 +Activation +act-type=sigmoid + + +activation2->ptb_lstm_1_gates + + + + +_mul0 + +_mul0 +_Mul + + +_mul0->activation2 + + + + +activation0 + +activation0 +Activation +act-type=sigmoid + + +activation0->ptb_lstm_1_gates + + + + +activation1 + +activation1 +Activation +act-type=tanh + + +activation1->ptb_lstm_1_gates + + + + +_mul1 + +_mul1 +_Mul + + +_mul1->activation0 + + + + +_mul1->activation1 + + + + +_plus1 + +_plus1 +_Plus + + +_plus1->_mul0 + + + + +_plus1->_mul1 + + + + +activation4 + +activation4 +Activation +act-type=tanh + + +activation4->_plus1 + + + + +_mul2 + +_mul2 +_Mul + + +_mul2->activation3 + + + + +_mul2->activation4 + + + + +ptb_lstm_2_h2h + +ptb_lstm_2_h2h +FullyConnected +num-hidden=1024 + + +ptb_lstm_2_h2h->_mul2 + + + + +_plus2 + +_plus2 +_Plus + + +_plus2->ptb_lstm_2_i2h + + + + +_plus2->ptb_lstm_2_h2h + + + + +ptb_lstm_2_gates + +ptb_lstm_2_gates +SliceChannel + + +ptb_lstm_2_gates->_plus2 + + + + +activation8 + +activation8 +Activation +act-type=sigmoid + + +activation8->ptb_lstm_2_gates + + + + +activation7 + +activation7 +Activation +act-type=sigmoid + + +activation7->ptb_lstm_2_gates + + 
+ + +_mul3 + +_mul3 +_Mul + + +_mul3->_plus1 + + + + +_mul3->activation7 + + + + +activation5 + +activation5 +Activation +act-type=sigmoid + + +activation5->ptb_lstm_2_gates + + + + +activation6 + +activation6 +Activation +act-type=tanh + + +activation6->ptb_lstm_2_gates + + + + +_mul4 + +_mul4 +_Mul + + +_mul4->activation5 + + + + +_mul4->activation6 + + + + +_plus3 + +_plus3 +_Plus + + +_plus3->_mul3 + + + + +_plus3->_mul4 + + + + +activation9 + +activation9 +Activation +act-type=tanh + + +activation9->_plus3 + + + + +_mul5 + +_mul5 +_Mul + + +_mul5->activation8 + + + + +_mul5->activation9 + + + + +ptb_l1_last_h + +ptb_l1_last_h +BlockGrad + + +ptb_l1_last_h->_mul5 + + + + +ptb_l1_last_c + +ptb_l1_last_c +BlockGrad + + +ptb_l1_last_c->_plus3 + + + + +ptb_pred_2 + +ptb_pred_2 +FullyConnected +num-hidden=128 + + +ptb_pred_2->_mul5 + + + + +ptb_softmax_2 + +ptb_softmax_2 +SoftmaxOutput + + +ptb_softmax_2->ptb_pred_2 + + + + +ptb_pred_1 + +ptb_pred_1 +FullyConnected +num-hidden=128 + + +ptb_pred_1->_mul2 + + + + +ptb_softmax_1 + +ptb_softmax_1 +SoftmaxOutput + + +ptb_softmax_1->ptb_pred_1 + + + + + diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index ab0c678f581d..e895d8389e74 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -65,6 +65,7 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla #... #--/LSTM-part1 + #--LSTM-part2 # now unroll over time outputs = mx.SymbolicNode[] for t = 1:seq_len @@ -92,7 +93,10 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla smax = mx.SoftmaxOutput(pred, label, name=symbol(name, "_softmax_$t")) push!(outputs, smax) end + #... 
+ #--/LSTM-part2 + #--LSTM-part3 # append block-gradient nodes to the final states for i = 1:n_layer l_param, l_state = layer_param_states[i] @@ -103,10 +107,12 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla # now group all outputs together if output_states - outputs = outputs ∪ [x[2].c for x in layer_param_states] ∪ [x[2].h for x in layer_param_states] + outputs = outputs ∪ [x[2].c for x in layer_param_states] ∪ + [x[2].h for x in layer_param_states] end return mx.Group(outputs...) end +#--/LSTM-part3 # Negative Log-likelihood diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index 2837ab7d8b55..1ea93e3b6116 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -31,6 +31,7 @@ function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; m return vocab end +#--CharSeqProvider type CharSeqProvider <: mx.AbstractDataProvider text :: AbstractString batch_size :: Int @@ -41,10 +42,13 @@ type CharSeqProvider <: mx.AbstractDataProvider n_layer :: Int dim_hidden :: Int end +#--/CharSeqProvider function mx.get_batch_size(p :: CharSeqProvider) p.batch_size end + +#--provide function mx.provide_data(p :: CharSeqProvider) [(symbol(p.prefix, "_data_$t"), (length(p.vocab), p.batch_size)) for t = 1:p.seq_len] ∪ [(symbol(p.prefix, "_l$(l)_init_c"), (p.dim_hidden, p.batch_size)) for l=1:p.n_layer] ∪ @@ -53,7 +57,9 @@ end function mx.provide_label(p :: CharSeqProvider) [(symbol(p.prefix, "_label_$t"), (p.batch_size,)) for t = 1:p.seq_len] end +#--/provide +#--eachbatch-part1 function mx.eachbatch(p :: CharSeqProvider) data_all = [mx.zeros(shape) for (name, shape) in mx.provide_data(p)] label_all = [mx.zeros(shape) for (name, shape) in mx.provide_label(p)] @@ -62,7 +68,11 @@ function mx.eachbatch(p :: CharSeqProvider) label_jl= [copy(x) for x in label_all] batch = mx.DataBatch(data_all, label_all, p.batch_size) + #... + #--/eachbatch-part1 + #--eachbatch-part2 + #... 
function _text_iter() text = p.text @@ -96,6 +106,7 @@ function mx.eachbatch(p :: CharSeqProvider) return Task(_text_iter) end +#--/eachbatch-part2 # helper function to convert a char into index in vocabulary function char_idx(vocab :: Dict{Char,Int}, c :: Char) diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index cb19891f03b1..f96fdde1d674 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -6,9 +6,13 @@ include(joinpath(dirname(@__FILE__), "seq-data.jl")) vocab = build_vocabulary(INPUT_FILE, VOCAB_FILE) n_class = length(vocab) +#--LSTM # define LSTM -lstm = LSTM(LSTM_N_LAYER, SEQ_LENGTH, DIM_HIDDEN, DIM_EMBED, n_class, dropout=DROPOUT, name=NAME) +lstm = LSTM(LSTM_N_LAYER, SEQ_LENGTH, DIM_HIDDEN, DIM_EMBED, + n_class, dropout=DROPOUT, name=NAME) +#--/LSTM +#--data # load data text_all = readall(INPUT_FILE) len_train = round(Int, length(text_all)*DATA_TR_RATIO) @@ -19,6 +23,7 @@ data_tr = CharSeqProvider(text_tr, BATCH_SIZE, SEQ_LENGTH, vocab, NAME, LSTM_N_LAYER, DIM_HIDDEN) data_val = CharSeqProvider(text_val, BATCH_SIZE, SEQ_LENGTH, vocab, NAME, LSTM_N_LAYER, DIM_HIDDEN) +#--/data # set up training if USE_GPU @@ -27,9 +32,11 @@ else context = [mx.cpu()] end +#--train model = mx.FeedForward(lstm, context=context) optimizer = mx.ADAM(lr=BASE_LR, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, initializer=mx.UniformInitializer(0.1), callbacks=[mx.speedometer(), mx.do_checkpoint(CKPOINT_PREFIX)], eval_metric=NLL()) +#--/train diff --git a/src/io.jl b/src/io.jl index d6ba2fd3d8ce..48e0a31e32a2 100644 --- a/src/io.jl +++ b/src/io.jl @@ -58,62 +58,66 @@ and split it into mini-batches so that the model can consume the data in a unifo By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface is implemented on the provider type itself. 
But the extra layer of abstraction allows us to - implement a data provider easily via a Julia ``Task`` coroutine. - The detailed interface function is listed below: + implement a data provider easily via a Julia ``Task`` coroutine. See the + data provider defined in :doc:`the char-lstm example + ` for an example of using a coroutine to define data + providers. - .. function:: Base.eltype(provider) -> AbstractDataBatch +The detailed interface functions for the iterator API are listed below: - :param AbstractDataProvider provider: the data provider. - :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. +.. function:: Base.eltype(provider) -> AbstractDataBatch - .. function:: Base.start(provider) -> AbstractDataProviderState + :param AbstractDataProvider provider: the data provider. + :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. - :param AbstractDataProvider provider: the data provider. +.. function:: Base.start(provider) -> AbstractDataProviderState - This function is always called before iterating into the dataset. It should initialize - the iterator, reset the index, and do data shuffling if needed. + :param AbstractDataProvider provider: the data provider. - .. function:: Base.done(provider, state) -> Bool + This function is always called before iterating into the dataset. It should initialize + the iterator, reset the index, and do data shuffling if needed. - :param AbstractDataProvider provider: the data provider. - :param AbstractDataProviderState state: the state returned by :func:`Base.start` :func:`Base.next`. - :return: true if there is no more data to iterate in this dataset. +.. function:: Base.done(provider, state) -> Bool - .. function:: Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) + :param AbstractDataProvider provider: the data provider. + :param AbstractDataProviderState state: the state returned by :func:`Base.start` or :func:`Base.next`.
+ :return: true if there is no more data to iterate in this dataset. - :param AbstractDataProvider provider: the data provider. - :return: the current data batch, and the state for the next iteration. +.. function:: Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) - Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that - is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this - case, you can safely assume that + :param AbstractDataProvider provider: the data provider. + :return: the current data batch, and the state for the next iteration. - * :func:`Base.start` will always be called, and called only once before the iteration starts. - * :func:`Base.done` will always be called at the beginning of every iteration and always be called once. - * If :func:`Base.done` return true, the iteration will stop, until the next round, again, starting with - a call to :func:`Base.start`. - * :func:`Base.next` will always be called only once in each iteration. It will always be called after - one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will - not be called. +Note that sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that +is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this +case, you can safely assume that - With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation - of the built-in :class:`MXDataProvider` for example. +* :func:`Base.start` will always be called, and called only once before the iteration starts. +* :func:`Base.done` will always be called at the beginning of every iteration and always be called once. +* If :func:`Base.done` returns true, the iteration will stop, until the next round, again, starting with + a call to :func:`Base.start`.
+* :func:`Base.next` will always be called only once in each iteration. It will always be called after + one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will + not be called. - .. caution:: +With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation +of the built-in :class:`MXDataProvider` for example. - Please do not use the one data provider simultaneously in two different places, either in parallel, - or in a nested loop. For example, the behavior for the following code is undefined +.. caution:: - .. code-block:: julia + Please do not use the one data provider simultaneously in two different places, either in parallel, + or in a nested loop. For example, the behavior for the following code is undefined - for batch in data - # updating the parameters + .. code-block:: julia + + for batch in data + # updating the parameters - # now let's test the performance on the training set - for b2 in data - # ... - end - end + # now let's test the performance on the training set + for b2 in data + # ... + end + end =# abstract AbstractDataProvider @@ -162,7 +166,7 @@ abstract AbstractDataProviderState :param AbstractDataBatch batch: the data batch object. :param Base.Symbol name: the name of the data to get, should be one of the names provided in either :func:`provide_data() ` - or :func:`provide_label() `. + or :func:`provide_label() `. :return: the corresponding data array corresponding to that name. .. 
function:: load_data!(provider, batch, targets) From b595394759c377aac99fe7d986c13e14e42541cc Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 14 Nov 2015 23:43:39 -0500 Subject: [PATCH 237/630] call visualization in test --- examples/mnist/mlp-test.jl | 3 +++ 1 file changed, 3 insertions(+) diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index feabd1140a89..4931944032a9 100644 --- a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -65,6 +65,9 @@ function mnist_fit_and_predict(optimizer, initializer, n_epoch) accuracy = 100correct/length(labels) println(mx.format("Accuracy on eval set: {1:.2f}%", accuracy)) + # try to call visualization + dot_code = mx.to_graphviz(mlp) + return accuracy end From f099670c9d83c0b60d9dac9f41753dd1490e7eba Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 14 Nov 2015 23:50:41 -0500 Subject: [PATCH 238/630] prepare for v0.0.5 --- NEWS.md | 9 +++++++++ docs/conf.py | 4 ++-- 2 files changed, 11 insertions(+), 2 deletions(-) diff --git a/NEWS.md b/NEWS.md index f970f7d64703..d50bd5ed9300 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,12 @@ +# v0.0.5 (2015.11.14) + +* char-lstm example. +* Network visualization via GraphViz. +* NN-factory for common models. +* Convenient `@nd_as_jl` macro to work with `NDArray` as Julia Arrays. +* Refactoring: `Symbol` -> `SymbolicNode`. +* More evaluation metrics (@vchuravy, @Andy-P) + # v0.0.4 (2015.11.09) * ADAM optimizer (@cbecker) diff --git a/docs/conf.py b/docs/conf.py index b009877694a0..c2a405765352 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -56,9 +56,9 @@ # built documents. # # The short X.Y version. -version = '0.0.4' +version = '0.0.5' # The full version, including alpha/beta/rc tags. -release = '0.0.4' +release = '0.0.5' # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. 
From 37b48f18ac305ec6bf89d592886225d73bf26994 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Kenta=20Sato=20=28=E4=BD=90=E8=97=A4=20=E5=BB=BA=E5=A4=AA?= =?UTF-8?q?=29?= Date: Mon, 16 Nov 2015 00:55:16 +0900 Subject: [PATCH 239/630] fix the sample code in README --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index a6ae2d5cebe8..8bf867f39964 100644 --- a/README.md +++ b/README.md @@ -23,7 +23,7 @@ mlp = @mx.chain mx.Variable(:data) => # data provider batch_size = 100 -include(joinpath(Pkg.dir("MXNet"), "examples/mnist/mnist-data.jl")) +include(Pkg.dir("MXNet", "examples", "mnist", "mnist-data.jl")) train_provider, eval_provider = get_mnist_providers(batch_size) # setup model From e8ab01d26d8ab257222baabb8e4180cd14ec5aaf Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 15 Nov 2015 20:25:37 -0500 Subject: [PATCH 240/630] tweak visualization style. --- docs/tutorial/images/char-lstm-vis.svg | 1284 ++++++++++++++++++------ examples/char-lstm/.gitignore | 1 + src/visualize.jl | 34 +- 3 files changed, 1004 insertions(+), 315 deletions(-) diff --git a/docs/tutorial/images/char-lstm-vis.svg b/docs/tutorial/images/char-lstm-vis.svg index 8c5261ed7f44..cf49d097bdc7 100644 --- a/docs/tutorial/images/char-lstm-vis.svg +++ b/docs/tutorial/images/char-lstm-vis.svg @@ -4,432 +4,1114 @@ - - + + Network Visualization - + + +ptb_embed_3 + +ptb_embed_3 +FullyConnected +num-hidden=256 + + +ptb_lstm_3_i2h + +ptb_lstm_3_i2h +FullyConnected +num-hidden=1024 + + +ptb_lstm_3_i2h->ptb_embed_3 + + + + +_mul14 + +_mul14 +_Mul + + +ptb_lstm_3_i2h->_mul14 + + + -ptb_embed_2 - -ptb_embed_2 -FullyConnected -num-hidden=256 +ptb_embed_2 + +ptb_embed_2 +FullyConnected +num-hidden=256 -ptb_lstm_2_i2h - -ptb_lstm_2_i2h -FullyConnected -num-hidden=1024 +ptb_lstm_2_i2h + +ptb_lstm_2_i2h +FullyConnected +num-hidden=1024 -ptb_lstm_2_i2h->ptb_embed_2 - - +ptb_lstm_2_i2h->ptb_embed_2 + + + + +_mul8 + +_mul8 +_Mul + + +ptb_lstm_2_i2h->_mul8 + + 
-ptb_embed_1 - -ptb_embed_1 -FullyConnected -num-hidden=256 +ptb_embed_1 + +ptb_embed_1 +FullyConnected +num-hidden=256 -ptb_lstm_1_i2h - -ptb_lstm_1_i2h -FullyConnected -num-hidden=1024 +ptb_lstm_1_i2h + +ptb_lstm_1_i2h +FullyConnected +num-hidden=1024 -ptb_lstm_1_i2h->ptb_embed_1 - - +ptb_lstm_1_i2h->ptb_embed_1 + + + + +_mul2 + +_mul2 +_Mul + + +ptb_lstm_1_i2h->_mul2 + + -ptb_lstm_1_h2h - -ptb_lstm_1_h2h -FullyConnected -num-hidden=1024 +ptb_lstm_1_h2h + +ptb_lstm_1_h2h +FullyConnected +num-hidden=1024 -_plus0 - -_plus0 -_Plus +_plus0 + +_plus0 +_Plus -_plus0->ptb_lstm_1_i2h - - +_plus0->ptb_lstm_1_i2h + + -_plus0->ptb_lstm_1_h2h - - +_plus0->ptb_lstm_1_h2h + + -ptb_lstm_1_gates - -ptb_lstm_1_gates -SliceChannel +ptb_lstm_1_gates + +ptb_lstm_1_gates +SliceChannel -ptb_lstm_1_gates->_plus0 - - +ptb_lstm_1_gates->_plus0 + + + + +_plus2 + +_plus2 +_Plus + + +ptb_lstm_1_gates->_plus2 + + -activation3 - -activation3 -Activation -act-type=sigmoid +activation3 + +activation3 +Activation +act-type=sigmoid -activation3->ptb_lstm_1_gates - - +activation3->ptb_lstm_1_gates + + -activation2 - -activation2 -Activation -act-type=sigmoid +activation2 + +activation2 +Activation +act-type=sigmoid -activation2->ptb_lstm_1_gates - - +activation2->ptb_lstm_1_gates + + -_mul0 - -_mul0 -_Mul +_mul0 + +_mul0 +_Mul -_mul0->activation2 - - +_mul0->activation2 + + -activation0 - -activation0 -Activation -act-type=sigmoid +activation0 + +activation0 +Activation +act-type=sigmoid -activation0->ptb_lstm_1_gates - - +activation0->ptb_lstm_1_gates + + -activation1 - -activation1 -Activation -act-type=tanh +activation1 + +activation1 +Activation +act-type=tanh -activation1->ptb_lstm_1_gates - - +activation1->ptb_lstm_1_gates + + -_mul1 - -_mul1 -_Mul +_mul1 + +_mul1 +_Mul -_mul1->activation0 - - +_mul1->activation0 + + -_mul1->activation1 - - +_mul1->activation1 + + -_plus1 - -_plus1 -_Plus +_plus1 + +_plus1 +_Plus -_plus1->_mul0 - - +_plus1->_mul0 + + -_plus1->_mul1 - - +_plus1->_mul1 + + 
-activation4 - -activation4 -Activation -act-type=tanh +activation4 + +activation4 +Activation +act-type=tanh -activation4->_plus1 - - - - -_mul2 - -_mul2 -_Mul +activation4->_plus1 + + -_mul2->activation3 - - +_mul2->activation3 + + -_mul2->activation4 - - +_mul2->activation4 + + -ptb_lstm_2_h2h - -ptb_lstm_2_h2h -FullyConnected -num-hidden=1024 +ptb_lstm_2_h2h + +ptb_lstm_2_h2h +FullyConnected +num-hidden=1024 -ptb_lstm_2_h2h->_mul2 - - +ptb_lstm_2_h2h->_mul2 + + - -_plus2 - -_plus2 -_Plus - - -_plus2->ptb_lstm_2_i2h - - - - -_plus2->ptb_lstm_2_h2h - - + +_mul5 + +_mul5 +_Mul + + +ptb_lstm_2_h2h->_mul5 + + + + +_plus4 + +_plus4 +_Plus + + +_plus4->ptb_lstm_2_i2h + + + + +_plus4->ptb_lstm_2_h2h + + -ptb_lstm_2_gates - -ptb_lstm_2_gates -SliceChannel - - -ptb_lstm_2_gates->_plus2 - - +ptb_lstm_2_gates + +ptb_lstm_2_gates +SliceChannel + + +ptb_lstm_2_gates->_plus4 + + + + +_plus6 + +_plus6 +_Plus + + +ptb_lstm_2_gates->_plus6 + + + + +activation13 + +activation13 +Activation +act-type=sigmoid + + +activation13->ptb_lstm_2_gates + + + + +activation12 + +activation12 +Activation +act-type=sigmoid + + +activation12->ptb_lstm_2_gates + + + + +_mul6 + +_mul6 +_Mul + + +_mul6->_plus1 + + + + +_mul6->activation12 + + + + +activation10 + +activation10 +Activation +act-type=sigmoid + + +activation10->ptb_lstm_2_gates + + + + +activation11 + +activation11 +Activation +act-type=tanh + + +activation11->ptb_lstm_2_gates + + + + +_mul7 + +_mul7 +_Mul + + +_mul7->activation10 + + + + +_mul7->activation11 + + + + +_plus5 + +_plus5 +_Plus + + +_plus5->_mul6 + + + + +_plus5->_mul7 + + + + +activation14 + +activation14 +Activation +act-type=tanh + + +activation14->_plus5 + + + + +_mul8->activation13 + + + + +_mul8->activation14 + + + + +ptb_lstm_3_h2h + +ptb_lstm_3_h2h +FullyConnected +num-hidden=1024 + + +ptb_lstm_3_h2h->_mul8 + + + + +_mul11 + +_mul11 +_Mul + + +ptb_lstm_3_h2h->_mul11 + + + + +_plus8 + +_plus8 +_Plus + + +_plus8->ptb_lstm_3_i2h + + + + +_plus8->ptb_lstm_3_h2h + + + 
+ +ptb_lstm_3_gates + +ptb_lstm_3_gates +SliceChannel + + +ptb_lstm_3_gates->_plus8 + + + + +_plus10 + +_plus10 +_Plus + + +ptb_lstm_3_gates->_plus10 + + + + +activation23 + +activation23 +Activation +act-type=sigmoid + + +activation23->ptb_lstm_3_gates + + + + +activation22 + +activation22 +Activation +act-type=sigmoid + + +activation22->ptb_lstm_3_gates + + + + +_mul12 + +_mul12 +_Mul + + +_mul12->_plus5 + + + + +_mul12->activation22 + + + + +activation20 + +activation20 +Activation +act-type=sigmoid + + +activation20->ptb_lstm_3_gates + + + + +activation21 + +activation21 +Activation +act-type=tanh + + +activation21->ptb_lstm_3_gates + + + + +_mul13 + +_mul13 +_Mul + + +_mul13->activation20 + + + + +_mul13->activation21 + + + + +_plus9 + +_plus9 +_Plus + + +_plus9->_mul12 + + + + +_plus9->_mul13 + + + + +activation24 + +activation24 +Activation +act-type=tanh + + +activation24->_plus9 + + + + +_mul14->activation23 + + + + +_mul14->activation24 + + + + +_plus2->ptb_lstm_1_i2h + + + + +_plus2->ptb_lstm_1_h2h + + -activation8 - -activation8 -Activation -act-type=sigmoid +activation8 + +activation8 +Activation +act-type=sigmoid - -activation8->ptb_lstm_2_gates - - + +activation8->ptb_lstm_1_gates + + -activation7 - -activation7 -Activation -act-type=sigmoid +activation7 + +activation7 +Activation +act-type=sigmoid - -activation7->ptb_lstm_2_gates - - + +activation7->ptb_lstm_1_gates + + -_mul3 - -_mul3 -_Mul - - -_mul3->_plus1 - - +_mul3 + +_mul3 +_Mul -_mul3->activation7 - - +_mul3->activation7 + + -activation5 - -activation5 -Activation -act-type=sigmoid +activation5 + +activation5 +Activation +act-type=sigmoid - -activation5->ptb_lstm_2_gates - - + +activation5->ptb_lstm_1_gates + + -activation6 - -activation6 -Activation -act-type=tanh +activation6 + +activation6 +Activation +act-type=tanh - -activation6->ptb_lstm_2_gates - - + +activation6->ptb_lstm_1_gates + + -_mul4 - -_mul4 -_Mul +_mul4 + +_mul4 +_Mul -_mul4->activation5 - - +_mul4->activation5 + + 
-_mul4->activation6 - - +_mul4->activation6 + + -_plus3 - -_plus3 -_Plus +_plus3 + +_plus3 +_Plus -_plus3->_mul3 - - +_plus3->_mul3 + + -_plus3->_mul4 - - +_plus3->_mul4 + + -activation9 - -activation9 -Activation -act-type=tanh +activation9 + +activation9 +Activation +act-type=tanh -activation9->_plus3 - - - - -_mul5 - -_mul5 -_Mul +activation9->_plus3 + + -_mul5->activation8 - - +_mul5->activation8 + + -_mul5->activation9 - - +_mul5->activation9 + + + + +_plus6->ptb_lstm_2_i2h + + + + +_plus6->ptb_lstm_2_h2h + + + + +activation18 + +activation18 +Activation +act-type=sigmoid + + +activation18->ptb_lstm_2_gates + + + + +activation17 + +activation17 +Activation +act-type=sigmoid + + +activation17->ptb_lstm_2_gates + + + + +_mul9 + +_mul9 +_Mul + + +_mul9->_plus3 + + + + +_mul9->activation17 + + + + +activation15 + +activation15 +Activation +act-type=sigmoid + + +activation15->ptb_lstm_2_gates + + + + +activation16 + +activation16 +Activation +act-type=tanh + + +activation16->ptb_lstm_2_gates + + + + +_mul10 + +_mul10 +_Mul + + +_mul10->activation15 + + + + +_mul10->activation16 + + + + +_plus7 + +_plus7 +_Plus + + +_plus7->_mul9 + + + + +_plus7->_mul10 + + + + +activation19 + +activation19 +Activation +act-type=tanh + + +activation19->_plus7 + + + + +_mul11->activation18 + + + + +_mul11->activation19 + + + + +_plus10->ptb_lstm_3_i2h + + + + +_plus10->ptb_lstm_3_h2h + + + + +activation28 + +activation28 +Activation +act-type=sigmoid + + +activation28->ptb_lstm_3_gates + + + + +activation27 + +activation27 +Activation +act-type=sigmoid + + +activation27->ptb_lstm_3_gates + + + + +_mul15 + +_mul15 +_Mul + + +_mul15->_plus7 + + + + +_mul15->activation27 + + + + +activation25 + +activation25 +Activation +act-type=sigmoid + + +activation25->ptb_lstm_3_gates + + + + +activation26 + +activation26 +Activation +act-type=tanh + + +activation26->ptb_lstm_3_gates + + + + +_mul16 + +_mul16 +_Mul + + +_mul16->activation25 + + + + +_mul16->activation26 + + + + +_plus11 + +_plus11 
+_Plus + + +_plus11->_mul15 + + + + +_plus11->_mul16 + + + + +activation29 + +activation29 +Activation +act-type=tanh + + +activation29->_plus11 + + + + +_mul17 + +_mul17 +_Mul + + +_mul17->activation28 + + + + +_mul17->activation29 + + + + +ptb_l2_last_h + +ptb_l2_last_h +BlockGrad + + +ptb_l2_last_h->_mul17 + + -ptb_l1_last_h - -ptb_l1_last_h -BlockGrad - - -ptb_l1_last_h->_mul5 - - +ptb_l1_last_h + +ptb_l1_last_h +BlockGrad + + +ptb_l1_last_h->_mul14 + + + + +ptb_l2_last_c + +ptb_l2_last_c +BlockGrad + + +ptb_l2_last_c->_plus11 + + -ptb_l1_last_c - -ptb_l1_last_c -BlockGrad - - -ptb_l1_last_c->_plus3 - - +ptb_l1_last_c + +ptb_l1_last_c +BlockGrad + + +ptb_l1_last_c->_plus9 + + + + +ptb_pred_3 + +ptb_pred_3 +FullyConnected +num-hidden=128 + + +ptb_pred_3->_mul17 + + + + +ptb_softmax_3 + +ptb_softmax_3 +SoftmaxOutput + + +ptb_softmax_3->ptb_pred_3 + + -ptb_pred_2 - -ptb_pred_2 -FullyConnected -num-hidden=128 +ptb_pred_2 + +ptb_pred_2 +FullyConnected +num-hidden=128 - -ptb_pred_2->_mul5 - - + +ptb_pred_2->_mul11 + + -ptb_softmax_2 - -ptb_softmax_2 -SoftmaxOutput +ptb_softmax_2 + +ptb_softmax_2 +SoftmaxOutput -ptb_softmax_2->ptb_pred_2 - - +ptb_softmax_2->ptb_pred_2 + + -ptb_pred_1 - -ptb_pred_1 -FullyConnected -num-hidden=128 +ptb_pred_1 + +ptb_pred_1 +FullyConnected +num-hidden=128 - -ptb_pred_1->_mul2 - - + +ptb_pred_1->_mul5 + + -ptb_softmax_1 - -ptb_softmax_1 -SoftmaxOutput +ptb_softmax_1 + +ptb_softmax_1 +SoftmaxOutput -ptb_softmax_1->ptb_pred_1 - - +ptb_softmax_1->ptb_pred_1 + + diff --git a/examples/char-lstm/.gitignore b/examples/char-lstm/.gitignore index d8923cc201b1..a393ee67b410 100644 --- a/examples/char-lstm/.gitignore +++ b/examples/char-lstm/.gitignore @@ -3,3 +3,4 @@ vocab.dat checkpoints visualize.dot visualize.svg +visualize.png diff --git a/src/visualize.jl b/src/visualize.jl index 0b5c0c3d8e90..b1fa90ff3851 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -35,15 +35,17 @@ function to_graphviz(network :: SymbolicNode; title="Network 
Visualization", inp nodes = conf["nodes"] heads = unique([x[1]+1 for x in conf["heads"]]) node_attr = Dict(:shape => :box, :fixedsize => true, :width => 1.3, - :height => 0.8034, :style => :filled) + :height => 0.8034, :style => (:rounded, :filled), :penwidth => 2) io = IOBuffer() println(io, "digraph $(_simple_escape(title)) {") println(io, "node [fontsize=10];") println(io, "edge [fontsize=10];") # color map - cm = ("#8dd3c7", "#fb8072", "#ffffb3", "#bebada", "#80b1d3", - "#fdb462", "#b3de69", "#fccde5") + fillcolors = ("#8dd3c7", "#fb8072", "#ffffb3", "#bebada", "#80b1d3", + "#fdb462", "#b3de69", "#fccde5") + edgecolors = ("#245b51", "#941305", "#999900", "#3b3564", "#275372", + "#975102", "#597d1c", "#90094e") # make nodes for i = 1:length(nodes) @@ -57,7 +59,7 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp if i ∈ heads # heads are output nodes label = node["name"] - attr[:fillcolor] = cm[1] + colorkey = 1 else # otherwise, input nodes, might be data, label or parameters continue @@ -67,33 +69,35 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp _extract_shape(node["param"]["kernel"]), _extract_shape(node["param"]["stride"]), node["param"]["num_filter"]) - attr[:fillcolor] = cm[2] + colorkey = 2 elseif op == "FullyConnected" label = format("FullyConnected\nnum-hidden={1}", node["param"]["num_hidden"]) - attr[:fillcolor] = cm[2] + colorkey = 2 elseif op == "Activation" label = format("Activation\nact-type={1}", node["param"]["act_type"]) - attr[:fillcolor] = cm[3] + colorkey = 3 elseif op == "BatchNorm" - attr[:fillcolor] = cm[4] + colorkey = 4 elseif op == "Pooling" label = format("Pooling\ntype={1}\nkernel={2}\nstride={3}", node["param"]["pool_type"], _extract_shape(node["param"]["kernel"]), _extract_shape(node["param"]["stride"])) - attr[:fillcolor] = cm[5] + colorkey = 5 elseif op ∈ ("Concat", "Flatten", "Reshape") - attr[:fillcolor] = cm[6] + colorkey = 6 elseif endswith(op, "Output") || 
op == "BlockGrad" - attr[:fillcolor] = cm[7] + colorkey = 7 else - attr[:fillcolor] = cm[8] + colorkey = 8 end if op != "null" label = "$name\n$label" end - attr[:label] = label + attr[:fillcolor] = fillcolors[colorkey] + attr[:color] = edgecolors[colorkey] + attr[:label] = label _format_graphviz_node(io, name, attr) end @@ -110,7 +114,7 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp input_node = nodes[item[1]+1] input_name = input_node["name"] if input_node["op"] != "null" || (item[1]+1) ∈ heads - attr = Dict(:dir => :back, :arrowtail => :open) + attr = Dict(:dir => :back, :arrowtail => :open, :color => "#737373") if draw_shape if input_node["op"] != "null" key = symbol(input_name, "_output") @@ -149,6 +153,8 @@ function _format_graphviz_attr(io::IOBuffer, attrs) if isa(v, AbstractString) && v[1] == '#' # color v = _simple_escape(v) + elseif isa(v, Tuple) + v = _simple_escape(join([string(x) for x in v], ",")) end print(io, "$k=$v") end From aea096f55f85ad7fc3c21dd098436fe455af327d Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 15 Nov 2015 20:30:04 -0500 Subject: [PATCH 241/630] use a smaller network for visualization. 
--- docs/tutorial/images/char-lstm-vis.svg | 1284 ++++++------------------ examples/char-lstm/visualize.jl | 4 +- 2 files changed, 303 insertions(+), 985 deletions(-) diff --git a/docs/tutorial/images/char-lstm-vis.svg b/docs/tutorial/images/char-lstm-vis.svg index cf49d097bdc7..610abab774b7 100644 --- a/docs/tutorial/images/char-lstm-vis.svg +++ b/docs/tutorial/images/char-lstm-vis.svg @@ -4,1114 +4,432 @@ - - + + Network Visualization - - -ptb_embed_3 - -ptb_embed_3 -FullyConnected -num-hidden=256 - - -ptb_lstm_3_i2h - -ptb_lstm_3_i2h -FullyConnected -num-hidden=1024 - - -ptb_lstm_3_i2h->ptb_embed_3 - - - - -_mul14 - -_mul14 -_Mul - - -ptb_lstm_3_i2h->_mul14 - - - + -ptb_embed_2 - -ptb_embed_2 -FullyConnected -num-hidden=256 +ptb_embed_2 + +ptb_embed_2 +FullyConnected +num-hidden=256 -ptb_lstm_2_i2h - -ptb_lstm_2_i2h -FullyConnected -num-hidden=1024 +ptb_lstm_2_i2h + +ptb_lstm_2_i2h +FullyConnected +num-hidden=1024 -ptb_lstm_2_i2h->ptb_embed_2 - - - - -_mul8 - -_mul8 -_Mul - - -ptb_lstm_2_i2h->_mul8 - - +ptb_lstm_2_i2h->ptb_embed_2 + + -ptb_embed_1 - -ptb_embed_1 -FullyConnected -num-hidden=256 +ptb_embed_1 + +ptb_embed_1 +FullyConnected +num-hidden=256 -ptb_lstm_1_i2h - -ptb_lstm_1_i2h -FullyConnected -num-hidden=1024 +ptb_lstm_1_i2h + +ptb_lstm_1_i2h +FullyConnected +num-hidden=1024 -ptb_lstm_1_i2h->ptb_embed_1 - - - - -_mul2 - -_mul2 -_Mul - - -ptb_lstm_1_i2h->_mul2 - - +ptb_lstm_1_i2h->ptb_embed_1 + + -ptb_lstm_1_h2h - -ptb_lstm_1_h2h -FullyConnected -num-hidden=1024 +ptb_lstm_1_h2h + +ptb_lstm_1_h2h +FullyConnected +num-hidden=1024 -_plus0 - -_plus0 -_Plus +_plus0 + +_plus0 +_Plus -_plus0->ptb_lstm_1_i2h - - +_plus0->ptb_lstm_1_i2h + + -_plus0->ptb_lstm_1_h2h - - +_plus0->ptb_lstm_1_h2h + + -ptb_lstm_1_gates - -ptb_lstm_1_gates -SliceChannel +ptb_lstm_1_gates + +ptb_lstm_1_gates +SliceChannel -ptb_lstm_1_gates->_plus0 - - - - -_plus2 - -_plus2 -_Plus - - -ptb_lstm_1_gates->_plus2 - - +ptb_lstm_1_gates->_plus0 + + -activation3 - -activation3 -Activation 
-act-type=sigmoid +activation3 + +activation3 +Activation +act-type=sigmoid -activation3->ptb_lstm_1_gates - - +activation3->ptb_lstm_1_gates + + -activation2 - -activation2 -Activation -act-type=sigmoid +activation2 + +activation2 +Activation +act-type=sigmoid -activation2->ptb_lstm_1_gates - - +activation2->ptb_lstm_1_gates + + -_mul0 - -_mul0 -_Mul +_mul0 + +_mul0 +_Mul -_mul0->activation2 - - +_mul0->activation2 + + -activation0 - -activation0 -Activation -act-type=sigmoid +activation0 + +activation0 +Activation +act-type=sigmoid -activation0->ptb_lstm_1_gates - - +activation0->ptb_lstm_1_gates + + -activation1 - -activation1 -Activation -act-type=tanh +activation1 + +activation1 +Activation +act-type=tanh -activation1->ptb_lstm_1_gates - - +activation1->ptb_lstm_1_gates + + -_mul1 - -_mul1 -_Mul +_mul1 + +_mul1 +_Mul -_mul1->activation0 - - +_mul1->activation0 + + -_mul1->activation1 - - +_mul1->activation1 + + -_plus1 - -_plus1 -_Plus +_plus1 + +_plus1 +_Plus -_plus1->_mul0 - - +_plus1->_mul0 + + -_plus1->_mul1 - - +_plus1->_mul1 + + -activation4 - -activation4 -Activation -act-type=tanh +activation4 + +activation4 +Activation +act-type=tanh -activation4->_plus1 - - +activation4->_plus1 + + + + +_mul2 + +_mul2 +_Mul -_mul2->activation3 - - +_mul2->activation3 + + -_mul2->activation4 - - +_mul2->activation4 + + -ptb_lstm_2_h2h - -ptb_lstm_2_h2h -FullyConnected -num-hidden=1024 +ptb_lstm_2_h2h + +ptb_lstm_2_h2h +FullyConnected +num-hidden=1024 -ptb_lstm_2_h2h->_mul2 - - +ptb_lstm_2_h2h->_mul2 + + - -_mul5 - -_mul5 -_Mul - - -ptb_lstm_2_h2h->_mul5 - - - - -_plus4 - -_plus4 -_Plus - - -_plus4->ptb_lstm_2_i2h - - - - -_plus4->ptb_lstm_2_h2h - - + +_plus2 + +_plus2 +_Plus + + +_plus2->ptb_lstm_2_i2h + + + + +_plus2->ptb_lstm_2_h2h + + -ptb_lstm_2_gates - -ptb_lstm_2_gates -SliceChannel - - -ptb_lstm_2_gates->_plus4 - - - - -_plus6 - -_plus6 -_Plus - - -ptb_lstm_2_gates->_plus6 - - - - -activation13 - -activation13 -Activation -act-type=sigmoid - - 
-activation13->ptb_lstm_2_gates - - - - -activation12 - -activation12 -Activation -act-type=sigmoid - - -activation12->ptb_lstm_2_gates - - - - -_mul6 - -_mul6 -_Mul - - -_mul6->_plus1 - - - - -_mul6->activation12 - - - - -activation10 - -activation10 -Activation -act-type=sigmoid - - -activation10->ptb_lstm_2_gates - - - - -activation11 - -activation11 -Activation -act-type=tanh - - -activation11->ptb_lstm_2_gates - - - - -_mul7 - -_mul7 -_Mul - - -_mul7->activation10 - - - - -_mul7->activation11 - - - - -_plus5 - -_plus5 -_Plus - - -_plus5->_mul6 - - - - -_plus5->_mul7 - - - - -activation14 - -activation14 -Activation -act-type=tanh - - -activation14->_plus5 - - - - -_mul8->activation13 - - - - -_mul8->activation14 - - - - -ptb_lstm_3_h2h - -ptb_lstm_3_h2h -FullyConnected -num-hidden=1024 - - -ptb_lstm_3_h2h->_mul8 - - - - -_mul11 - -_mul11 -_Mul - - -ptb_lstm_3_h2h->_mul11 - - - - -_plus8 - -_plus8 -_Plus - - -_plus8->ptb_lstm_3_i2h - - - - -_plus8->ptb_lstm_3_h2h - - - - -ptb_lstm_3_gates - -ptb_lstm_3_gates -SliceChannel - - -ptb_lstm_3_gates->_plus8 - - - - -_plus10 - -_plus10 -_Plus - - -ptb_lstm_3_gates->_plus10 - - - - -activation23 - -activation23 -Activation -act-type=sigmoid - - -activation23->ptb_lstm_3_gates - - - - -activation22 - -activation22 -Activation -act-type=sigmoid - - -activation22->ptb_lstm_3_gates - - - - -_mul12 - -_mul12 -_Mul - - -_mul12->_plus5 - - - - -_mul12->activation22 - - - - -activation20 - -activation20 -Activation -act-type=sigmoid - - -activation20->ptb_lstm_3_gates - - - - -activation21 - -activation21 -Activation -act-type=tanh - - -activation21->ptb_lstm_3_gates - - - - -_mul13 - -_mul13 -_Mul - - -_mul13->activation20 - - - - -_mul13->activation21 - - - - -_plus9 - -_plus9 -_Plus - - -_plus9->_mul12 - - - - -_plus9->_mul13 - - - - -activation24 - -activation24 -Activation -act-type=tanh - - -activation24->_plus9 - - - - -_mul14->activation23 - - - - -_mul14->activation24 - - - - -_plus2->ptb_lstm_1_i2h - - - - 
-_plus2->ptb_lstm_1_h2h - - +ptb_lstm_2_gates + +ptb_lstm_2_gates +SliceChannel + + +ptb_lstm_2_gates->_plus2 + + -activation8 - -activation8 -Activation -act-type=sigmoid +activation8 + +activation8 +Activation +act-type=sigmoid - -activation8->ptb_lstm_1_gates - - + +activation8->ptb_lstm_2_gates + + -activation7 - -activation7 -Activation -act-type=sigmoid +activation7 + +activation7 +Activation +act-type=sigmoid - -activation7->ptb_lstm_1_gates - - + +activation7->ptb_lstm_2_gates + + -_mul3 - -_mul3 -_Mul +_mul3 + +_mul3 +_Mul + + +_mul3->_plus1 + + -_mul3->activation7 - - +_mul3->activation7 + + -activation5 - -activation5 -Activation -act-type=sigmoid +activation5 + +activation5 +Activation +act-type=sigmoid - -activation5->ptb_lstm_1_gates - - + +activation5->ptb_lstm_2_gates + + -activation6 - -activation6 -Activation -act-type=tanh +activation6 + +activation6 +Activation +act-type=tanh - -activation6->ptb_lstm_1_gates - - + +activation6->ptb_lstm_2_gates + + -_mul4 - -_mul4 -_Mul +_mul4 + +_mul4 +_Mul -_mul4->activation5 - - +_mul4->activation5 + + -_mul4->activation6 - - +_mul4->activation6 + + -_plus3 - -_plus3 -_Plus +_plus3 + +_plus3 +_Plus -_plus3->_mul3 - - +_plus3->_mul3 + + -_plus3->_mul4 - - +_plus3->_mul4 + + -activation9 - -activation9 -Activation -act-type=tanh +activation9 + +activation9 +Activation +act-type=tanh -activation9->_plus3 - - +activation9->_plus3 + + + + +_mul5 + +_mul5 +_Mul -_mul5->activation8 - - +_mul5->activation8 + + -_mul5->activation9 - - - - -_plus6->ptb_lstm_2_i2h - - - - -_plus6->ptb_lstm_2_h2h - - - - -activation18 - -activation18 -Activation -act-type=sigmoid - - -activation18->ptb_lstm_2_gates - - - - -activation17 - -activation17 -Activation -act-type=sigmoid - - -activation17->ptb_lstm_2_gates - - - - -_mul9 - -_mul9 -_Mul - - -_mul9->_plus3 - - - - -_mul9->activation17 - - - - -activation15 - -activation15 -Activation -act-type=sigmoid - - -activation15->ptb_lstm_2_gates - - - - -activation16 - -activation16 
-Activation -act-type=tanh - - -activation16->ptb_lstm_2_gates - - - - -_mul10 - -_mul10 -_Mul - - -_mul10->activation15 - - - - -_mul10->activation16 - - - - -_plus7 - -_plus7 -_Plus - - -_plus7->_mul9 - - - - -_plus7->_mul10 - - - - -activation19 - -activation19 -Activation -act-type=tanh - - -activation19->_plus7 - - - - -_mul11->activation18 - - - - -_mul11->activation19 - - - - -_plus10->ptb_lstm_3_i2h - - - - -_plus10->ptb_lstm_3_h2h - - - - -activation28 - -activation28 -Activation -act-type=sigmoid - - -activation28->ptb_lstm_3_gates - - - - -activation27 - -activation27 -Activation -act-type=sigmoid - - -activation27->ptb_lstm_3_gates - - - - -_mul15 - -_mul15 -_Mul - - -_mul15->_plus7 - - - - -_mul15->activation27 - - - - -activation25 - -activation25 -Activation -act-type=sigmoid - - -activation25->ptb_lstm_3_gates - - - - -activation26 - -activation26 -Activation -act-type=tanh - - -activation26->ptb_lstm_3_gates - - - - -_mul16 - -_mul16 -_Mul - - -_mul16->activation25 - - - - -_mul16->activation26 - - - - -_plus11 - -_plus11 -_Plus - - -_plus11->_mul15 - - - - -_plus11->_mul16 - - - - -activation29 - -activation29 -Activation -act-type=tanh - - -activation29->_plus11 - - - - -_mul17 - -_mul17 -_Mul - - -_mul17->activation28 - - - - -_mul17->activation29 - - - - -ptb_l2_last_h - -ptb_l2_last_h -BlockGrad - - -ptb_l2_last_h->_mul17 - - +_mul5->activation9 + + -ptb_l1_last_h - -ptb_l1_last_h -BlockGrad - - -ptb_l1_last_h->_mul14 - - - - -ptb_l2_last_c - -ptb_l2_last_c -BlockGrad - - -ptb_l2_last_c->_plus11 - - +ptb_l1_last_h + +ptb_l1_last_h +BlockGrad + + +ptb_l1_last_h->_mul5 + + -ptb_l1_last_c - -ptb_l1_last_c -BlockGrad - - -ptb_l1_last_c->_plus9 - - - - -ptb_pred_3 - -ptb_pred_3 -FullyConnected -num-hidden=128 - - -ptb_pred_3->_mul17 - - - - -ptb_softmax_3 - -ptb_softmax_3 -SoftmaxOutput - - -ptb_softmax_3->ptb_pred_3 - - +ptb_l1_last_c + +ptb_l1_last_c +BlockGrad + + +ptb_l1_last_c->_plus3 + + -ptb_pred_2 - -ptb_pred_2 -FullyConnected 
-num-hidden=128 +ptb_pred_2 + +ptb_pred_2 +FullyConnected +num-hidden=128 - -ptb_pred_2->_mul11 - - + +ptb_pred_2->_mul5 + + -ptb_softmax_2 - -ptb_softmax_2 -SoftmaxOutput +ptb_softmax_2 + +ptb_softmax_2 +SoftmaxOutput -ptb_softmax_2->ptb_pred_2 - - +ptb_softmax_2->ptb_pred_2 + + -ptb_pred_1 - -ptb_pred_1 -FullyConnected -num-hidden=128 +ptb_pred_1 + +ptb_pred_1 +FullyConnected +num-hidden=128 - -ptb_pred_1->_mul5 - - + +ptb_pred_1->_mul2 + + -ptb_softmax_1 - -ptb_softmax_1 -SoftmaxOutput +ptb_softmax_1 + +ptb_softmax_1 +SoftmaxOutput -ptb_softmax_1->ptb_pred_1 - - +ptb_softmax_1->ptb_pred_1 + + diff --git a/examples/char-lstm/visualize.jl b/examples/char-lstm/visualize.jl index 336afea30705..acf757515005 100644 --- a/examples/char-lstm/visualize.jl +++ b/examples/char-lstm/visualize.jl @@ -3,8 +3,8 @@ include(joinpath(dirname(@__FILE__), "lstm.jl")) using MXNet -vis_n_layer = 2 -vis_seq_len = 3 +vis_n_layer = 1 +vis_seq_len = 2 vis_n_class = 128 lstm = LSTM(vis_n_layer, vis_seq_len, DIM_HIDDEN, DIM_EMBED, vis_n_class, name=NAME, output_states=true) From 4f094406ff1aa4950843413cec716050421cfb19 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Mon, 16 Nov 2015 16:32:31 +0900 Subject: [PATCH 242/630] implements variants of Xaiver They are several different Xaiver variants used and it is not quite clear if there is a "correct" one. Different variants can be chosen by the combinations of a uniform or normal distribution with a specific calculation of the variance. Currently implemented are different variants from Caffe, the original one by Bengio and Glorot and the one by K. He et. al 2015 (called msra in Caffe). The current default is the one used by the Python interface to MXNet (3 / (in+out)). 
implement several variants of xaiver rewrite xaiver to use enums --- src/initializer.jl | 52 +++++++++++++++++++++++++++++++++++++++++++--- 1 file changed, 49 insertions(+), 3 deletions(-) diff --git a/src/initializer.jl b/src/initializer.jl index 8f78bfba9367..6a941610e1cd 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -104,14 +104,60 @@ end The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding the difficulty of training deep feedforward neuralnetworks*. + + There are several different version of the XaiverInitializer used in the wild. + The general idea is that the variance of the initialization distribution is controlled + by the dimensionality of the input and output. As a distribution one can either choose + a normal distribution with μ = 0 and σ² or a uniform distribution from -σ to σ. + + Several different ways of calculating the variance are given in the literature or are + used by various libraries. + + - original [Bengio and Glorot 2010]: σ² = 2 / (in + out) + - msra [K. He, X. Zhang, S. Ren, and J. Sun 2015]: σ² = 2 / in + - caffe_avg: 6 / (in + out) + - caffe_in: 3 / in + - caffe_out: 3 / out + - mxnet: 3 / (in + out) + + Distribution and variant can be chosen by enums (prefixed by xv_). + As an example take mx.XaiverInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet), + which is currently the default. 
=# + +@enum XaiverDistribution xv_uniform xv_normal +@enum XaiverVariant xv_original xv_mrsa xv_caffe_avg xv_caffe_in zv_caffe_out xv_mxnet + immutable XaiverInitializer <: AbstractInitializer + distribution :: XaiverDistribution + variant :: XaiverVariant end +XaiverInitializer(; distribution = xv_uniform, variant = xv_mxnet) = XaiverInitializer(distribution, variant) -function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) +function _init_weight(self :: XaiverInitializer, name :: Base.Symbol, array :: NDArray) dims = size(array) fan_in = prod(dims[2:end]) fan_out = dims[1] - scale = sqrt(3 / (fan_in + fan_out)) - rand!(-scale, scale, array) + + if self.distribution == xv_uniform + func(σ, data) = rand!(-σ, σ, data) + elseif self.distribution == xv_normal + func(σ, data) = randn!(0.0, σ, data) + end + + if self.variant == xv_caffe_avg + var = 6 / (fan_in + fan_out) + elseif self.variant == xv_caffe_in + var = 3 / fan_in + elseif self.variant == xv_caffe_out + var = 3 / fan_out + elseif self.variant == xv_mrsa + var = 2 / fan_in + elseif self.variant == xv_original + var = 2 / (fan_in + fan_out) + elseif self.variant == xv_mxnet + var = 3 / (fan_in + fan_out) + end + + func(√var, array) end From 89cf70d996339190e440f882c4c8779dbb8d6441 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 16 Nov 2015 23:38:05 -0500 Subject: [PATCH 243/630] update doc --- docs/api/initializer.rst | 19 +++++++++++++++++++ src/initializer.jl | 6 +++--- 2 files changed, 22 insertions(+), 3 deletions(-) diff --git a/docs/api/initializer.rst b/docs/api/initializer.rst index 3f4126721542..94a60e4021b0 100644 --- a/docs/api/initializer.rst +++ b/docs/api/initializer.rst @@ -65,5 +65,24 @@ Built-in initializers The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding the difficulty of training deep feedforward neuralnetworks*. + There are several different version of the XaiverInitializer used in the wild. 
+ The general idea is that the variance of the initialization distribution is controlled + by the dimensionality of the input and output. As a distribution one can either choose + a normal distribution with μ = 0 and σ² or a uniform distribution from -σ to σ. + + Several different ways of calculating the variance are given in the literature or are + used by various libraries. + + - original [Bengio and Glorot 2010]: σ² = 2 / (in + out) + - msra [K. He, X. Zhang, S. Ren, and J. Sun 2015]: σ² = 2 / in + - caffe_avg: 6 / (in + out) + - caffe_in: 3 / in + - caffe_out: 3 / out + - mxnet: 3 / (in + out) + + Distribution and variant can be chosen by enums (prefixed by ``xv_``). + As an example take ``mx.XaiverInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet)``, + which is currently the default. + diff --git a/src/initializer.jl b/src/initializer.jl index 6a941610e1cd..2fac334448a5 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -112,7 +112,7 @@ end Several different ways of calculating the variance are given in the literature or are used by various libraries. - + - original [Bengio and Glorot 2010]: σ² = 2 / (in + out) - msra [K. He, X. Zhang, S. Ren, and J. Sun 2015]: σ² = 2 / in - caffe_avg: 6 / (in + out) @@ -120,8 +120,8 @@ end - caffe_out: 3 / out - mxnet: 3 / (in + out) - Distribution and variant can be chosen by enums (prefixed by xv_). - As an example take mx.XaiverInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet), + Distribution and variant can be chosen by enums (prefixed by ``xv_``). + As an example take ``mx.XaiverInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet)``, which is currently the default. 
=# From 1a935deed153622e357ac90ae5ab159c5c08f978 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 17 Nov 2015 15:00:38 +0900 Subject: [PATCH 244/630] rename Xaiver to Xavier --- src/initializer.jl | 20 ++++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/src/initializer.jl b/src/initializer.jl index 2fac334448a5..01744a760448 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -100,12 +100,12 @@ function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: N end #=doc -.. class:: XaiverInitializer +.. class:: XavierInitializer The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding the difficulty of training deep feedforward neuralnetworks*. - There are several different version of the XaiverInitializer used in the wild. + There are several different version of the XavierInitializer used in the wild. The general idea is that the variance of the initialization distribution is controlled by the dimensionality of the input and output. As a distribution one can either choose a normal distribution with μ = 0 and σ² or a uniform distribution from -σ to σ. @@ -121,20 +121,20 @@ end - mxnet: 3 / (in + out) Distribution and variant can be chosen by enums (prefixed by ``xv_``). - As an example take ``mx.XaiverInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet)``, + As an example take ``mx.XavierInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet)``, which is currently the default. 
=# -@enum XaiverDistribution xv_uniform xv_normal -@enum XaiverVariant xv_original xv_mrsa xv_caffe_avg xv_caffe_in zv_caffe_out xv_mxnet +@enum XavierDistribution xv_uniform xv_normal +@enum XavierVariant xv_original xv_mrsa xv_caffe_avg xv_caffe_in zv_caffe_out xv_mxnet -immutable XaiverInitializer <: AbstractInitializer - distribution :: XaiverDistribution - variant :: XaiverVariant +immutable XavierInitializer <: AbstractInitializer + distribution :: XavierDistribution + variant :: XavierVariant end -XaiverInitializer(; distribution = xv_uniform, variant = xv_mxnet) = XaiverInitializer(distribution, variant) +XavierInitializer(; distribution = xv_uniform, variant = xv_mxnet) = XavierInitializer(distribution, variant) -function _init_weight(self :: XaiverInitializer, name :: Base.Symbol, array :: NDArray) +function _init_weight(self :: XavierInitializer, name :: Base.Symbol, array :: NDArray) dims = size(array) fan_in = prod(dims[2:end]) fan_out = dims[1] From 5dd866466158b18731461010a3e5cbb5c5f5d0a0 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 17 Nov 2015 15:01:33 +0900 Subject: [PATCH 245/630] rebuild docs --- docs/api/initializer.rst | 6 +++--- docs/api/io.rst | 4 ++-- docs/api/symbolic-node.rst | 2 +- 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/docs/api/initializer.rst b/docs/api/initializer.rst index 94a60e4021b0..30b2df35664a 100644 --- a/docs/api/initializer.rst +++ b/docs/api/initializer.rst @@ -60,12 +60,12 @@ Built-in initializers -.. class:: XaiverInitializer +.. class:: XavierInitializer The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding the difficulty of training deep feedforward neuralnetworks*. - There are several different version of the XaiverInitializer used in the wild. + There are several different version of the XavierInitializer used in the wild. The general idea is that the variance of the initialization distribution is controlled by the dimensionality of the input and output. 
As a distribution one can either choose a normal distribution with μ = 0 and σ² or a uniform distribution from -σ to σ. @@ -81,7 +81,7 @@ Built-in initializers - mxnet: 3 / (in + out) Distribution and variant can be chosen by enums (prefixed by ``xv_``). - As an example take ``mx.XaiverInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet)``, + As an example take ``mx.XavierInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet)``, which is currently the default. diff --git a/docs/api/io.rst b/docs/api/io.rst index f1ab959be6f2..6186db52ecc1 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -324,7 +324,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -467,7 +467,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :return: the constructed :class:`MXDataProvider`. diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 78e359537ec3..d847c6a8bd38 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -186,7 +186,7 @@ Public APIs :param momentum: Momentum for moving average - :type momentum: float, optional, default=0.1 + :type momentum: float, optional, default=0.9 :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
From 5b0e1acbeab508bc3e41a787eb91a24c580f02b8 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 18 Nov 2015 18:39:35 -0500 Subject: [PATCH 246/630] remove grad_scale parameter from optimizers (duplicated with lr) --- docs/build-api.jl | 2 +- src/optimizer.jl | 2 +- src/optimizers/adam.jl | 20 +++++++++++++++++++- src/optimizers/sgd.jl | 20 +++++++++++++++++++- 4 files changed, 40 insertions(+), 4 deletions(-) diff --git a/docs/build-api.jl b/docs/build-api.jl index 53ca9f6f7ca1..c8e54677096f 100644 --- a/docs/build-api.jl +++ b/docs/build-api.jl @@ -88,7 +88,7 @@ extract_doc("initializer.rst", "initializer.jl") extract_doc("callback.rst", "callback.jl") extract_doc("model.rst", "model.jl") -extract_doc("optimizer.rst", "optimizer.jl") +extract_doc("optimizer.rst", "optimizer.jl", "optimizers/sgd.jl", "optimizers/adam.jl") extract_doc("metric.rst", "metric.jl") extract_doc("io.rst", "io.jl") diff --git a/src/optimizer.jl b/src/optimizer.jl index a5f0bfd5ec60..0a3f23bc96ba 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -211,7 +211,7 @@ abstract AbstractOptimizerOptions =# function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState, weight::NDArray, grad::NDArray) - grad_scale = opts.grad_scale / state.batch_size + grad_scale = 1.0 / state.batch_size grad = grad_scale * grad if opts.grad_clip > 0 diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index d8d1d2377836..95eaefe275a1 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -1,6 +1,5 @@ @defstruct ADAMOptions AbstractOptimizerOptions ( (lr :: Real = 0.001, lr > 0), - (grad_scale :: Real = 1.0, grad_scale >= 0), (grad_clip :: Real = 0, grad_clip >= 0), (weight_decay :: Real = 0.00001, weight_decay >= 0), (beta1 :: Real = 0.9, beta1 > 0), @@ -9,7 +8,26 @@ lr_scheduler :: Any = nothing ) +#=doc +.. class:: ADAM + The solver described in Diederik Kingma, Jimmy Ba: *Adam: A Method for + Stochastic Optimization*. arXiv:1412.6980 [cs.LG]. + + .. 
function:: ADAM(; kwargs...) + + :param Real lr: default `0.001`, learning rate. + :param AbstractLearningRateScheduler lr_scheduler: default `nothing`, a + dynamic learning rate scheduler. If set, will overwrite the `lr` + parameter. + :param Real beta1: default `0.9`. + :param Real beta2: default `0.999`. + :param Real epsilon: default `1e-8`. + :param Real grad_clip: default `0`, if positive, will clip the gradient + into the range `[-grad_clip, grad_clip]`. + :param Real weight_decay: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. +=# type ADAM <: AbstractOptimizer opts :: ADAMOptions state :: OptimizationState diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index 84ea55f40f11..f3d1b10a66e4 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -1,14 +1,32 @@ @defstruct SGDOptions AbstractOptimizerOptions ( (lr :: Real = 0.01, lr > 0), (momentum :: Real = 0.0, momentum >= 0), - (grad_scale :: Real = 1.0, grad_scale >= 0), (grad_clip :: Real = 0, grad_clip >= 0), (weight_decay :: Real = 0.0001, weight_decay >= 0), lr_scheduler :: Any = nothing, momentum_scheduler :: Any = nothing ) +#=doc +.. class:: SGD + Stochastic gradient descent optimizer. + + .. function:: SGD(; kwargs...) + + :param Real lr: default `0.01`, learning rate. + :param AbstractLearningRateScheduler lr_scheduler: default `nothing`, a + dynamic learning rate scheduler. If set, will overwrite the `lr` + parameter. + :param Real momentum: default `0.0`, the momentum. + :param AbstractMomentumScheduler momentum_scheduler: default `nothing`, + a dynamic momentum scheduler. If set, will overwrite the `momentum` + parameter. + :param Real grad_clip: default `0`, if positive, will clip the gradient + into the bounded range `[-grad_clip, grad_clip]`. + :param Real weight_decay: default `0.0001`, weight decay is equivalent to + adding a global l2 regularizer to the parameters. 
+=# type SGD <: AbstractOptimizer opts :: SGDOptions state :: OptimizationState From 4fc66b4d5711aab1f8e3b131109ecdcc46dd11e6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 18 Nov 2015 18:40:08 -0500 Subject: [PATCH 247/630] update documents for optimizers --- docs/api/io.rst | 4 ++-- docs/api/optimizer.rst | 44 ++++++++++++++++++++++++++++++++++++++ docs/api/symbolic-node.rst | 2 +- 3 files changed, 47 insertions(+), 3 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index 6186db52ecc1..f1ab959be6f2 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -324,7 +324,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -467,7 +467,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :return: the constructed :class:`MXDataProvider`. diff --git a/docs/api/optimizer.rst b/docs/api/optimizer.rst index bc45cf1744ac..12e898d233b5 100644 --- a/docs/api/optimizer.rst +++ b/docs/api/optimizer.rst @@ -139,3 +139,47 @@ Built-in optimizers + +.. class:: SGD + + Stochastic gradient descent optimizer. + + .. function:: SGD(; kwargs...) + + :param Real lr: default `0.01`, learning rate. + :param AbstractLearningRateScheduler lr_scheduler: default `nothing`, a + dynamic learning rate scheduler. If set, will overwrite the `lr` + parameter. + :param Real momentum: default `0.0`, the momentum. + :param AbstractMomentumScheduler momentum_scheduler: default `nothing`, + a dynamic momentum scheduler. If set, will overwrite the `momentum` + parameter. + :param Real grad_clip: default `0`, if positive, will clip the gradient + into the bounded range `[-grad_clip, grad_clip]`. 
+ :param Real weight_decay: default `0.0001`, weight decay is equivalent to + adding a global l2 regularizer to the parameters. + + + + +.. class:: ADAM + + The solver described in Diederik Kingma, Jimmy Ba: *Adam: A Method for + Stochastic Optimization*. arXiv:1412.6980 [cs.LG]. + + .. function:: ADAM(; kwargs...) + + :param Real lr: default `0.001`, learning rate. + :param AbstractLearningRateScheduler lr_scheduler: default `nothing`, a + dynamic learning rate scheduler. If set, will overwrite the `lr` + parameter. + :param Real beta1: default `0.9`. + :param Real beta2: default `0.999`. + :param Real epsilon: default `1e-8`. + :param Real grad_clip: default `0`, if positive, will clip the gradient + into the range `[-grad_clip, grad_clip]`. + :param Real weight_decay: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. + + + diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index d847c6a8bd38..78e359537ec3 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -186,7 +186,7 @@ Public APIs :param momentum: Momentum for moving average - :type momentum: float, optional, default=0.9 + :type momentum: float, optional, default=0.1 :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
From 884c7f84065e0d8d96e7696079c431fe86936308 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 19 Nov 2015 12:17:37 -0500 Subject: [PATCH 248/630] more arithmetic operations on symbolic nodes --- docs/api/symbolic-node.rst | 37 ++++++++++++++++++- src/symbolic-node.jl | 75 ++++++++++++++++++++++++++++++++++---- test/unittest/operator.jl | 36 ++++++++++++++++++ 3 files changed, 139 insertions(+), 9 deletions(-) create mode 100644 test/unittest/operator.jl diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 78e359537ec3..30420da31f13 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -186,7 +186,7 @@ Public APIs :param momentum: Momentum for moving average - :type momentum: float, optional, default=0.1 + :type momentum: float, optional, default=0.9 :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. @@ -872,6 +872,41 @@ Internal APIs +.. function:: _Power(...) + + Perform an elementwise power. + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: _PowerScalar(...) + + Perform an elementwise power. + + :param array: Input array operand to the operation. + :type array: SymbolicNode + + + :param scalar: scalar value. + :type scalar: float, required + + + :param scalar_on_right: scalar operand is on the right. + :type scalar_on_right: boolean, optional, default=False + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 0b7385ffa1a7..c1b604432718 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -250,16 +250,26 @@ function Base.getindex(self :: SymbolicNode, idx :: Int) end import Base: +, .+ -function +(self :: SymbolicNode, args :: SymbolicNode...) 
+function +(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) ret = self for arg in args - ret = _Plus(ret, arg) + if isa(arg, SymbolicNode) + ret = _Plus(ret, arg) + else + ret = _PlusScalar(ret, scalar=MX_float(arg)) + end end ret end -function .+(self :: SymbolicNode, args :: SymbolicNode...) +function .+(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) +(self, args...) end +function +(s1 :: Real, self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) + +(self, s1, args...) +end +function .+(s1 :: Real, self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) + +(self, s1, args...) +end import Base: -, .- function -(self :: SymbolicNode, arg :: SymbolicNode) @@ -268,20 +278,70 @@ end function .-(self :: SymbolicNode, arg :: SymbolicNode) -(self, arg) end +function -(self :: SymbolicNode, arg :: Real) + _MinusScalar(self, scalar=MX_float(arg)) +end +function .-(self :: SymbolicNode, arg :: Real) + -(self, arg) +end -import Base: .* -function .*(self :: SymbolicNode, args :: SymbolicNode...) +function -(arg :: Real, self :: SymbolicNode) + _MinusScalar(self, scalar=arg, scalar_on_right=true) +end +function .-(arg :: Real, self :: SymbolicNode) + -(arg, self) +end + +function -(self :: SymbolicNode) + -(0, self) +end + +import Base: .*, * +function .*(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) ret = self for arg in args - ret = _Mul(ret, arg) + if isa(arg, SymbolicNode) + ret = _Mul(ret, arg) + else + ret = _MulScalar(ret, scalar=MX_float(arg)) + end end ret end +function .*(arg :: Real, self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) + .*(self, arg, args...) 
+end +function *(arg :: Real, self :: SymbolicNode) + _MulScalar(self, scalar=arg) +end +function *(self :: SymbolicNode, arg :: Real) + *(arg, self) +end -import Base: ./ +import Base: ./, / function ./(self :: SymbolicNode, arg :: SymbolicNode) _Div(self, arg) end +function ./(self :: SymbolicNode, arg :: Real) + _DivScalar(self, scalar=MX_float(arg)) +end +function /(self :: SymbolicNode, arg :: Real) + ./(self, arg) +end +function ./(arg :: Real, self :: SymbolicNode) + _DivScalar(self, scalar=arg, scalar_on_right=true) +end + +import Base: .^, ^ +function .^(self :: SymbolicNode, pow :: SymbolicNode) + _Power(self, pow) +end +function .^(self :: SymbolicNode, pow :: AbstractFloat) + _PowerScalar(self, scalar=pow) +end +function ^(self :: SymbolicNode, pow :: AbstractFloat) + .^(self, pow) +end function _compose!(node :: SymbolicNode; kwargs...) name = char_p(0) @@ -519,4 +579,3 @@ macro chain(layers) end return Expr(:block, exprs...) end - diff --git a/test/unittest/operator.jl b/test/unittest/operator.jl new file mode 100644 index 000000000000..2284b1080c7e --- /dev/null +++ b/test/unittest/operator.jl @@ -0,0 +1,36 @@ +module TestOperator +using MXNet +using Base.Test + +using ..Main: rand_dims, reldiff + +function test_scalar_op() + data = mx.Variable(:data) + shape = rand_dims() + info("Operator::scalar_op::dims = $shape") + + data_jl = 5ones(shape) + arr_data = mx.copy(data_jl, mx.cpu()) + arr_grad = mx.zeros(shape) + + test = 2 ./ (4 - ((1+data+1)*2/5) - 0.2) + exec_test = mx.bind(test, mx.cpu(), [arr_data], args_grad=[arr_grad]) + mx.forward(exec_test) + out = copy(exec_test.outputs[1]) + jl_out1 = (4 - ((1+data_jl+1)*2/5) - 0.2) + jl_out = 2 ./ jl_out1 + @test reldiff(copy(out), jl_out) < 1e-6 + + out_grad = 2mx.ones(shape) + jl_grad = 2copy(out_grad) / 5 + jl_grad = 2jl_grad ./ (jl_out1 .^ 2) + mx.backward(exec_test, out_grad) + @test reldiff(copy(arr_grad), jl_grad) < 1e-6 +end + 
+################################################################################ +# Run tests +################################################################################ +test_scalar_op() + +end From 62c97032a7ffddc066ce4ab94cddb32f4dbffa09 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 19 Nov 2015 09:44:19 +0900 Subject: [PATCH 249/630] rework Xavier to be more flexible --- src/initializer.jl | 43 +++++++++++++++++-------------------------- 1 file changed, 17 insertions(+), 26 deletions(-) diff --git a/src/initializer.jl b/src/initializer.jl index 01744a760448..8263c06ba496 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -113,26 +113,21 @@ end Several different ways of calculating the variance are given in the literature or are used by various libraries. - - original [Bengio and Glorot 2010]: σ² = 2 / (in + out) - - msra [K. He, X. Zhang, S. Ren, and J. Sun 2015]: σ² = 2 / in - - caffe_avg: 6 / (in + out) - - caffe_in: 3 / in - - caffe_out: 3 / out - - mxnet: 3 / (in + out) - - Distribution and variant can be chosen by enums (prefixed by ``xv_``). - As an example take ``mx.XavierInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet)``, - which is currently the default. + - [Bengio and Glorot 2010]: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1)`` + - [K. He, X. Zhang, S. Ren, and J. 
Sun 2015]: ``mx.XavierInitializer(distribution = mx.xv_gaussian, regularization = mx.xv_in, magnitude = 2)`` + - caffe_avg: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 3)`` =# @enum XavierDistribution xv_uniform xv_normal -@enum XavierVariant xv_original xv_mrsa xv_caffe_avg xv_caffe_in zv_caffe_out xv_mxnet +@enum XavierRegularization xv_avg xv_in xv_out immutable XavierInitializer <: AbstractInitializer distribution :: XavierDistribution - variant :: XavierVariant + regularization :: XavierRegularization + magnitude :: Float64 end -XavierInitializer(; distribution = xv_uniform, variant = xv_mxnet) = XavierInitializer(distribution, variant) + +XavierInitializer(; distribution = xv_uniform, regularization = xv_avg, magnitude = 3.0) = XavierInitializer(distribution, regularization, magnitude) function _init_weight(self :: XavierInitializer, name :: Base.Symbol, array :: NDArray) dims = size(array) @@ -145,19 +140,15 @@ function _init_weight(self :: XavierInitializer, name :: Base.Symbol, array :: N func(σ, data) = randn!(0.0, σ, data) end - if self.variant == xv_caffe_avg - var = 6 / (fan_in + fan_out) - elseif self.variant == xv_caffe_in - var = 3 / fan_in - elseif self.variant == xv_caffe_out - var = 3 / fan_out - elseif self.variant == xv_mrsa - var = 2 / fan_in - elseif self.variant == xv_original - var = 2 / (fan_in + fan_out) - elseif self.variant == xv_mxnet - var = 3 / (fan_in + fan_out) + if self.regularization == xv_avg + factor = (fan_in + fan_out) / 2 + elseif self.regularization == xv_in + factor = fan_in + elseif self.regularization == xv_out + factor = fan_out end - func(√var, array) + σ = √(self.magnitude / factor) + + func(σ, array) end From 6081fcec039131d24aa0b38fd00bfcf92007e864 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 20 Nov 2015 17:54:08 +0900 Subject: [PATCH 250/630] xavier: rebuild documentation --- docs/api/initializer.rst | 13 +++---------- docs/api/io.rst | 4 ++-- 
docs/api/symbolic-node.rst | 35 ----------------------------------- 3 files changed, 5 insertions(+), 47 deletions(-) diff --git a/docs/api/initializer.rst b/docs/api/initializer.rst index 30b2df35664a..7123507f7ee9 100644 --- a/docs/api/initializer.rst +++ b/docs/api/initializer.rst @@ -73,16 +73,9 @@ Built-in initializers Several different ways of calculating the variance are given in the literature or are used by various libraries. - - original [Bengio and Glorot 2010]: σ² = 2 / (in + out) - - msra [K. He, X. Zhang, S. Ren, and J. Sun 2015]: σ² = 2 / in - - caffe_avg: 6 / (in + out) - - caffe_in: 3 / in - - caffe_out: 3 / out - - mxnet: 3 / (in + out) - - Distribution and variant can be chosen by enums (prefixed by ``xv_``). - As an example take ``mx.XavierInitializer(distribution = mx.xv_normal, variant = mx.xv_mxnet)``, - which is currently the default. + - [Bengio and Glorot 2010]: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1)`` + - [K. He, X. Zhang, S. Ren, and J. Sun 2015]: ``mx.XavierInitializer(distribution = mx.xv_gaussian, regularization = mx.xv_in, magnitude = 2)`` + - caffe_avg: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 3)`` diff --git a/docs/api/io.rst b/docs/api/io.rst index f1ab959be6f2..6186db52ecc1 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -324,7 +324,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -467,7 +467,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :return: the constructed :class:`MXDataProvider`. 
diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 30420da31f13..d847c6a8bd38 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -872,41 +872,6 @@ Internal APIs -.. function:: _Power(...) - - Perform an elementwise power. - - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - - :return: the constructed :class:`SymbolicNode`. - - - - - -.. function:: _PowerScalar(...) - - Perform an elementwise power. - - :param array: Input array operand to the operation. - :type array: SymbolicNode - - - :param scalar: scalar value. - :type scalar: float, required - - - :param scalar_on_right: scalar operand is on the right. - :type scalar_on_right: boolean, optional, default=False - - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - - :return: the constructed :class:`SymbolicNode`. - - - - - From 56f3eef1b9f8d6c4c37a83e2500d0bd8ac4e59c5 Mon Sep 17 00:00:00 2001 From: yeesian Date: Fri, 20 Nov 2015 16:14:25 -0500 Subject: [PATCH 251/630] update README --- README.md | 36 ++++++++++++++++++++++++++++++++---- 1 file changed, 32 insertions(+), 4 deletions(-) diff --git a/README.md b/README.md index 8bf867f39964..08cf95f87de9 100644 --- a/README.md +++ b/README.md @@ -17,8 +17,12 @@ Here is an exmple of how training a simple 3-layer MLP on MNIST looks like: ```julia using MXNet -mlp = @mx.chain mx.Variable(:data) => - mx.MLP([128, 64, 10]) => +mlp = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=128) => + mx.Activation(name=:relu1, act_type=:relu) => + mx.FullyConnected(name=:fc2, num_hidden=64) => + mx.Activation(name=:relu2, act_type=:relu) => + mx.FullyConnected(name=:fc3, num_hidden=10) => mx.SoftmaxOutput(name=:softmax) # data provider @@ -29,11 +33,35 @@ train_provider, eval_provider = get_mnist_providers(batch_size) # setup model model = mx.FeedForward(mlp, context=mx.cpu()) -# optimizer -optimizer = 
mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) +# optimization algorithm +optimizer = mx.SGD(lr=0.1, momentum=0.9) # fit parameters mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) ``` +You can also predict using the `model` in the following way: + +```julia +probs = mx.predict(model, eval_provider) + +# collect all labels from eval data +labels = Array[] +for batch in eval_provider + push!(labels, copy(mx.get(eval_provider, batch, :softmax_label))) +end +labels = cat(1, labels...) + +# Now we use compute the accuracy +correct = 0 +for i = 1:length(labels) + # labels are 0...9 + if indmax(probs[:,i]) == labels[i]+1 + correct += 1 + end +end +accuracy = 100correct/length(labels) +println(mx.format("Accuracy on eval set: {1:.2f}%", accuracy)) +``` + For more details, please refer to the [document](http://mxnetjl.readthedocs.org/) and [examples](examples). From e848e8d17d7452f4b846dc5d92485c2fd37846b6 Mon Sep 17 00:00:00 2001 From: yeesian Date: Fri, 20 Nov 2015 16:20:47 -0500 Subject: [PATCH 252/630] spelling :bee: --- README.md | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/README.md b/README.md index 08cf95f87de9..f60ca9f460a0 100644 --- a/README.md +++ b/README.md @@ -7,12 +7,12 @@ [![Join the chat at https://gitter.im/dmlc/mxnet](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/dmlc/mxnet?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge) -MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of features include: +MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. 
Some highlight of its features include: * Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. * Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. -Here is an exmple of how training a simple 3-layer MLP on MNIST looks like: +Here is an example of how training a simple 3-layer MLP on MNIST looks like: ```julia using MXNet @@ -64,4 +64,4 @@ accuracy = 100correct/length(labels) println(mx.format("Accuracy on eval set: {1:.2f}%", accuracy)) ``` -For more details, please refer to the [document](http://mxnetjl.readthedocs.org/) and [examples](examples). +For more details, please refer to the [documentation](http://mxnetjl.readthedocs.org/) and [examples](examples). From 7d8de6bf86a87e9387e0824c0425c6a4b980a41e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 21 Nov 2015 22:26:14 -0500 Subject: [PATCH 253/630] fix API change: scalar_on_right -> on_left --- src/symbolic-node.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index c1b604432718..62bf24d18b2b 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -286,7 +286,7 @@ function .-(self :: SymbolicNode, arg :: Real) end function -(arg :: Real, self :: SymbolicNode) - _MinusScalar(self, scalar=arg, scalar_on_right=true) + _MinusScalar(self, scalar=arg, scalar_on_left=true) end function .-(arg :: Real, self :: SymbolicNode) -(arg, self) @@ -329,7 +329,7 @@ function /(self :: SymbolicNode, arg :: Real) ./(self, arg) end function ./(arg :: Real, self :: SymbolicNode) - _DivScalar(self, scalar=arg, scalar_on_right=true) + _DivScalar(self, scalar=arg, scalar_on_left=true) end import Base: .^, ^ From 46257d28b77cc607856ee11fcb12fd6e60559adb Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Mon, 23 Nov 2015 18:04:31 +0900 Subject: [PATCH 254/630] basic interface for setting and getting attributes --- src/symbolic-node.jl | 29 
+++++++++++++++++++++++++++++ test/unittest/symbolic-node.jl | 9 +++++++++ 2 files changed, 38 insertions(+) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 62bf24d18b2b..d7584d73baa1 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -122,6 +122,35 @@ function get_internals(self :: SymbolicNode) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end +#=doc +.. function:: get_attr(self :: SymbolicNode, key :: Symbol) + + Get attribute attached to this :class:`SymbolicNode` belonging to key. +=# +function get_attr(self :: SymbolicNode, key :: Symbol) + key_s = bytestring(string(key)) + ref_out = Ref{Cstring}() + ref_success = Ref{Cint}(-1) + @mxcall(:MXSymbolGetAttr, (MX_handle, Cstring, Ref{Cstring}, Ref{Cint}), self, key_s, ref_out, ref_success) + if ref_success[] == 1 + return bytestring(ref_out[]) + else + throw(KeyError(key)) + end +end + +#=doc +.. function:: set_attr(self:: SymbolicNode, key :: Symbol, value :: AbstractString) + + Set the attribute key to value for this :class:`SymbolicNode`. +=# +function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) + key_s = bytestring(string(key)) + value_s = bytestring(value) + + @mxcall(:MXSymbolSetAttr, (MX_handle, Cstring, Cstring), self, key_s, value_s) +end + #=doc .. 
function:: Variable(name :: Union{Base.Symbol, AbstractString}) diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 33948adfcd40..9dabcf281c89 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -81,6 +81,14 @@ function test_saveload() rm(fname) end +function test_attrs() + info("SymbolicNode::Attributes") + + data = mx.Variable(:data) + + mx.set_attr(data, :test, "1.0") + @test mx.get_attr(data, :test) == "1.0" +end ################################################################################ # Run tests @@ -91,5 +99,6 @@ test_compose() test_infer_shape() test_infer_shape_error() test_saveload() +test_attrs() end From e19ca8ee40c89f43b4f3da31d4cc540f27992037 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 23 Nov 2015 09:05:46 -0500 Subject: [PATCH 255/630] add warning to discourage users from calling set_attr directly --- docs/api/io.rst | 4 +- docs/api/symbolic-node.rst | 103 ++++++++++++++++++++++++++++++++++--- src/symbolic-node.jl | 7 +++ 3 files changed, 104 insertions(+), 10 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index 6186db52ecc1..f1ab959be6f2 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -324,7 +324,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -467,7 +467,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :return: the constructed :class:`MXDataProvider`. 
diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index d847c6a8bd38..e1f301783051 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -80,6 +80,27 @@ Symbolic API +.. function:: get_attr(self :: SymbolicNode, key :: Symbol) + + Get attribute attached to this :class:`SymbolicNode` belonging to key. + + + + +.. function:: set_attr(self:: SymbolicNode, key :: Symbol, value :: AbstractString) + + Set the attribute key to value for this :class:`SymbolicNode`. + + .. warning:: + + It is encouraged not to call this function directly, unless you know exactly what you are doing. The + recommended way of setting attributes is when creating the :class:`SymbolicNode`. Changing + the attributes of a :class:`SymbolicNode` that is already been used somewhere else might + cause unexpected behavior and inconsistency. + + + + .. function:: Variable(name :: Union{Base.Symbol, AbstractString}) Create a symbolic variable with the given name. This is typically used as a placeholder. @@ -220,6 +241,10 @@ Public APIs :param num_args: Number of inputs to be concated. :type num_args: int, required + + :param dim: the dimension to be concated. + :type dim: int, optional, default='1' + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :return: the constructed :class:`SymbolicNode`. @@ -366,6 +391,33 @@ Public APIs +.. function:: Embedding(...) + + Get embedding for one-hot input + + :param data: Input data to the EmbeddingOp. + :type data: SymbolicNode + + + :param weight: Enbedding weight matrix. + :type weight: SymbolicNode + + + :param input_dim: input dim of one-hot encoding + :type input_dim: int, required + + + :param output_dim: output dim of embedding + :type output_dim: int, required + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: Flatten(...) 
Flatten input @@ -737,8 +789,8 @@ Internal APIs :type scalar: float, required - :param scalar_on_right: scalar operand is on the right. - :type scalar_on_right: boolean, optional, default=False + :param scalar_on_left: scalar operand is on the left. + :type scalar_on_left: boolean, optional, default=False :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. @@ -772,8 +824,8 @@ Internal APIs :type scalar: float, required - :param scalar_on_right: scalar operand is on the right. - :type scalar_on_right: boolean, optional, default=False + :param scalar_on_left: scalar operand is on the left. + :type scalar_on_left: boolean, optional, default=False :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. @@ -807,8 +859,8 @@ Internal APIs :type scalar: float, required - :param scalar_on_right: scalar operand is on the right. - :type scalar_on_right: boolean, optional, default=False + :param scalar_on_left: scalar operand is on the left. + :type scalar_on_left: boolean, optional, default=False :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. @@ -861,8 +913,43 @@ Internal APIs :type scalar: float, required - :param scalar_on_right: scalar operand is on the right. - :type scalar_on_right: boolean, optional, default=False + :param scalar_on_left: scalar operand is on the left. + :type scalar_on_left: boolean, optional, default=False + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: _Power(...) + + Perform an elementwise power. + + :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: _PowerScalar(...) + + Perform an elementwise power. + + :param array: Input array operand to the operation. 
+ :type array: SymbolicNode + + + :param scalar: scalar value. + :type scalar: float, required + + + :param scalar_on_left: scalar operand is on the left. + :type scalar_on_left: boolean, optional, default=False :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index d7584d73baa1..c4eb3b2f1237 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -143,6 +143,13 @@ end .. function:: set_attr(self:: SymbolicNode, key :: Symbol, value :: AbstractString) Set the attribute key to value for this :class:`SymbolicNode`. + + .. warning:: + + It is encouraged not to call this function directly, unless you know exactly what you are doing. The + recommended way of setting attributes is when creating the :class:`SymbolicNode`. Changing + the attributes of a :class:`SymbolicNode` that is already been used somewhere else might + cause unexpected behavior and inconsistency. =# function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) key_s = bytestring(string(key)) From 266d9462926d9d2cb48d6dc3693126c0382ffcd6 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 24 Nov 2015 10:06:36 +0900 Subject: [PATCH 256/630] attr interface for SymbolicNodes --- src/symbolic-node.jl | 35 +++++++++++++++++++++++++++------- test/unittest/symbolic-node.jl | 17 ++++++++++++++++- 2 files changed, 44 insertions(+), 8 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index c4eb3b2f1237..0d7f5937f88a 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -126,6 +126,7 @@ end .. function:: get_attr(self :: SymbolicNode, key :: Symbol) Get attribute attached to this :class:`SymbolicNode` belonging to key. + :return: The value belonging to key as a :class:`Nullable`. 
=# function get_attr(self :: SymbolicNode, key :: Symbol) key_s = bytestring(string(key)) @@ -133,9 +134,9 @@ function get_attr(self :: SymbolicNode, key :: Symbol) ref_success = Ref{Cint}(-1) @mxcall(:MXSymbolGetAttr, (MX_handle, Cstring, Ref{Cstring}, Ref{Cint}), self, key_s, ref_out, ref_success) if ref_success[] == 1 - return bytestring(ref_out[]) + return Nullable{ByteString}(bytestring(ref_out[])) else - throw(KeyError(key)) + return Nullable{ByteString}() end end @@ -159,15 +160,22 @@ function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) end #=doc -.. function:: Variable(name :: Union{Base.Symbol, AbstractString}) +.. function:: Variable(name :: Union{Symbol, AbstractString}) Create a symbolic variable with the given name. This is typically used as a placeholder. For example, the data node, acting as the starting point of a network architecture. + + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`Variable`. =# -function Variable(name :: Union{Base.Symbol, AbstractString}) +function Variable(name :: Union{Symbol, AbstractString}; attrs = Dict()) + attrs = convert(Dict{Symbol, AbstractString}, attrs) hdr_ref = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateVariable, (char_p, Ref{MX_handle}), name, hdr_ref) - SymbolicNode(MX_SymbolHandle(hdr_ref[])) + node = SymbolicNode(MX_SymbolHandle(hdr_ref[])) + for (k, v) in attrs + set_attr(node, k, v) + end + node end #=doc @@ -489,7 +497,8 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) f_desc *= "This function support variable length positional :class:`SymbolicNode` inputs.\n\n" end f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional.\n\n" + f_desc *= ":param Symbol name: The name of the :class:`SymbolicNode`. (e.g. 
`:my_symbol`), optional.\n" + f_desc *= ":param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`.\n\n" f_desc *= ":return: the constructed :class:`SymbolicNode`.\n\n" return (func_name, f_desc) end @@ -506,7 +515,8 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) param_keys = AbstractString[] param_vals = AbstractString[] - symbol_kws = Dict{Base.Symbol, SymbolicNode}() + symbol_kws = Dict{Symbol, SymbolicNode}() + attrs = Dict{Symbol, AbstractString}() $(if kv_nargs != symbol("") quote @@ -521,6 +531,12 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) if k == :name; continue; end if isa(v, SymbolicNode) symbol_kws[k] = v + elseif k == :attrs + if isa(v, Dict) + attrs = convert(Dict{Symbol, AbstractString}, v) + else + throw(ArgumentError("attrs needs to be a Dictionary")) + end else push!(param_keys, string(k)) push!(param_vals, dump_mx_param(v)) @@ -550,6 +566,11 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) hint = lowercase($func_name_s) name = get!(DEFAULT_NAME_MANAGER, name, hint) + # set attrs + for (k, v) in attrs + set_attr(node, k, v) + end + if length(args) != 0 _compose!(node, name, args...) else diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 9dabcf281c89..e5a5531845ec 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -86,8 +86,23 @@ function test_attrs() data = mx.Variable(:data) + result = mx.get_attr(data, :test) + @test isnull(result) mx.set_attr(data, :test, "1.0") - @test mx.get_attr(data, :test) == "1.0" + result = mx.get_attr(data, :test) + @test !isnull(result) + @test get(result) == "1.0" + + data2 = mx.Variable(:data2, attrs = Dict(:test => "hallo!")) + @test get(mx.get_attr(data2, :test)) == "hallo!" 
+ + conv = mx.Convolution(data = data2, kernel = (1,1), num_filter = 1, attrs = Dict(:a => "a", :π => "π")) + @test isnull(mx.get_attr(conv, :b)) + @test get(mx.get_attr(conv, :a)) == "a" + @test get(mx.get_attr(conv, :π)) == "π" + + @test_throws MethodError mx.Variable(:data3, attrs = Dict(:test => "1.0", :test2 => 1.0)) + @test_throws MethodError mx.Convolution(data=data2, kernel = (1,1), num_filter = 1, attrs = Dict(:test => "1.0", :test2 => 1.0)) end ################################################################################ From 247ec44da550a7340b7657d7fcf4f4f13def562e Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 24 Nov 2015 11:00:20 +0900 Subject: [PATCH 257/630] attrs: Doc rebuild --- docs/api/io.rst | 4 +- docs/api/ndarray.rst | 11 +++ docs/api/symbolic-node.rst | 145 +++++++++++++++++++++++++++---------- 3 files changed, 121 insertions(+), 39 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index f1ab959be6f2..6186db52ecc1 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -324,7 +324,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -467,7 +467,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :return: the constructed :class:`MXDataProvider`. diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index 270d85bab837..c5baf5b75301 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -433,6 +433,17 @@ object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the out Public APIs ^^^^^^^^^^^ +.. function:: abs(...) 
+ + Take absolute value of the src + + :param src: Source input to the function + :type src: NDArray + + + + + .. function:: choose_element_0index(...) Choose one element from each line(row for python, column for R/Julia) in lhs according to index indicated by rhs. This function assume rhs uses 0-based index. diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index e1f301783051..3e030378c3ba 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -83,6 +83,7 @@ Symbolic API .. function:: get_attr(self :: SymbolicNode, key :: Symbol) Get attribute attached to this :class:`SymbolicNode` belonging to key. + :return: The value belonging to key as a :class:`Nullable`. @@ -101,11 +102,13 @@ Symbolic API -.. function:: Variable(name :: Union{Base.Symbol, AbstractString}) +.. function:: Variable(name :: Union{Symbol, AbstractString}) Create a symbolic variable with the given name. This is typically used as a placeholder. For example, the data node, acting as the starting point of a network architecture. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`Variable`. + @@ -186,7 +189,8 @@ Public APIs :param act_type: Activation function to be applied. :type act_type: {'relu', 'sigmoid', 'tanh'}, required - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -209,7 +213,8 @@ Public APIs :param momentum: Momentum for moving average :type momentum: float, optional, default=0.9 - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
+ :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -224,7 +229,8 @@ Public APIs :param data: Input data. :type data: SymbolicNode - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -245,7 +251,8 @@ Public APIs :param dim: the dimension to be concated. :type dim: int, optional, default='1' - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -296,7 +303,8 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -347,7 +355,8 @@ Public APIs :param no_bias: Whether to disable bias parameter. :type no_bias: boolean, optional, default=True - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. 
@@ -366,7 +375,8 @@ Public APIs :param p: Fraction of the input that gets dropped out at training time :type p: float, optional, default=0.5 - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -383,7 +393,8 @@ Public APIs :param num_args: Number of inputs to be sumed. :type num_args: int, required - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -410,7 +421,8 @@ Public APIs :param output_dim: output dim of embedding :type output_dim: int, required - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -425,7 +437,8 @@ Public APIs :param data: Input data to flatten. :type data: SymbolicNode - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -456,7 +469,8 @@ Public APIs :param no_bias: Whether to disable bias parameter. 
:type no_bias: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -487,7 +501,8 @@ Public APIs :param nsize: normalization window width in elements. :type nsize: int (non-negative), required - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -518,7 +533,8 @@ Public APIs :param upper_bound: Upper bound of random slope. (For rrelu only) :type upper_bound: float, optional, default=0.334 - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -537,7 +553,8 @@ Public APIs :param label: Input label to function. :type label: SymbolicNode - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -557,7 +574,8 @@ Public APIs :param label: Input label to function. :type label: SymbolicNode - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
+ :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -588,7 +606,8 @@ Public APIs :param pad: pad for pooling: (y, x) :type pad: Shape(tuple), optional, default=(0, 0) - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -607,7 +626,8 @@ Public APIs :param target_shape: Target new shape :type target_shape: Shape(tuple), required - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -622,7 +642,8 @@ Public APIs :param num_outputs: Number of outputs to be sliced. :type num_outputs: int, required - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -645,7 +666,8 @@ Public APIs :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
+ :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -668,7 +690,8 @@ Public APIs :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -691,7 +714,24 @@ Public APIs :param dim2: the second axis to be swapped. :type dim2: int (non-negative), optional, default=0 - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: abs(...) + + Take absolute value of the src + + :param src: Source symbolic input to the function + :type src: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -706,7 +746,8 @@ Public APIs :param src: Source symbolic input to the function :type src: SymbolicNode - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
+ :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -721,7 +762,8 @@ Public APIs :param src: Source symbolic input to the function :type src: SymbolicNode - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -736,7 +778,8 @@ Public APIs :param src: Source symbolic input to the function :type src: SymbolicNode - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -751,7 +794,8 @@ Public APIs :param src: Source symbolic input to the function :type src: SymbolicNode - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -769,7 +813,8 @@ Internal APIs Perform an elementwise div. - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -792,7 +837,8 @@ Internal APIs :param scalar_on_left: scalar operand is on the left. 
:type scalar_on_left: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -804,7 +850,8 @@ Internal APIs Perform an elementwise minus. - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -827,7 +874,8 @@ Internal APIs :param scalar_on_left: scalar operand is on the left. :type scalar_on_left: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -839,7 +887,8 @@ Internal APIs Perform an elementwise mul. - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -862,7 +911,24 @@ Internal APIs :param scalar_on_left: scalar operand is on the left. :type scalar_on_left: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. 
`:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: _NDArray(...) + + Stub for implementing an operator implemented in native frontend language with ndarray. + + :param info: + :type info: , required + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -881,7 +947,8 @@ Internal APIs :param need_top_grad: Whether this layer needs out grad for backward. Should be false for loss layers. :type need_top_grad: boolean, optional, default=True - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -893,7 +960,8 @@ Internal APIs Perform an elementwise plus. - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -916,7 +984,8 @@ Internal APIs :param scalar_on_left: scalar operand is on the left. :type scalar_on_left: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. 
:return: the constructed :class:`SymbolicNode`. @@ -928,7 +997,8 @@ Internal APIs Perform an elementwise power. - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. @@ -951,7 +1021,8 @@ Internal APIs :param scalar_on_left: scalar operand is on the left. :type scalar_on_left: boolean, optional, default=False - :param Base.Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. :return: the constructed :class:`SymbolicNode`. From c66531f9ea70dfe38fbab7fc7814186829a1862d Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 26 Nov 2015 10:13:56 +0900 Subject: [PATCH 258/630] adds LearningRate.Inv from Mocha --- src/optimizer.jl | 21 ++++++++++++++++++++- 1 file changed, 20 insertions(+), 1 deletion(-) diff --git a/src/optimizer.jl b/src/optimizer.jl index 0a3f23bc96ba..887fd9ab59e0 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -106,8 +106,27 @@ function Exp(base_lr::Real; gamma::Real=0.9, decay_on_iteration::Bool=false) end get_learning_rate(self :: Exp, state :: OptimizationState) = self.learning_rate * self.gamma ^ (self.on_iteration ? state.curr_iter : state.curr_epoch) +#=doc +.. class:: LearningRate.Inv -end # module LearningRate + :math:`\eta_t = \eta_0 * (1 + \gamma * t)^(-power)`. + Here :math:`t` is the epoch count, or the iteration count if ``decay_on_iteration`` + is set to true. 
+=# +type Inv <: AbstractLearningRateScheduler + learning_rate :: Float64 + gamma :: Float64 + power :: Float64 + on_iteration :: Bool +end +function Inv(base_lr :: Real; gamma::Real=0.9, power::Real=0.5, decay_on_iteration::Bool=false) + @assert(0 < gamma < 1) + @assert(0 <= power) + Inv(Float64(base_lr), Float64(gamma), Float64(power), decay_on_iteration) +end +get_learning_rate(self :: Inv, state :: OptimizationState) = + self.learning_rate * ( 1 + self.gamma * (self.on_iteration ? state.curr_iter : state.curr_epoch)) ^ (-self.power) +end# module LearningRate ################################################################################ function get_lr_scheduler(scheduler :: Any, lr :: Real) if isa(scheduler, AbstractLearningRateScheduler) From 74cc5baa1104a851a8a89bcd22e6ba1c1614f8b7 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 Nov 2015 17:41:05 +0900 Subject: [PATCH 259/630] Fixes usage of floor https://github.com/dmlc/mxnet/pull/717 a PR upstream added floor/ceil/round, which are now imported as operators, causing problems with the native Julia functions. Luckily there is only one usage. 
--- src/model.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/model.jl b/src/model.jl index 80f0a9644778..8cb5e5bc39df 100644 --- a/src/model.jl +++ b/src/model.jl @@ -41,7 +41,7 @@ end """ function _split_inputs(batch_size :: Int, n_split :: Int) @assert(batch_size >= n_split) - per_split = floor(Int, batch_size / n_split) + per_split = Base.floor(Int, batch_size / n_split) counts = Base.zeros(Int, n_split)+per_split extra = batch_size - sum(counts) counts[1:extra] += 1 From f094a11cbbd1deb15a516479fdd3e271c8dd0385 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 29 Nov 2015 23:41:49 -0500 Subject: [PATCH 260/630] add missing _init_default --- src/initializer.jl | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/initializer.jl b/src/initializer.jl index 8263c06ba496..0d2a10586f57 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -56,6 +56,10 @@ function _init_zero(self :: AbstractInitializer, name :: Base.Symbol, array :: N array[:] = 0 end +function _init_default(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + error("Do not know how to init $name") +end + #=doc Built-in initializers --------------------- From 2ff90c364f25684bf5d47a23795524f0ae757f80 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 1 Dec 2015 21:20:07 +0900 Subject: [PATCH 261/630] imports operators into the namespace to prevent issues --- src/MXNet.jl | 3 +++ src/model.jl | 2 +- 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/src/MXNet.jl b/src/MXNet.jl index 42c9e45f477e..c5056320791c 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -8,6 +8,9 @@ export mx module mx using Formatting +# Functions from base that we can safely extend and that are defined by libmxnet. 
+import Base: round, ceil, floor, cos, sin, abs, sign, exp, sqrt, exp, log, norm + include("base.jl") include("context.jl") diff --git a/src/model.jl b/src/model.jl index 8cb5e5bc39df..80f0a9644778 100644 --- a/src/model.jl +++ b/src/model.jl @@ -41,7 +41,7 @@ end """ function _split_inputs(batch_size :: Int, n_split :: Int) @assert(batch_size >= n_split) - per_split = Base.floor(Int, batch_size / n_split) + per_split = floor(Int, batch_size / n_split) counts = Base.zeros(Int, n_split)+per_split extra = batch_size - sum(counts) counts[1:extra] += 1 From 67c8bb2d6e319d7a95fc574a76736e5c20d05523 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 2 Dec 2015 00:42:26 -0500 Subject: [PATCH 262/630] prepare for v0.0.6 (c.f. #42) --- NEWS.md | 6 ++++++ docs/conf.py | 4 ++-- 2 files changed, 8 insertions(+), 2 deletions(-) diff --git a/NEWS.md b/NEWS.md index d50bd5ed9300..dd95dbb5ffec 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,9 @@ +$ v0.0.6 (2015.12.02) + +* Variants of Xaiver initializers (@vchuravy) +* More arithmetic operators on symbolic nodes +* Basic interface for symbolic node attributes (@vchuravy) + # v0.0.5 (2015.11.14) * char-lstm example. diff --git a/docs/conf.py b/docs/conf.py index c2a405765352..32e0d28f35ba 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -56,9 +56,9 @@ # built documents. # # The short X.Y version. -version = '0.0.5' +version = '0.0.6' # The full version, including alpha/beta/rc tags. -release = '0.0.5' +release = '0.0.6' # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. 
From aa1b600cd9683bffe82d26f3d5d29ec928ea47c2 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 3 Dec 2015 10:38:44 -0500 Subject: [PATCH 263/630] backport @defstruct from SimpleStructs.jl --- src/base.jl | 82 ++++++++++++++++++++++++++++++++++-------- src/model.jl | 2 +- src/optimizers/adam.jl | 2 +- src/optimizers/sgd.jl | 2 +- 4 files changed, 71 insertions(+), 17 deletions(-) diff --git a/src/base.jl b/src/base.jl index 0988400b9d31..de48241ac7e9 100644 --- a/src/base.jl +++ b/src/base.jl @@ -161,18 +161,48 @@ is available. The macro will define a constructor that could accept the keyword arguments. """ -macro defstruct(name, super_name, fields) - @assert fields.head == :tuple - fields = fields.args +macro defstruct(name, fields) + _defstruct_impl(false, name, fields) +end + +"""A convenient macro to define immutable structs. The same as +`@defstruct` except that the defined type is immutable. +""" +macro defimmutable(name, fields) + _defstruct_impl(true, name, fields) +end + +"""Internal use only, this value is used to indicate a required value +is not specified. 
+""" +immutable __Undefined +end + +function _defstruct_impl(is_immutable, name, fields) + if isa(fields, Expr) && fields.head == :tuple + fields = fields.args + else + fields = [fields] + end @assert length(fields) > 0 - name = esc(name) - super_name = esc(super_name) + + if isa(name, Symbol) + name = esc(name) + super_name = :Any + else + @assert(isa(name, Expr) && name.head == :comparison && length(name.args) == 3 && name.args[2] == :(<:), + "name must be of form 'Name <: SuperType'") + @assert(isa(name.args[1], Symbol) && isa(name.args[3], Symbol)) + super_name = esc(name.args[3]) + name = esc(name.args[1]) + end field_defs = Array(Expr, length(fields)) # :(field2 :: Int) field_names = Array(Expr, length(fields)) # :field2 field_defaults = Array(Expr, length(fields)) # :(field2 = 0) field_types = Array(Expr, length(fields)) # Int field_asserts = Array(Expr, length(fields)) # :(field2 >= 0) + required_field = Symbol[] for i = 1:length(fields) field = fields[i] @@ -180,16 +210,30 @@ macro defstruct(name, super_name, fields) field_asserts[i] = esc(field.args[2]) field = field.args[1] end - field_defs[i] = esc(field.args[1]) - field_names[i] = esc(field.args[1].args[1]) - field_types[i] = esc(field.args[1].args[2]) - field_defaults[i] = Expr(:kw, field.args[1].args[1], esc(field.args[2])) + if field.head == :(=) + fname = field.args[1].args[1] + field_defs[i] = esc(field.args[1]) + field_names[i] = esc(fname) + field_types[i] = esc(field.args[1].args[2]) + field_defaults[i] = Expr(:kw, fname, esc(field.args[2])) + else + # no default value provided, required field + fname = field.args[1] + field_defs[i] = esc(field) + field_names[i] = esc(fname) + field_types[i] = esc(field.args[2]) + field_defaults[i] = Expr(:kw, fname, __Undefined()) + push!(required_field, fname) + end end # body of layer type, defining fields type_body = Expr(:block, field_defs...) 
# constructor + requires = map(required_field) do fname + :(@assert(!isa($fname, __Undefined), "value for " * string($fname) * " is required")) + end converts = map(zip(field_names, field_types)) do param f_name, f_type = param :($f_name = convert($f_type, $f_name)) @@ -198,15 +242,25 @@ macro defstruct(name, super_name, fields) :(@assert($(field_asserts[i]))) end construct = Expr(:call, name, field_names...) - ctor_body = Expr(:block, converts..., asserts..., construct) + ctor_body = Expr(:block, requires..., converts..., asserts..., construct) ctor_def = Expr(:call, name, Expr(:parameters, field_defaults...)) ctor = Expr(:(=), ctor_def, ctor_body) - quote - type $(name) <: $super_name - $type_body + if is_immutable + quote + immutable $(name) <: $(super_name) + $type_body + end + + $ctor end + else + quote + type $(name) <: $(super_name) + $type_body + end - $ctor + $ctor + end end end diff --git a/src/model.jl b/src/model.jl index 80f0a9644778..009471c785f2 100644 --- a/src/model.jl +++ b/src/model.jl @@ -260,7 +260,7 @@ function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params : return (kv, update_on_kvstore) end -@defstruct TrainingOptions Any ( +@defstruct TrainingOptions ( initializer :: AbstractInitializer = UniformInitializer(0.01), n_epoch :: Int = 10, eval_data :: Union{Void, AbstractDataProvider} = nothing, diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index 95eaefe275a1..6b17f1b3e152 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -1,4 +1,4 @@ -@defstruct ADAMOptions AbstractOptimizerOptions ( +@defstruct ADAMOptions <: AbstractOptimizerOptions ( (lr :: Real = 0.001, lr > 0), (grad_clip :: Real = 0, grad_clip >= 0), (weight_decay :: Real = 0.00001, weight_decay >= 0), diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index f3d1b10a66e4..fb6bf195fdb5 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -1,4 +1,4 @@ -@defstruct SGDOptions AbstractOptimizerOptions ( +@defstruct 
SGDOptions <: AbstractOptimizerOptions ( (lr :: Real = 0.01, lr > 0), (momentum :: Real = 0.0, momentum >= 0), (grad_clip :: Real = 0, grad_clip >= 0), From b51389884da2f2865bc91bf43b1f7143b41c99bc Mon Sep 17 00:00:00 2001 From: Simon Date: Sat, 5 Dec 2015 12:45:36 +0100 Subject: [PATCH 264/630] use download instead of wget This works better on windows. Unzip must be installed though: http://sourceforge.net/projects/gnuwin32/?source=typ_redirect Maybe use one of the Julia zip packages? --- src/util.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/util.jl b/src/util.jl index be27d1e2310c..1e9b0853dc5b 100644 --- a/src/util.jl +++ b/src/util.jl @@ -18,8 +18,8 @@ function get_mnist_ubyte() filenames = [k => joinpath(mnist_dir, v) for (k,v) in filenames] if !all(isfile, values(filenames)) cd(mnist_dir) do - run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip`) - run(`unzip -u mnist.zip`) + mnist_dir = download("http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip", "mnist.zip") + run(`unzip -u $mnist_dir`) end end return filenames From d612faf9554300e029138a0cc219685d42605c24 Mon Sep 17 00:00:00 2001 From: kasiabozek Date: Wed, 9 Dec 2015 15:59:37 +0900 Subject: [PATCH 265/630] Accuracy metric added to epoch callbacks. 
--- src/callback.jl | 8 ++++---- src/model.jl | 13 +++++++------ 2 files changed, 11 insertions(+), 10 deletions(-) diff --git a/src/callback.jl b/src/callback.jl index 9f3d85b576ff..e18184b1131a 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -110,13 +110,13 @@ end function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end -function Base.call(cb :: EpochCallback, model :: Any, state :: OptimizationState) +function Base.call{T<:Real}(cb :: EpochCallback, model :: Any, state :: OptimizationState, metric :: Vector{Tuple{Base.Symbol, T}}) if state.curr_epoch == 0 if cb.call_on_0 - cb.callback(model, state) + cb.callback(model, state, metric) end elseif state.curr_epoch % cb.frequency == 0 - cb.callback(model, state) + cb.callback(model, state, metric) end end @@ -136,7 +136,7 @@ end =# function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) mkpath(dirname(prefix)) - every_n_epoch(frequency, call_on_0=save_epoch_0) do model, state + every_n_epoch(frequency, call_on_0=save_epoch_0) do model, state, metric save_checkpoint(model, prefix, state) end end diff --git a/src/model.jl b/src/model.jl index 009471c785f2..a8e5c49df28e 100644 --- a/src/model.jl +++ b/src/model.jl @@ -260,7 +260,7 @@ function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params : return (kv, update_on_kvstore) end -@defstruct TrainingOptions ( +@defstruct TrainingOptions Any ( initializer :: AbstractInitializer = UniformInitializer(0.01), n_epoch :: Int = 10, eval_data :: Union{Void, AbstractDataProvider} = nothing, @@ -270,13 +270,14 @@ end callbacks :: Vector{AbstractCallback} = AbstractCallback[], ) -function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, - state::OptimizationState, type_filter::Type) +function _invoke_callbacks{T<:Real}(self::FeedForward, callbacks::Vector{AbstractCallback}, + state::OptimizationState, type_filter::Type; + 
metric::Vector{Tuple{Base.Symbol, T}} = Vector{Tuple{Base.Symbol, Real}}()) map(callbacks) do cb if isa(cb, type_filter) if type_filter == AbstractEpochCallback # epoch callback have extra access to the model object - cb(self, state) + cb(self, state, metric) else cb(state) end @@ -465,6 +466,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end # end of one epoch time_stop = time() + metric = get(opts.eval_metric) info(format("== Epoch {1:0>3d} ==========", i_epoch)) info("## Training summary") for (name, value) in get(opts.eval_metric) @@ -514,7 +516,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra copy!(self.aux_params[name], aux_avg) end end - _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) + _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback; metric=metric) end # end of all epochs end @@ -573,4 +575,3 @@ function load_checkpoint(self :: FeedForward, prefix :: AbstractString, epoch :: self.aux_params = aux_params return self end - From a5c66935c85a4f746530f4011b3e73a72de60b1e Mon Sep 17 00:00:00 2001 From: kasiabozek Date: Wed, 9 Dec 2015 16:04:20 +0900 Subject: [PATCH 266/630] Accuracy metric added to epoch callbacks. 
--- src/model.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/model.jl b/src/model.jl index a8e5c49df28e..2745310da03a 100644 --- a/src/model.jl +++ b/src/model.jl @@ -469,7 +469,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra metric = get(opts.eval_metric) info(format("== Epoch {1:0>3d} ==========", i_epoch)) info("## Training summary") - for (name, value) in get(opts.eval_metric) + for (name, value) in metric info(format("{1:>18s} = {2:.4f}", string(name), value)) end info(format("{1:>18s} = {2:.4f} seconds", "time", time_stop-time_start)) From 49a92d1e90e09e468cdb48a99f9898dee52946b9 Mon Sep 17 00:00:00 2001 From: kasiabozek Date: Wed, 9 Dec 2015 17:06:23 +0900 Subject: [PATCH 267/630] Accuracy metric added to epoch callbacks. --- src/model.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/model.jl b/src/model.jl index 2745310da03a..d4b492333f9f 100644 --- a/src/model.jl +++ b/src/model.jl @@ -260,7 +260,7 @@ function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params : return (kv, update_on_kvstore) end -@defstruct TrainingOptions Any ( +@defstruct TrainingOptions ( initializer :: AbstractInitializer = UniformInitializer(0.01), n_epoch :: Int = 10, eval_data :: Union{Void, AbstractDataProvider} = nothing, From 71b49456c4b26ed49179fcf91b19ece3d5740d81 Mon Sep 17 00:00:00 2001 From: BigEpsilon Date: Sat, 12 Dec 2015 20:58:49 +0100 Subject: [PATCH 268/630] Fix compilation errors for julia 0.4.2 --- src/model.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/model.jl b/src/model.jl index d4b492333f9f..c208873e867f 100644 --- a/src/model.jl +++ b/src/model.jl @@ -43,7 +43,7 @@ function _split_inputs(batch_size :: Int, n_split :: Int) @assert(batch_size >= n_split) per_split = floor(Int, batch_size / n_split) counts = Base.zeros(Int, n_split)+per_split - extra = batch_size - sum(counts) + extra = batch_size - Base.sum(counts) counts[1:extra] 
+= 1 cum = [0, cumsum(counts)...] From 8e879d74512d8ae2e7bc78fe9bd2f31eed4ef9a9 Mon Sep 17 00:00:00 2001 From: BigEpsilon Date: Sat, 12 Dec 2015 21:03:30 +0100 Subject: [PATCH 269/630] Fix compilation errors for julia 0.4.2 --- src/io.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/io.jl b/src/io.jl index 48e0a31e32a2..99fcd8516c6b 100644 --- a/src/io.jl +++ b/src/io.jl @@ -435,7 +435,7 @@ immutable ArrayDataBatch <: AbstractDataBatch idx :: UnitRange{Int} end function Base.next(provider :: ArrayDataProvider, state :: ArrayDataProviderState) - idx = state.curr_idx:min(state.curr_idx+provider.batch_size-1, provider.sample_count) + idx = state.curr_idx:Base.min(state.curr_idx+provider.batch_size-1, provider.sample_count) return (ArrayDataBatch(idx), ArrayDataProviderState(idx.stop+1)) end From 5ed54d85355325b61df333e6b80be0939d7f1c57 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 12 Dec 2015 20:51:00 -0500 Subject: [PATCH 270/630] try to fix build-script for installing cblas --- deps/build.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 5c0dd2bb749f..cb9f930c096d 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -31,8 +31,8 @@ if !libmxnet_detected #-------------------------------------------------------------------------------- # Install dependencies, blas @linux_only begin - blas = library_dependency("blas", aliases=["libblas","libblas.so.3"]) - provides(AptGet, "libblas-dev", blas) + blas = library_dependency("cblas", aliases=["libcblas"]) + provides(AptGet, "libatlas-base-dev", blas) provides(Pacman, "blas", blas) provides(Yum, "blas-devel", blas) From f91c200d6b0c6774f0cc3c533217a1d1f1ce97af Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 12 Dec 2015 20:52:20 -0500 Subject: [PATCH 271/630] add Juliapkg badge --- README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/README.md b/README.md index f60ca9f460a0..855680ae6d1a 100644 --- a/README.md +++ 
b/README.md @@ -3,6 +3,7 @@ [![Build Status](https://travis-ci.org/dmlc/MXNet.jl.svg?branch=master)](https://travis-ci.org/dmlc/MXNet.jl) [![codecov.io](https://codecov.io/github/dmlc/MXNet.jl/coverage.svg?branch=master)](https://codecov.io/github/dmlc/MXNet.jl?branch=master) [![Documentation Status](https://readthedocs.org/projects/mxnetjl/badge/?version=latest)](http://mxnetjl.readthedocs.org/en/latest/?badge=latest) +[![MXNet](http://pkg.julialang.org/badges/MXNet_0.4.svg)](http://pkg.julialang.org/?pkg=MXNet) [![License](http://dmlc.github.io/img/apache2.svg)](LICENSE.md) [![Join the chat at https://gitter.im/dmlc/mxnet](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/dmlc/mxnet?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge) From 0169981ed15d74306996bbba15fc4989cdc0c583 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 14 Dec 2015 16:32:52 -0500 Subject: [PATCH 272/630] try to use the built-in bindeps for building in travis CI --- .travis.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.travis.yml b/.travis.yml index 8771dfa989b6..3dd2874b2cdb 100644 --- a/.travis.yml +++ b/.travis.yml @@ -28,7 +28,7 @@ addons: before_install: - export TRAVIS=test/travis - source $TRAVIS/setup_env.sh - - source $TRAVIS/build_mxnet.sh + #- source $TRAVIS/build_mxnet.sh notifications: email: false From d8e5065a2c99b2d64a02afbcaf202c5d6f2414c2 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 14 Dec 2015 16:39:39 -0500 Subject: [PATCH 273/630] fix travis CI building script --- test/travis/setup_env.sh | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh index 242e034120b2..16ce30c62382 100755 --- a/test/travis/setup_env.sh +++ b/test/travis/setup_env.sh @@ -10,3 +10,8 @@ if [ ${TRAVIS_OS_NAME} == "osx" ]; then brew install graphviz brew install opencv fi + +if [ ${TRAVIS_OS_NAME} == "linux" ]; then + alias gcc='gcc-4.8' + alias g++='g++-4.8' +fi From 
7a7cfbe7256f514d9fcc2c9b2fdf6ef1a4405c63 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 14 Dec 2015 16:51:26 -0500 Subject: [PATCH 274/630] trying to fix travis CI gcc-4.8 thing --- deps/build.jl | 6 ++++++ test/travis/setup_env.sh | 4 ++-- 2 files changed, 8 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index cb9f930c096d..1be650b500fd 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -60,6 +60,12 @@ if !libmxnet_detected `cp make/config.mk config.mk` @osx_only `cp make/osx.mk config.mk` `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` + if haskey(ENV, "MXNET_CC") + `sed -i -s 's/export CC = gcc/export CC = $(ENV["MXNET_CC"])/g' config.mk` + end + if haskey(ENV, "MXNET_CXX") + `sed -i -s 's/export CXX = g++/export CC = $(ENV["MXNET_CXX"])/g' config.mk` + end `make` `cp lib/libmxnet.so $_libdir` end) diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh index 16ce30c62382..d8a454bd83cc 100755 --- a/test/travis/setup_env.sh +++ b/test/travis/setup_env.sh @@ -12,6 +12,6 @@ if [ ${TRAVIS_OS_NAME} == "osx" ]; then fi if [ ${TRAVIS_OS_NAME} == "linux" ]; then - alias gcc='gcc-4.8' - alias g++='g++-4.8' + export MXNET_CC=gcc-4.8 + export MXNET_CXX=g++-4.8 fi From 99e7e66dcc263117751cef6c3ac6998fc4db4015 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 14 Dec 2015 17:00:42 -0500 Subject: [PATCH 275/630] still trying to fix travis CI gcc issue... 
--- deps/build.jl | 6 ------ test/travis/run_test.sh | 1 + test/travis/setup_env.sh | 6 ++++-- 3 files changed, 5 insertions(+), 8 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 1be650b500fd..cb9f930c096d 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -60,12 +60,6 @@ if !libmxnet_detected `cp make/config.mk config.mk` @osx_only `cp make/osx.mk config.mk` `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` - if haskey(ENV, "MXNET_CC") - `sed -i -s 's/export CC = gcc/export CC = $(ENV["MXNET_CC"])/g' config.mk` - end - if haskey(ENV, "MXNET_CXX") - `sed -i -s 's/export CXX = g++/export CC = $(ENV["MXNET_CXX"])/g' config.mk` - end `make` `cp lib/libmxnet.so $_libdir` end) diff --git a/test/travis/run_test.sh b/test/travis/run_test.sh index a576c69f6979..93f8a97c2568 100755 --- a/test/travis/run_test.sh +++ b/test/travis/run_test.sh @@ -1,4 +1,5 @@ #!/bin/bash +g++ --version if [[ -a .git/shallow ]]; then git fetch --unshallow; fi julia -e 'Pkg.clone(pwd()); Pkg.build("MXNet"); Pkg.test("MXNet"; coverage=true)' diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh index d8a454bd83cc..5a33a9e42955 100755 --- a/test/travis/setup_env.sh +++ b/test/travis/setup_env.sh @@ -12,6 +12,8 @@ if [ ${TRAVIS_OS_NAME} == "osx" ]; then fi if [ ${TRAVIS_OS_NAME} == "linux" ]; then - export MXNET_CC=gcc-4.8 - export MXNET_CXX=g++-4.8 + mkdir shadow_bin + ln -s `which gcc-4.8` shadow_bin/gcc + ln -s `which g++-4.8` shadow_bin/g++ + export PATH=$PWD/shadow_bin:$PATH fi From 3861edcf0aeec488942e6f3a1e07c31fe196b3b9 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 14 Dec 2015 17:13:55 -0500 Subject: [PATCH 276/630] clean up travis CI script --- .travis.yml | 1 - test/travis/build_mxnet.sh | 21 --------------------- test/travis/run_test.sh | 1 - 3 files changed, 23 deletions(-) delete mode 100755 test/travis/build_mxnet.sh diff --git a/.travis.yml b/.travis.yml index 3dd2874b2cdb..9f08e176eed2 100644 --- a/.travis.yml +++ b/.travis.yml @@ -28,7 +28,6 
@@ addons: before_install: - export TRAVIS=test/travis - source $TRAVIS/setup_env.sh - #- source $TRAVIS/build_mxnet.sh notifications: email: false diff --git a/test/travis/build_mxnet.sh b/test/travis/build_mxnet.sh deleted file mode 100755 index 6774011f6355..000000000000 --- a/test/travis/build_mxnet.sh +++ /dev/null @@ -1,21 +0,0 @@ -#!/bin/bash - -git clone --recursive https://github.com/dmlc/mxnet __mxnet_build -cd __mxnet_build - -if [ ! -f config.mk ]; then - if [ ${TRAVIS_OS_NAME} == "linux" ]; then - cp make/config.mk config.mk - sed -i 's/export CC = gcc/export CC = gcc-4.8/g' config.mk - sed -i 's/export CXX = g++/export CXX = g++-4.8/g' config.mk - fi - - if [ ${TRAVIS_OS_NAME} == "osx" ]; then - cp make/osx.mk config.mk - fi -fi - -make -j4 || exit 1 - -export MXNET_HOME=$PWD -cd .. diff --git a/test/travis/run_test.sh b/test/travis/run_test.sh index 93f8a97c2568..a576c69f6979 100755 --- a/test/travis/run_test.sh +++ b/test/travis/run_test.sh @@ -1,5 +1,4 @@ #!/bin/bash -g++ --version if [[ -a .git/shallow ]]; then git fetch --unshallow; fi julia -e 'Pkg.clone(pwd()); Pkg.build("MXNet"); Pkg.test("MXNet"; coverage=true)' From 3a134e82e5e663ab095e9f836c2860d9ce6a58ec Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 14 Dec 2015 17:19:19 -0500 Subject: [PATCH 277/630] test whether bindeps works well on travis CI to install cblas --- .travis.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.travis.yml b/.travis.yml index 9f08e176eed2..ded60f0045b6 100644 --- a/.travis.yml +++ b/.travis.yml @@ -19,9 +19,9 @@ addons: - git - libcurl4-openssl-dev - unzip - - libatlas-base-dev - - libatlas-dev - - libopencv-dev + #- libatlas-base-dev + #- libatlas-dev + #- libopencv-dev - gcc-4.8 - g++-4.8 From ce57a3907bd8cf9843d6c7956c39f71385e96aec Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 14 Dec 2015 17:25:02 -0500 Subject: [PATCH 278/630] test failed, travis CI is configured to disable sudo --- .travis.yml | 6 +++--- 1 file 
changed, 3 insertions(+), 3 deletions(-) diff --git a/.travis.yml b/.travis.yml index ded60f0045b6..9f08e176eed2 100644 --- a/.travis.yml +++ b/.travis.yml @@ -19,9 +19,9 @@ addons: - git - libcurl4-openssl-dev - unzip - #- libatlas-base-dev - #- libatlas-dev - #- libopencv-dev + - libatlas-base-dev + - libatlas-dev + - libopencv-dev - gcc-4.8 - g++-4.8 From 8edb94be2a4c6250ef4bb26e58ca5fb0b9fee6ff Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 14 Dec 2015 18:24:56 -0500 Subject: [PATCH 279/630] prepare for v0.0.7 --- NEWS.md | 7 +- docs/api/io.rst | 4 +- docs/api/ndarray.rst | 110 ++++++++++++++ docs/api/optimizer.rst | 9 ++ docs/api/symbolic-node.rst | 303 ++++++++++++++++++++++++++++++++++++- docs/conf.py | 4 +- 6 files changed, 427 insertions(+), 10 deletions(-) diff --git a/NEWS.md b/NEWS.md index dd95dbb5ffec..c0d365a7336e 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,4 +1,9 @@ -$ v0.0.6 (2015.12.02) +# v0.0.7 (2015.12.14) + +* Fix compatability with Julia v0.4.2 (@BigEpsilon) +* Metrics in epoch callbacks (@kasiabozek) + +# v0.0.6 (2015.12.02) * Variants of Xaiver initializers (@vchuravy) * More arithmetic operators on symbolic nodes diff --git a/docs/api/io.rst b/docs/api/io.rst index 6186db52ecc1..f1ab959be6f2 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -324,7 +324,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -467,7 +467,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :return: the constructed :class:`MXDataProvider`. 
diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index c5baf5b75301..d2f0c4fc9636 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -444,6 +444,17 @@ Public APIs +.. function:: ceil(...) + + Take ceil value of the src + + :param src: Source input to the function + :type src: NDArray + + + + + .. function:: choose_element_0index(...) Choose one element from each line(row for python, column for R/Julia) in lhs according to index indicated by rhs. This function assume rhs uses 0-based index. @@ -478,6 +489,17 @@ Public APIs +.. function:: cos(...) + + Take cos of the src + + :param src: Source input to the function + :type src: NDArray + + + + + .. function:: dot(...) Calcuate 2D matrix multiplication @@ -504,6 +526,17 @@ Public APIs +.. function:: floor(...) + + Take floor value of the src + + :param src: Source input to the function + :type src: NDArray + + + + + .. function:: log(...) Take log of the src @@ -515,6 +548,28 @@ Public APIs +.. function:: max(...) + + Take max of the src.The result will be ndarray of shape (1,) on the same device. + + :param src: Source input to the function + :type src: NDArray + + + + + +.. function:: min(...) + + Take min of the src.The result will be ndarray of shape (1,) on the same device. + + :param src: Source input to the function + :type src: NDArray + + + + + .. function:: norm(...) Take L2 norm of the src.The result will be ndarray of shape (1,) on the same device. @@ -526,6 +581,50 @@ Public APIs +.. function:: round(...) + + Take round value of the src + + :param src: Source input to the function + :type src: NDArray + + + + + +.. function:: rsqrt(...) + + Take rsqrt of the src + + :param src: Source input to the function + :type src: NDArray + + + + + +.. function:: sign(...) + + Take sign value of the src + + :param src: Source input to the function + :type src: NDArray + + + + + +.. function:: sin(...) 
+ + Take sin of the src + + :param src: Source input to the function + :type src: NDArray + + + + + .. function:: sqrt(...) Take sqrt of the src @@ -547,6 +646,17 @@ Public APIs + +.. function:: sum(...) + + Take sum of the src.The result will be ndarray of shape (1,) on the same device. + + :param src: Source input to the function + :type src: NDArray + + + + Internal APIs ^^^^^^^^^^^^^ diff --git a/docs/api/optimizer.rst b/docs/api/optimizer.rst index 12e898d233b5..03c9c11fed4a 100644 --- a/docs/api/optimizer.rst +++ b/docs/api/optimizer.rst @@ -80,6 +80,15 @@ Common interfaces +.. class:: LearningRate.Inv + + :math:`\eta_t = \eta_0 * (1 + \gamma * t)^(-power)`. + Here :math:`t` is the epoch count, or the iteration count if ``decay_on_iteration`` + is set to true. + + + + .. function:: get_momentum(scheduler, state) :param AbstractMomentumScheduler scheduler: the momentum scheduler. diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 3e030378c3ba..3ddb299a8807 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -187,7 +187,7 @@ Public APIs :param act_type: Activation function to be applied. - :type act_type: {'relu', 'sigmoid', 'tanh'}, required + :type act_type: {'relu', 'sigmoid', 'softrelu', 'tanh'}, required :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -207,12 +207,16 @@ Public APIs :param eps: Epsilon to prevent div 0 - :type eps: float, optional, default=1e-10 + :type eps: float, optional, default=0.001 :param momentum: Momentum for moving average :type momentum: float, optional, default=0.9 + + :param fix_gamma: Fix gamma while training + :type fix_gamma: boolean, optional, default=True + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
:param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -478,6 +482,34 @@ Public APIs +.. function:: IdentityAttachKLSparseReg(...) + + Apply a sparse regularization to the output a sigmoid activation function. + + :param data: Input data. + :type data: SymbolicNode + + + :param sparseness_target: The sparseness target + :type sparseness_target: float, optional, default=0.1 + + + :param penalty: The tradeoff parameter for the sparseness penalty + :type penalty: float, optional, default=0.001 + + + :param momentum: The momentum for running average + :type momentum: float, optional, default=0.9 + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: LRN(...) Apply convolution to input then add a bias. @@ -519,10 +551,10 @@ Public APIs :param act_type: Activation function to be applied. - :type act_type: {'leaky', 'prelu', 'rrelu'},optional, default='leaky' + :type act_type: {'elu', 'leaky', 'prelu', 'rrelu'},optional, default='leaky' - :param slope: Init slope for the activation. (For leaky only) + :param slope: Init slope for the activation. (For leaky and elu only) :type slope: float, optional, default=0.25 @@ -553,6 +585,10 @@ Public APIs :param label: Input label to function. :type label: SymbolicNode + + :param grad_scale: Scale the gradient by a float factor + :type grad_scale: float, optional, default=1 + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -574,6 +610,34 @@ Public APIs :param label: Input label to function. 
:type label: SymbolicNode + + :param grad_scale: Scale the gradient by a float factor + :type grad_scale: float, optional, default=1 + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: MAERegressionOutput(...) + + Use mean absolute error regression for final output, this is used on final output of a net. + + :param data: Input data to function. + :type data: SymbolicNode + + + :param label: Input label to function. + :type label: SymbolicNode + + + :param grad_scale: Scale the gradient by a float factor + :type grad_scale: float, optional, default=1 + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -623,7 +687,7 @@ Public APIs :type data: SymbolicNode - :param target_shape: Target new shape + :param target_shape: Target new shape. One and only one dim can be 0, in which case it will be infered from the rest of dims :type target_shape: Shape(tuple), required :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. @@ -723,6 +787,36 @@ Public APIs +.. function:: UpSampling(...) + + Perform nearest neighboor/bilinear up sampling to inputs + + This function support variable length positional :class:`SymbolicNode` inputs. + + :param scale: Up sampling scale + :type scale: int (non-negative), required + + + :param num_filter: Input filter. Only used by nearest sample_type. + :type num_filter: int (non-negative), optional, default=0 + + + :param sample_type: upsampling method + :type sample_type: {'bilinear', 'nearest'}, required + + + :param num_args: Number of inputs to be upsampled. 
For nearest neighbor upsampling, this can be 1-N; the size of output will be(scale*h_0,scale*w_0) and all other inputs will be upsampled to thesame size. For bilinear upsampling this must be 2; 1 input and 1 weight. + :type num_args: int, required + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: abs(...) Take absolute value of the src @@ -739,6 +833,38 @@ Public APIs +.. function:: ceil(...) + + Take ceil value of the src + + :param src: Source symbolic input to the function + :type src: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: cos(...) + + Take cos of the src + + :param src: Source symbolic input to the function + :type src: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: exp(...) Take exp of the src @@ -755,6 +881,22 @@ Public APIs +.. function:: floor(...) + + Take floor value of the src + + :param src: Source symbolic input to the function + :type src: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: log(...) Take log of the src @@ -771,6 +913,70 @@ Public APIs +.. function:: round(...) 
+ + Take round value of the src + + :param src: Source symbolic input to the function + :type src: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: rsqrt(...) + + Take rsqrt of the src + + :param src: Source symbolic input to the function + :type src: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: sign(...) + + Take sign value of the src + + :param src: Source symbolic input to the function + :type src: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: sin(...) + + Take sin of the src + + :param src: Source symbolic input to the function + :type src: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: sqrt(...) Take sqrt of the src @@ -809,6 +1015,19 @@ Internal APIs Document and signatures for internal API functions might be incomplete. +.. function:: _CrossDeviceCopy(...) + + Special op to copy data cross device + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. 
+ + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: _Div(...) Perform an elementwise div. @@ -846,6 +1065,80 @@ Internal APIs +.. function:: _Maximum(...) + + Perform an elementwise power. + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: _MaximumScalar(...) + + Perform an elementwise maximum. + + :param array: Input array operand to the operation. + :type array: SymbolicNode + + + :param scalar: scalar value. + :type scalar: float, required + + + :param scalar_on_left: scalar operand is on the left. + :type scalar_on_left: boolean, optional, default=False + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: _Minimum(...) + + Perform an elementwise power. + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: _MinimumScalar(...) + + Perform an elementwise minimum. + + :param array: Input array operand to the operation. + :type array: SymbolicNode + + + :param scalar: scalar value. + :type scalar: float, required + + + :param scalar_on_left: scalar operand is on the left. + :type scalar_on_left: boolean, optional, default=False + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. 
function:: _Minus(...) Perform an elementwise minus. diff --git a/docs/conf.py b/docs/conf.py index 32e0d28f35ba..6293dcf80b3f 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -56,9 +56,9 @@ # built documents. # # The short X.Y version. -version = '0.0.6' +version = '0.0.7' # The full version, including alpha/beta/rc tags. -release = '0.0.6' +release = '0.0.7' # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. From 4c52eb8eb76c6239b0a447a5624c7b6c7c3586b6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 16 Jan 2016 19:25:19 +0800 Subject: [PATCH 280/630] workaround for #55 --- src/ndarray.jl | 7 +++++++ test/unittest/ndarray.jl | 12 ++++++++++++ 2 files changed, 19 insertions(+) diff --git a/src/ndarray.jl b/src/ndarray.jl index e477bf6fd2f4..d0eaaf2621b4 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -940,6 +940,13 @@ function _import_ndarray_functions(;gen_docs=false) _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...) _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...) _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...) 
+ + # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped + # See https://github.com/dmlc/MXNet.jl/issues/55 + if func_name == :dot + _use_vars.args[2:end] = flipdim(_use_vars.args[2:end], 1) + end + stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars) if n_mutate_vars == 1 stmt_ret = :(return out1) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index b7208f532222..680d2f867263 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -260,6 +260,17 @@ function test_nd_as_jl() @test reldiff(copy(z)[:,2:end], copy(x)[:,2:end]) < 1e-6 end +function test_dot() + dims1 = (2, 3) + dims2 = (3, 8) + info("NDArray::dot") + + x = mx.zeros(dims1) + y = mx.zeros(dims2) + z = mx.dot(x, y) + @test size(z) == (2, 8) +end + ################################################################################ # Run tests @@ -276,5 +287,6 @@ test_saveload() test_clip() test_sqrt() test_nd_as_jl() +test_dot() end From 724007a4469a05e90e6c0fc5f6508192825b7d90 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 16 Jan 2016 19:31:48 +0800 Subject: [PATCH 281/630] add notes about AWS GPUs --- docs/api/io.rst | 51 +++++++++++++++++++- docs/api/ndarray.rst | 11 +++++ docs/api/symbolic-node.rst | 98 +++++++++++++++++++++++++++++++++++++- docs/index.rst | 1 + docs/user-guide/faq.rst | 7 +++ 5 files changed, 164 insertions(+), 4 deletions(-) create mode 100644 docs/user-guide/faq.rst diff --git a/docs/api/io.rst b/docs/api/io.rst index f1ab959be6f2..e5cb3ffb32e5 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -267,6 +267,33 @@ libmxnet data providers +.. function:: CSVIter(...) + + Can also be called with the alias ``CSVProvider``. + Create iterator for dataset in csv. + + :param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data. + :param Base.Symbol label_name: keyword argument, default ``:softmax_label``. The name of the label. 
Could be ``nothing`` if no label is presented in this dataset. + + :param data_csv: Dataset Param: Data csv path. + :type data_csv: string, required + + + :param data_shape: Dataset Param: Shape of the data. + :type data_shape: Shape(tuple), required + + + :param label_csv: Dataset Param: Label csv path. If is NULL, all labels will be returned as 0 + :type label_csv: string, optional, default='NULL' + + + :param label_shape: Dataset Param: Shape of the label. + :type label_shape: Shape(tuple), optional, default=(1,) + + :return: the constructed :class:`MXDataProvider`. + + + .. function:: ImageRecordIter(...) Can also be called with the alias ``ImageRecordProvider``. @@ -375,6 +402,18 @@ libmxnet data providers :type min_img_size: float, optional, default=0 + :param random_h: Augmentation Param: Maximum value of H channel in HSL color space. + :type random_h: int, optional, default='0' + + + :param random_s: Augmentation Param: Maximum value of S channel in HSL color space. + :type random_s: int, optional, default='0' + + + :param random_l: Augmentation Param: Maximum value of L channel in HSL color space. + :type random_l: int, optional, default='0' + + :param rotate: Augmentation Param: Rotate angle. :type rotate: int, optional, default='-1' @@ -383,6 +422,10 @@ libmxnet data providers :type fill_value: int, optional, default='255' + :param inter_method: Augmentation Param: 0-NN 1-bilinear 2-cubic 3-area 4-lanczos4 9-auto 10-rand. + :type inter_method: int, optional, default='1' + + :param mirror: Augmentation Param: Whether to mirror the image. :type mirror: boolean, optional, default=False @@ -399,14 +442,18 @@ libmxnet data providers :type mean_r: float, optional, default=0 - :param mean_g: Augmentation: Mean value on G channel. + :param mean_g: Augmentation Param: Mean value on G channel. :type mean_g: float, optional, default=0 - :param mean_b: Augmentation: Mean value on B channel. + :param mean_b: Augmentation Param: Mean value on B channel. 
:type mean_b: float, optional, default=0 + :param mean_a: Augmentation Param: Mean value on Alpha channel. + :type mean_a: float, optional, default=0 + + :param scale: Augmentation Param: Scale in color space. :type scale: float, optional, default=1 diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index d2f0c4fc9636..448f69bd1731 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -444,6 +444,17 @@ Public APIs +.. function:: argmax_channel(...) + + Take sum of the src.The result will be ndarray of shape (1,) on the same device. + + :param src: Source input to the function + :type src: NDArray + + + + + .. function:: ceil(...) Take ceil value of the src diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 3ddb299a8807..8859a2243b6f 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -180,7 +180,7 @@ Public APIs ^^^^^^^^^^^ .. function:: Activation(...) - Apply activation function to input. + Apply activation function to input.Softmax Activation is only available with CUDNN on GPUand will be computed at each location across channel if input is 4D. :param data: Input data to activation function. :type data: SymbolicNode @@ -242,6 +242,26 @@ Public APIs +.. function:: Cast(...) + + Cast array to a different data type. + + :param data: Input data to cast function. + :type data: SymbolicNode + + + :param dtype: Target data type. + :type dtype: {'float16', 'float32', 'float64', 'int32', 'uint8'}, required + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: Concat(...) Perform an feature concat on channel dim (dim 1) over all the inputs. 
@@ -288,6 +308,10 @@ Public APIs :type stride: Shape(tuple), optional, default=(1, 1) + :param dilate: convolution dilate: (y, x) + :type dilate: Shape(tuple), optional, default=(1, 1) + + :param pad: pad for convolution: (y, x) :type pad: Shape(tuple), optional, default=(0, 0) @@ -300,7 +324,7 @@ Public APIs :type num_group: int (non-negative), optional, default=1 - :param workspace: Tmp workspace for convolution (MB) + :param workspace: Tmp workspace for convolution (MB). :type workspace: long (non-negative), optional, default=512 @@ -316,6 +340,36 @@ Public APIs +.. function:: Crop(...) + + Crop the 2th and 3th dim of input data, with the corresponding size of w_h orwith widht and height of the second input symbol + + This function support variable length positional :class:`SymbolicNode` inputs. + + :param num_args: Number of inputs for crop, if equals one, then we will use the h_wfor crop heihgt and width, else if equals two, then we will use the heightand width of the second input symbol, we name crop_like here + :type num_args: int, required + + + :param offset: corp offset coordinate: (y, x) + :type offset: Shape(tuple), optional, default=(0, 0) + + + :param h_w: corp height and weight: (h, w) + :type h_w: Shape(tuple), optional, default=(0, 0) + + + :param center_crop: If set to true, then it will use be the center_crop,or it will crop using the shape of crop_like + :type center_crop: boolean, optional, default=False + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + .. function:: Deconvolution(...) Apply deconvolution to input then add a bias. 
@@ -727,9 +781,37 @@ Public APIs :type grad_scale: float, optional, default=1 + :param ignore_label: the ignore_label will not work in backward, and this onlybe used when multi_output=true + :type ignore_label: float, optional, default=-1 + + :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False + + :param use_ignore: If set to true, the ignore_label value will not contributorto the backward gradient + :type use_ignore: boolean, optional, default=False + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: the constructed :class:`SymbolicNode`. + + + + + +.. function:: SoftmaxActivation(...) + + Apply softmax activation to input. This is intended for internal layers. For output (loss layer) please use SoftmaxOutput. If type=instance, this operator will compute a softmax for each instance in the batch; this is the default mode. If type=channel, this operator will compute a num_channel-class softmax at each position of each instance; this can be used for fully convolutional network, image segmentation, etc. + + :param data: Input data to activation function. + :type data: SymbolicNode + + + :param type: Softmax Mode. If set to instance, this operator will compute a softmax for each instance in the batch; this is the default mode. If set to channel, this operator will compute a num_channel-class softmax at each position of each instance; this can be used for fully convolutional network, image segmentation, etc. + :type type: {'channel', 'instance'},optional, default='instance' + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. 
@@ -751,9 +833,17 @@ Public APIs :type grad_scale: float, optional, default=1 + :param ignore_label: the ignore_label will not work in backward, and this onlybe used when multi_output=true + :type ignore_label: float, optional, default=-1 + + :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes :type multi_output: boolean, optional, default=False + + :param use_ignore: If set to true, the ignore_label value will not contributorto the backward gradient + :type use_ignore: boolean, optional, default=False + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -805,6 +895,10 @@ Public APIs :type sample_type: {'bilinear', 'nearest'}, required + :param multi_input_mode: How to handle multiple input. concat means concatenate upsampled images along the channel dimension. sum means add all images together, only available for nearest neighbor upsampling. + :type multi_input_mode: {'concat', 'sum'},optional, default='concat' + + :param num_args: Number of inputs to be upsampled. For nearest neighbor upsampling, this can be 1-N; the size of output will be(scale*h_0,scale*w_0) and all other inputs will be upsampled to thesame size. For bilinear upsampling this must be 2; 1 input and 1 weight. :type num_args: int, required diff --git a/docs/index.rst b/docs/index.rst index 05077bed6904..7e95b6a7c10e 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -27,6 +27,7 @@ For more details, see documentation below. Please also checkout the `examples user-guide/install user-guide/overview + user-guide/faq .. 
toctree:: :maxdepth: 1 diff --git a/docs/user-guide/faq.rst b/docs/user-guide/faq.rst new file mode 100644 index 000000000000..602c8ab9fda5 --- /dev/null +++ b/docs/user-guide/faq.rst @@ -0,0 +1,7 @@ +FAQ +=== + +Running MXNet on AWS GPU instances +---------------------------------- +See the discussions and notes `here +`_. From c5cbf2440a86f395a7471b40e65d1496eb09f1d3 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 6 Feb 2016 12:17:41 -0500 Subject: [PATCH 282/630] fix seg-fault due to upstream API change --- src/ndarray.jl | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index d0eaaf2621b4..9c4836e60771 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -895,9 +895,13 @@ function _import_ndarray_functions(;gen_docs=false) ref_arg_types = Ref{char_pp}(0) ref_arg_descs = Ref{char_pp}(0) + ref_ret_type = Ref{char_p}(0) + @mxcall(:MXFuncGetInfo, - (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), - func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) + (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, + Ref{char_pp}, Ref{char_pp}, Ref{char_p}), + func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, + ref_arg_types, ref_arg_descs, ref_ret_type) func_name = symbol(bytestring(ref_name[])) From 175d399d7a3f26d1b654638be59ebacec2c6855c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 6 Feb 2016 12:21:52 -0500 Subject: [PATCH 283/630] workaround for jenkins CI --- test/travis/run_test.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/test/travis/run_test.sh b/test/travis/run_test.sh index a576c69f6979..c21864d5de6b 100755 --- a/test/travis/run_test.sh +++ b/test/travis/run_test.sh @@ -1,4 +1,5 @@ #!/bin/bash if [[ -a .git/shallow ]]; then git fetch --unshallow; fi +julia -e 'Pkg.rm("MXNet")' # in case Jenkins CI did not remove existing files julia -e 'Pkg.clone(pwd()); Pkg.build("MXNet"); 
Pkg.test("MXNet"; coverage=true)' From f277cd7598426295d0812f21b8b33e56e7c34234 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 6 Feb 2016 12:27:32 -0500 Subject: [PATCH 284/630] revert last commit (not useful) --- test/travis/run_test.sh | 1 - 1 file changed, 1 deletion(-) diff --git a/test/travis/run_test.sh b/test/travis/run_test.sh index c21864d5de6b..a576c69f6979 100755 --- a/test/travis/run_test.sh +++ b/test/travis/run_test.sh @@ -1,5 +1,4 @@ #!/bin/bash if [[ -a .git/shallow ]]; then git fetch --unshallow; fi -julia -e 'Pkg.rm("MXNet")' # in case Jenkins CI did not remove existing files julia -e 'Pkg.clone(pwd()); Pkg.build("MXNet"); Pkg.test("MXNet"; coverage=true)' From 30b71427e954cf8e2e1ae98a3e004331f1d8eca5 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 6 Feb 2016 12:35:35 -0500 Subject: [PATCH 285/630] fix one travis CI test error --- src/symbolic-node.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 0d7f5937f88a..83ed11ba4923 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -549,8 +549,8 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) $(if kv_nargs != symbol("") quote if length(symbol_kws) > 0 - @assert(false, $func_name * " takes variable number of SymbolicNode arguments, please pass input Symbols " * - "via positional arguments, instead of keyword arguments.") + @assert(false, $func_name_s * " takes variable number of SymbolicNode arguments, " * + "please pass input Symbols via positional arguments, instead of keyword arguments.") end end end) From 1e4f9f0ae406674106e87e688399e13f7d997286 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 6 Feb 2016 12:50:45 -0500 Subject: [PATCH 286/630] fix error due to upstream API changes on symbolic node function --- docs/api/ndarray.rst | 62 +++++++++++++- docs/api/symbolic-node.rst | 164 ++++++++++++++++++++----------------- src/symbolic-node.jl | 8 +- 3 files changed, 
153 insertions(+), 81 deletions(-) diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index 448f69bd1731..be1c74b80bea 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -446,7 +446,7 @@ Public APIs .. function:: argmax_channel(...) - Take sum of the src.The result will be ndarray of shape (1,) on the same device. + Take argmax indices of each channel of the src.The result will be ndarray of shape (num_channel,) on the same device. :param src: Source input to the function :type src: NDArray @@ -513,7 +513,7 @@ Public APIs .. function:: dot(...) - Calcuate 2D matrix multiplication + Calculate 2D matrix multiplication :param lhs: Left operand to the function. :type lhs: NDArray @@ -537,6 +537,25 @@ Public APIs +.. function:: fill_element_0index(...) + + Fill one element of each line(row for python, column for R/Julia) in lhs according to index indicated by rhs and values indicated by mhs. This function assume rhs uses 0-based index. + + :param lhs: Left operand to the function. + :type lhs: NDArray + + + :param mhs: Middle operand to the function. + :type mhs: NDArray + + + :param rhs: Right operand to the function. + :type rhs: NDArray + + + + + .. function:: floor(...) Take floor value of the src @@ -716,6 +735,45 @@ Internal APIs +.. function:: _imdecode(...) + + Decode an image, clip to (x0, y0, x1, y1), substract mean, and write to buffer + + :param mean: image mean + :type mean: NDArray + + + :param index: buffer position for output + :type index: int + + + :param x0: x0 + :type x0: int + + + :param y0: y0 + :type y0: int + + + :param x1: x1 + :type x1: int + + + :param y1: y1 + :type y1: int + + + :param c: channel + :type c: int + + + :param size: length of str_img + :type size: int + + + + + .. function:: _minus(...) 
diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index 8859a2243b6f..a390b82dd09d 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -192,7 +192,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -220,7 +220,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -236,7 +236,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -256,7 +256,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -268,6 +268,10 @@ Public APIs This function support variable length positional :class:`SymbolicNode` inputs. + :param data: List of tensors to concatenate + :type data: SymbolicNode[] + + :param num_args: Number of inputs to be concated. :type num_args: int, required @@ -278,7 +282,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. 
@@ -305,15 +309,15 @@ Public APIs :param stride: convolution stride: (y, x) - :type stride: Shape(tuple), optional, default=(1, 1) + :type stride: Shape(tuple), optional, default=(1,1) :param dilate: convolution dilate: (y, x) - :type dilate: Shape(tuple), optional, default=(1, 1) + :type dilate: Shape(tuple), optional, default=(1,1) :param pad: pad for convolution: (y, x) - :type pad: Shape(tuple), optional, default=(0, 0) + :type pad: Shape(tuple), optional, default=(0,0) :param num_filter: convolution filter(channel) number @@ -334,7 +338,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -342,7 +346,7 @@ Public APIs .. function:: Crop(...) - Crop the 2th and 3th dim of input data, with the corresponding size of w_h orwith widht and height of the second input symbol + Crop the 2nd and 3rd dim of input data, with the corresponding size of w_h or with width and height of the second input symbol This function support variable length positional :class:`SymbolicNode` inputs. @@ -350,12 +354,12 @@ Public APIs :type num_args: int, required - :param offset: corp offset coordinate: (y, x) - :type offset: Shape(tuple), optional, default=(0, 0) + :param offset: crop offset coordinate: (y, x) + :type offset: Shape(tuple), optional, default=(0,0) - :param h_w: corp height and weight: (h, w) - :type h_w: Shape(tuple), optional, default=(0, 0) + :param h_w: crop height and weight: (h, w) + :type h_w: Shape(tuple), optional, default=(0,0) :param center_crop: If set to true, then it will use be the center_crop,or it will crop using the shape of crop_like @@ -364,7 +368,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
:param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -391,11 +395,11 @@ Public APIs :param stride: deconvolution stride: (y, x) - :type stride: Shape(tuple), optional, default=(1, 1) + :type stride: Shape(tuple), optional, default=(1,1) :param pad: pad for deconvolution: (y, x) - :type pad: Shape(tuple), optional, default=(0, 0) + :type pad: Shape(tuple), optional, default=(0,0) :param num_filter: deconvolution filter(channel) number @@ -416,7 +420,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -436,7 +440,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -448,13 +452,13 @@ Public APIs This function support variable length positional :class:`SymbolicNode` inputs. - :param num_args: Number of inputs to be sumed. + :param num_args: Number of inputs to be summed. :type num_args: int, required :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -482,7 +486,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. 
@@ -498,7 +502,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -530,7 +534,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -558,7 +562,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -590,7 +594,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -622,7 +626,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -646,7 +650,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -671,7 +675,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
:param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -695,7 +699,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -718,16 +722,16 @@ Public APIs :param stride: stride: for pooling (y, x) - :type stride: Shape(tuple), optional, default=(1, 1) + :type stride: Shape(tuple), optional, default=(1,1) :param pad: pad for pooling: (y, x) - :type pad: Shape(tuple), optional, default=(0, 0) + :type pad: Shape(tuple), optional, default=(0,0) :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -741,13 +745,13 @@ Public APIs :type data: SymbolicNode - :param target_shape: Target new shape. One and only one dim can be 0, in which case it will be infered from the rest of dims + :param target_shape: Target new shape. One and only one dim can be 0, in which case it will be inferred from the rest of dims :type target_shape: Shape(tuple), required :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -763,7 +767,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode[]. 
@@ -781,21 +785,21 @@ Public APIs :type grad_scale: float, optional, default=1 - :param ignore_label: the ignore_label will not work in backward, and this onlybe used when multi_output=true + :param ignore_label: the ignore_label will not work in backward, and this only be used when multi_output=true :type ignore_label: float, optional, default=-1 - :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes + :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensional input tensor, softmax will generate n*x_1*...*x_n output, each has k classes :type multi_output: boolean, optional, default=False - :param use_ignore: If set to true, the ignore_label value will not contributorto the backward gradient + :param use_ignore: If set to true, the ignore_label value will not contribute to the backward gradient :type use_ignore: boolean, optional, default=False :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -815,7 +819,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -829,25 +833,29 @@ Public APIs :type data: SymbolicNode + :param label: Label data. 
+ :type label: SymbolicNode + + :param grad_scale: Scale the gradient by a float factor :type grad_scale: float, optional, default=1 - :param ignore_label: the ignore_label will not work in backward, and this onlybe used when multi_output=true + :param ignore_label: the ignore_label will not work in backward, and this only be used when multi_output=true :type ignore_label: float, optional, default=-1 - :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensionalinput tensor, softmax will generate n*x_1*...*x_n output, eachhas k classes + :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensional input tensor, softmax will generate n*x_1*...*x_n output, each has k classes :type multi_output: boolean, optional, default=False - :param use_ignore: If set to true, the ignore_label value will not contributorto the backward gradient + :param use_ignore: If set to true, the ignore_label value will not contribute to the backward gradient :type use_ignore: boolean, optional, default=False :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -871,7 +879,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -883,6 +891,10 @@ Public APIs This function support variable length positional :class:`SymbolicNode` inputs. + :param data: Array of tensors to upsample + :type data: SymbolicNode[] + + :param scale: Up sampling scale :type scale: int (non-negative), required @@ -905,7 +917,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
:param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -921,7 +933,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -937,7 +949,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -953,7 +965,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -969,7 +981,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -985,7 +997,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -1001,7 +1013,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -1017,7 +1029,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. 
`:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -1033,7 +1045,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -1049,7 +1061,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -1065,7 +1077,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -1081,7 +1093,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -1097,7 +1109,7 @@ Public APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: . @@ -1116,7 +1128,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. 
@@ -1129,7 +1141,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1153,7 +1165,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1166,7 +1178,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1190,7 +1202,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1203,7 +1215,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1227,7 +1239,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1240,7 +1252,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
:param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1264,7 +1276,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1277,7 +1289,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1301,7 +1313,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1317,7 +1329,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1337,7 +1349,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1350,7 +1362,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. 
@@ -1374,7 +1386,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1387,7 +1399,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. @@ -1411,7 +1423,7 @@ Internal APIs :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: the constructed :class:`SymbolicNode`. + :return: SymbolicNode. diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 83ed11ba4923..e83b94aeefa4 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -480,11 +480,13 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) ref_arg_names = Ref{char_pp}(0) ref_arg_types = Ref{char_pp}(0) ref_arg_descs = Ref{char_pp}(0) + ref_ret_type = Ref{char_p}(0) @mxcall(:MXSymbolGetAtomicSymbolInfo, (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, - Ref{char_pp}, Ref{char_p}), - hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, ref_kv_nargs) + Ref{char_pp}, Ref{char_p}, Ref{char_p}), + hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, + ref_kv_nargs, ref_ret_type) func_name_s= bytestring(ref_name[]) func_name = symbol(func_name_s) @@ -499,7 +501,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) f_desc *= ":param Symbol name: The name of the 
:class:`SymbolicNode`. (e.g. `:my_symbol`), optional.\n" f_desc *= ":param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`.\n\n" - f_desc *= ":return: the constructed :class:`SymbolicNode`.\n\n" + f_desc *= ":return: $(_format_typestring(bytestring(ref_ret_type[]))).\n\n" return (func_name, f_desc) end From 579b88106f361f883982e8caad6c9074408ee569 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 6 Feb 2016 13:10:22 -0500 Subject: [PATCH 287/630] fix for breaking changes in Julia nightly --- src/initializer.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/initializer.jl b/src/initializer.jl index 0d2a10586f57..2f1342e9ac80 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -24,7 +24,7 @@ Or, if full behavior customization is needed, override the following function =# abstract AbstractInitializer -function call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +function call{T<:AbstractInitializer}(self :: T, name :: Base.Symbol, array :: NDArray) strname = string(name) if endswith(strname, "bias") _init_bias(self, name, array) From ce3f6d38bde4be9e8dbdac9d76545bf8132c44b6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 8 Feb 2016 11:34:02 -0500 Subject: [PATCH 288/630] another attempt to fix julia v0.5 compatability --- src/initializer.jl | 4 ++-- src/model.jl | 4 ++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/src/initializer.jl b/src/initializer.jl index 2f1342e9ac80..00e71b19c3cd 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -20,11 +20,11 @@ enough to derive a new type, and implement one or more of the following methods: Or, if full behavior customization is needed, override the following function -.. function:: call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. 
function:: init(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) =# abstract AbstractInitializer -function call{T<:AbstractInitializer}(self :: T, name :: Base.Symbol, array :: NDArray) +function init{T<:AbstractInitializer}(self :: T, name :: Base.Symbol, array :: NDArray) strname = string(name) if endswith(strname, "bias") _init_bias(self, name, array) diff --git a/src/model.jl b/src/model.jl index c208873e867f..93fc41ca0452 100644 --- a/src/model.jl +++ b/src/model.jl @@ -109,12 +109,12 @@ function init_model(self :: FeedForward, initializer :: AbstractInitializer; ove # initialize the contents of the parameters if !arg_defined || overwrite for (k,v) in self.arg_params - initializer(k, v) + init(initializer, k, v) end end if !aux_defined || overwrite for (k,v) in self.aux_params - initializer(k, v) + init(initializer, k, v) end end From 938b2362a78cad578c5dd1f80200d6d7c41f8d65 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 8 Feb 2016 11:43:54 -0500 Subject: [PATCH 289/630] update doc for initializer --- docs/api/initializer.rst | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/api/initializer.rst b/docs/api/initializer.rst index 7123507f7ee9..6dbb81a001b3 100644 --- a/docs/api/initializer.rst +++ b/docs/api/initializer.rst @@ -21,7 +21,7 @@ enough to derive a new type, and implement one or more of the following methods: Or, if full behavior customization is needed, override the following function -.. function:: call(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +.. 
function:: init(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) From 06019e2c1c86588137666384bc420ec9632af5b4 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 8 Feb 2016 11:48:21 -0500 Subject: [PATCH 290/630] stricter type anotation for julia v0.5 --- test/unittest/ndarray.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 680d2f867263..2f7d4d9af6dd 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -192,7 +192,7 @@ function test_saveload() # save and load N arrays of different shape arrays = [rand_tensors(rand_dims()) for i = 1:n_arrays] - nd_arrays = [x[2] for x in arrays] + nd_arrays = NDArray[x[2] for x in arrays] mx.save(fname, nd_arrays) data = mx.load(fname, mx.NDArray) @test isa(data, Vector{mx.NDArray}) From 1c707a2147a077c536627b9f337515677eab1a73 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 8 Feb 2016 12:00:19 -0500 Subject: [PATCH 291/630] fix typo --- test/unittest/ndarray.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 2f7d4d9af6dd..67bff2959c8a 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -192,7 +192,7 @@ function test_saveload() # save and load N arrays of different shape arrays = [rand_tensors(rand_dims()) for i = 1:n_arrays] - nd_arrays = NDArray[x[2] for x in arrays] + nd_arrays = mx.NDArray[x[2] for x in arrays] mx.save(fname, nd_arrays) data = mx.load(fname, mx.NDArray) @test isa(data, Vector{mx.NDArray}) From ac709d12662484705c409911db00868509c6c9f4 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 8 Feb 2016 12:56:59 -0500 Subject: [PATCH 292/630] prepare for v0.0.8 --- NEWS.md | 5 +++++ docs/conf.py | 4 ++-- 2 files changed, 7 insertions(+), 2 deletions(-) diff --git a/NEWS.md b/NEWS.md index c0d365a7336e..f11136c8cd46 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,8 @@ +# v0.0.8 (2016.02.08) + +* 
Fix compatability with Julia v0.5. +* Fix seg-faults introduced by upstream API changes. + # v0.0.7 (2015.12.14) * Fix compatability with Julia v0.4.2 (@BigEpsilon) diff --git a/docs/conf.py b/docs/conf.py index 6293dcf80b3f..7454faa99eee 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -56,9 +56,9 @@ # built documents. # # The short X.Y version. -version = '0.0.7' +version = '0.0.8' # The full version, including alpha/beta/rc tags. -release = '0.0.7' +release = '0.0.8' # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. From 0b387f7be4505262b1925a852c0806d0a02fc04f Mon Sep 17 00:00:00 2001 From: ultradian Date: Thu, 11 Feb 2016 23:12:08 -0800 Subject: [PATCH 293/630] add further information to install.rst Include information on updating the LD_LIBRARY_PATH which had me stumped for a while. Please feel free to reword for clarity. --- docs/user-guide/install.rst | 2 ++ 1 file changed, 2 insertions(+) diff --git a/docs/user-guide/install.rst b/docs/user-guide/install.rst index 43f882928d39..9609368ca1fd 100644 --- a/docs/user-guide/install.rst +++ b/docs/user-guide/install.rst @@ -52,3 +52,5 @@ Basically, MXNet.jl will search ``libmxnet.so`` or ``libmxnet.dll`` in the follo * ``$MXNET_HOME/lib``: customized libmxnet builds * ``Pkg.dir("MXNet")/deps/usr/lib``: automatic builds * Any system wide library search path + +Note that MXNet.jl will not find ``libmxnet.so`` even if it is on the path if a library it depends upon is missing from the LD_LIBRARY_PATH. Thus, if you are going to compile to add CUDA, the path to the CUDA libraries will have to be added to LD_LIBRARY_PATH. 
From f26ad9699df77315b4dbf932d3d103a0a52c5c48 Mon Sep 17 00:00:00 2001 From: ultradian Date: Wed, 17 Feb 2016 21:52:05 -0800 Subject: [PATCH 294/630] Update install.rst --- docs/user-guide/install.rst | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/user-guide/install.rst b/docs/user-guide/install.rst index 9609368ca1fd..d53830a0cb37 100644 --- a/docs/user-guide/install.rst +++ b/docs/user-guide/install.rst @@ -53,4 +53,4 @@ Basically, MXNet.jl will search ``libmxnet.so`` or ``libmxnet.dll`` in the follo * ``Pkg.dir("MXNet")/deps/usr/lib``: automatic builds * Any system wide library search path -Note that MXNet.jl will not find ``libmxnet.so`` even if it is on the path if a library it depends upon is missing from the LD_LIBRARY_PATH. Thus, if you are going to compile to add CUDA, the path to the CUDA libraries will have to be added to LD_LIBRARY_PATH. +Note that MXNet.jl will not find ``libmxnet.so`` even if it is on one of the paths above if a library it depends upon is missing from the ``LD_LIBRARY_PATH``. Thus, if you are going to compile to add CUDA, the path to the CUDA libraries will have to be added to ``LD_LIBRARY_PATH``. From 7a5035773b5dbd7c1d20aeda6c94a5a4d65f3cdd Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Apr 2016 10:27:13 +0900 Subject: [PATCH 295/630] MXNet exposes a transpose function --- src/MXNet.jl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/MXNet.jl b/src/MXNet.jl index c5056320791c..16ad415efe52 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -9,7 +9,8 @@ module mx using Formatting # Functions from base that we can safely extend and that are defined by libmxnet. 
-import Base: round, ceil, floor, cos, sin, abs, sign, exp, sqrt, exp, log, norm +import Base: round, ceil, floor, cos, sin, abs, sign, exp, sqrt, exp, log, norm, + transpose include("base.jl") include("context.jl") From f8988374a0e7f384c487e285470742e117985216 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 8 Apr 2016 16:30:24 +0900 Subject: [PATCH 296/630] add function to get debug_str, similar to python --- src/executor.jl | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) diff --git a/src/executor.jl b/src/executor.jl index 5844a62e446c..4c72589ae966 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -195,3 +195,22 @@ function copy_params_from(self::Executor, arg_params::Dict{Base.Symbol,NDArray}, end end end + + +""" +Get a debug string about internal execution plan. + +Can be used to get an estimated about the memory cost. +```julia + net = ... # Symbol + dProvider = ... # DataProvider + exec = mx.simple_bind(net, mx.cpu(), data=size(dProvider.data_batch[1])) + dbg_str = mx.debug_str(exec) + println(split(ref, ['\n'])[end-2]) +``` +""" +function debug_str(self :: Executor) + s_ref = Ref{Cstring}() + @mxcall(:MXExecutorPrint, (MX_handle, Ptr{Cstring}), self.handle, s_ref) + bytestring(s_ref[]) +end From acd2a74684a518c0bafa85259362191cd917ba1b Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sun, 10 Apr 2016 20:47:44 +0900 Subject: [PATCH 297/630] output TempSpace allocation --- src/model.jl | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/model.jl b/src/model.jl index 93fc41ca0452..b823a342b529 100644 --- a/src/model.jl +++ b/src/model.jl @@ -129,6 +129,8 @@ function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_sha # the predictor use only the first device self.pred_exec = simple_bind(self.arch, self.ctx[1]; grad_req=GRAD_NOP, data_shapes...) 
+ dbg_str = mx.debug_str(self.pred_exec) + info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[1])) copy_params_from(self.pred_exec, self.arg_params, self.aux_params) else # make sure the new setup is compatible with the existing one @@ -345,6 +347,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra data_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)] label_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)] train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=GRAD_WRITE, data_shapes..., label_shapes...) + dbg_str = mx.debug_str(train_execs[i]) + info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[i])) copy_params_from(train_execs[i], self.arg_params, self.aux_params) end From 8b8c9c2a961198ff602fe62c151a7f5e1d386ec6 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 14 Apr 2016 14:55:33 +0900 Subject: [PATCH 298/630] cleanup Accuracy --- src/metric.jl | 57 +++++++++++++++++++++------------------------------ 1 file changed, 23 insertions(+), 34 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 5bf14e52a840..053c549df4eb 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -51,47 +51,36 @@ type Accuracy <: AbstractEvalMetric Accuracy() = new(0.0, 0) end -""" -Implementation taken from findmax in Julia base. -Searches for the maximum value in p_dim of a. -I and n are values for the other dimensions. -""" -function _indmax(a, I, p_dim, n) - m = a[I..., 1, n] - mi = 1 - for i in 2:size(a, p_dim) - ai = a[I..., i, n] - if ai > m || m!=m - m = ai - mi = i - end - end - return mi -end - function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) @nd_as_jl ro=(label,pred) begin - if ndims(pred) > 2 # Multidimensional case - # Construct cartesian index - p_dim = ndims(pred)-1 - initial = tuple(fill(1,p_dim-1)...) - dims = size(pred, (1:p_dim-1)...) 
- crange = CartesianRange(CartesianIndex(initial), CartesianIndex(dims)) - - for sample in 1:size(label, ndims(label)) - for i in crange - l_i = sub2ind(dims, i.I...) - klass = _indmax(pred, i.I, p_dim, sample) - metric.acc_sum += (klass-1) == label[l_i, sample] - metric.n_sample += 1 + # Samples are stored in the last dimension + @assert size(label, ndims(label)) == size(pred, ndims(pred)) + + if ndims(pred) == 4 # Multidimensional case + # Reshape label to be of the same shape as pred. + # Except for the third dimension where the predictions are stored. + labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) + + for sample in 1:size(labels, 4) + for j in 1:size(labels, 2) + for i in 1:size(labels, 1) + label = labels[i, j, 1, sample] + klasses = sub(pred, i, j, :, sample) + klass = indmax(klasses) - 1 # Classes start at 0...k-1 + + metric.acc_sum += klass == label + metric.n_sample += 1 + end end end - else # 1-dimensional case + elseif ndims(pred) == 2 # 1-dimensional case for sample in 1:size(label, 1) - klass = indmax(pred[:, sample]) - metric.acc_sum += (klass-1) == label[sample] + klass = indmax(sub(pred, :, sample)) - 1 + metric.acc_sum += klass == label[sample] metric.n_sample += 1 end + else + error("Can't handle prediction with dimensions $(ndims(pred)).") end end end From 91821482c7612e88c25399aac94980c3593d9cab Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 14 Apr 2016 15:29:01 +0900 Subject: [PATCH 299/630] add average cross-entropy metric --- docs/api/metric.rst | 9 ++++++++ src/metric.jl | 56 +++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 65 insertions(+) diff --git a/docs/api/metric.rst b/docs/api/metric.rst index db503d5e6849..966d682ba2b7 100644 --- a/docs/api/metric.rst +++ b/docs/api/metric.rst @@ -56,3 +56,12 @@ set. + +.. class:: ACE + + Averaged cross-entropy for classification. This also know als logloss. + + Calculated the averaged cross entropy for multi-dimentions output. 
+ + + diff --git a/src/metric.jl b/src/metric.jl index 053c549df4eb..a22794e9f158 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -144,3 +144,59 @@ function reset!(metric :: MSE) metric.mse_sum = 0.0 metric.n_sample = 0 end + +#=doc +.. class:: ACE + + Averaged cross-entropy for classification. This also know als logloss. + + Calculated the averaged cross entropy for multi-dimentions output. +=# +type ACE <: AbstractEvalMetric + ace_sum :: Float64 + n_sample :: Int + + ACE() = new(0.0, 0) +end + +function get(metric :: ACE) + return [(:ACE, - metric.ace_sum / metric.n_sample)] +end + +function reset!(metric :: ACE) + metric.ace_sum = 0.0 + metric.n_sample = 0 +end + +function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) + @nd_as_jl ro=(label,pred) begin + # Samples are stored in the last dimension + @assert size(label, ndims(label)) == size(pred, ndims(pred)) + @assert ndims(pred) == 4 + + labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) + for sample in 1:size(labels, 4) + for j in 1:size(labels, 2) + for i in 1:size(labels, 1) + label = labels[i, j, 1, sample] + + # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification + # Since we can only target labels right now this is the only thing we can do. 
+ target = Int(label) + 1 # klasses are 0...k-1 => julia indexing + p_k = pred[i, j, target, sample] + + metric.ace_sum += log(p_k) + metric.n_sample += 1 + end + end + end + end +end + +function update!(metric :: ACE, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + @assert length(labels) == length(preds) + for i = 1:length(labels) + _update_single_output(metric, labels[i], preds[i]) + end +end + From 3170c4eb22b30b1a4c3bfd6a21a42800a6061e5a Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 14 Apr 2016 15:29:20 +0900 Subject: [PATCH 300/630] update documentation --- docs/api/io.rst | 4 ++-- docs/api/ndarray.rst | 41 +++++++++++++++++++++++++++++++++++++ docs/api/symbolic-node.rst | 42 +++++++++++++++++++++++++++++++++++--- 3 files changed, 82 insertions(+), 5 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index e5cb3ffb32e5..8ec67cf6d073 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -351,7 +351,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -514,7 +514,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 + :type prefetch_buffer: long (non-negative), optional, default=4 :return: the constructed :class:`MXDataProvider`. diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index be1c74b80bea..b72f0faa5cfe 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -687,6 +687,28 @@ Public APIs + +.. function:: sum_mid_internal(...) + + Take sum on medium dimension of the 3D src. + + :param src: Source input to the function + :type src: NDArray + + + + + +.. function:: transpose(...) 
+ + Transpose the input matrix and return a new one + + :param src: Source input to the function + :type src: NDArray + + + + Internal APIs ^^^^^^^^^^^^^ @@ -694,6 +716,25 @@ Internal APIs Document and signatures for internal API functions might be incomplete. +.. function:: _broadcast(...) + + Broadcast array in the given axis to the given size + + :param src: source ndarray + :type src: NDArray + + + :param axis: axis to broadcast + :type axis: int + + + :param size: size of broadcast + :type size: int + + + + + .. function:: _copyto(...) diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index a390b82dd09d..e303afba21dc 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -346,11 +346,15 @@ Public APIs .. function:: Crop(...) - Crop the 2nd and 3rd dim of input data, with the corresponding size of w_h or with width and height of the second input symbol + Crop the 2nd and 3rd dim of input data, with the corresponding size of h_w or with width and height of the second input symbol, i.e., with one input, we need h_w to specify the crop height and width, otherwise the second input symbol's size will be used This function support variable length positional :class:`SymbolicNode` inputs. - :param num_args: Number of inputs for crop, if equals one, then we will use the h_wfor crop heihgt and width, else if equals two, then we will use the heightand width of the second input symbol, we name crop_like here + :param data: Tensor or List of Tensors, the second input will be used as crop_like shape reference + :type data: SymbolicNode or SymbolicNode[] + + + :param num_args: Number of inputs for crop, if equals one, then we will use the h_wfor crop height and width, else if equals two, then we will use the heightand width of the second input symbol, we name crop_like here :type num_args: int, required @@ -374,6 +378,34 @@ Public APIs +.. function:: CuDNNBatchNorm(...) + + Apply batch normalization to input. 
+ + :param data: Input data to batch normalization + :type data: SymbolicNode + + + :param eps: Epsilon to prevent div 0 + :type eps: float, optional, default=0.001 + + + :param momentum: Momentum for moving average + :type momentum: float, optional, default=0.9 + + + :param fix_gamma: Fix gamma while training + :type fix_gamma: boolean, optional, default=False + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: SymbolicNode. + + + + + .. function:: Deconvolution(...) Apply deconvolution to input then add a bias. @@ -759,11 +791,15 @@ Public APIs .. function:: SliceChannel(...) - Slice channel into many outputs with equally divided channel + Slice input equally along specified axis :param num_outputs: Number of outputs to be sliced. :type num_outputs: int, required + + :param axis: Dimension along which to slice. + :type axis: int, optional, default='1' + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. From d85549b86e259db6859ccc96da4e0053653d756a Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 16 Apr 2016 23:20:14 +0900 Subject: [PATCH 301/630] adds MultiACE or ACE per class --- src/metric.jl | 57 +++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 57 insertions(+) diff --git a/src/metric.jl b/src/metric.jl index a22794e9f158..7916d45b639c 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -200,3 +200,60 @@ function update!(metric :: ACE, labels :: Vector{NDArray}, preds :: Vector{NDArr end end +#=doc +.. class:: MultiACE + + Averaged cross-entropy for classification. This also know als logloss. + This variant keeps track of the different losses per class. + + Calculated the averaged cross entropy for multi-dimentions output. 
+=# +type MultiACE <: AbstractEvalMetric + aces :: Vector{Float64} + counts :: Vector{Int} + + MultiACE(nclasses) = new(Base.zeros(nclasses), Base.zeros(Int, nclasses)) +end + +function get(metric :: MultiACE) + aces = [(symbol("ACE_$(i-0)"), - metric.aces[i] / metric.counts[i]) for i in 1:length(metric.aces)] + push!(aces, (:ACE, - Base.sum(metric.aces) / Base.sum(metric.counts))) + return aces +end + +function reset!(metric :: MultiACE) + metric.aces = Base.zero(metric.aces) + metric.counts = Base.zero(metric.counts) +end + +function _update_single_output(metric :: MultiACE, label :: NDArray, pred :: NDArray) + @nd_as_jl ro=(label,pred) begin + # Samples are stored in the last dimension + @assert size(label, ndims(label)) == size(pred, ndims(pred)) + @assert ndims(pred) == 4 + + labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) + for sample in 1:size(labels, 4) + for j in 1:size(labels, 2) + for i in 1:size(labels, 1) + label = labels[i, j, 1, sample] + + # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification + # Since we can only target labels right now this is the only thing we can do. 
+ target = Int(label) + 1 # klasses are 0...k-1 => julia indexing + p_k = pred[i, j, target, sample] + + metric.aces[target] += log(p_k) + metric.counts[target] += 1 + end + end + end + end +end + +function update!(metric :: MultiACE, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + @assert length(labels) == length(preds) + for i = 1:length(labels) + _update_single_output(metric, labels[i], preds[i]) + end +end From 1a73ddae6ec17e90b2ef375f173ecb787f2888c1 Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Mon, 18 Apr 2016 10:48:49 -0700 Subject: [PATCH 302/630] Use openblas from Julia, instead of installing yet another BLAS library --- deps/build.jl | 17 ++++------------- 1 file changed, 4 insertions(+), 13 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index cb9f930c096d..177765bfe869 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -6,7 +6,7 @@ libmxnet_detected = false if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") info("Trying to load existing libmxnet...") - lib = Libdl.find_library(["libmxnet.so","libmxnet.dll"], ["$(ENV["MXNET_HOME"])/lib"]) + lib = Libdl.find_library(["libmxnet"], ["$(ENV["MXNET_HOME"])/lib"]) if !isempty(lib) info("Existing libmxnet detected at $lib, skip building...") libmxnet_detected = true @@ -28,20 +28,11 @@ if !libmxnet_detected error("Automatic building libxmnet on Windows is currently not supported yet.") end - #-------------------------------------------------------------------------------- - # Install dependencies, blas - @linux_only begin - blas = library_dependency("cblas", aliases=["libcblas"]) - provides(AptGet, "libatlas-base-dev", blas) - provides(Pacman, "blas", blas) - provides(Yum, "blas-devel", blas) - - @BinDeps.install Dict(:blas => :blas) - end + openblas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) #-------------------------------------------------------------------------------- # Build libmxnet - mxnet = library_dependency("mxnet", 
aliases=["libmxnet.so"]) + mxnet = library_dependency("mxnet", aliases=["libmxnet"]) _prefix = joinpath(BinDeps.depsdir(mxnet), "usr") _srcdir = joinpath(BinDeps.depsdir(mxnet),"src") @@ -60,7 +51,7 @@ if !libmxnet_detected `cp make/config.mk config.mk` @osx_only `cp make/osx.mk config.mk` `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` - `make` + `make USE_BLAS=openblas MSHADOW_LDFLAGS=-L$(basename(openblas_path)) -j` `cp lib/libmxnet.so $_libdir` end) end From 0c5086ae088899136cb68b5aef0fa6f3ed163ca1 Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Mon, 18 Apr 2016 12:17:28 -0700 Subject: [PATCH 303/630] Simplify linking --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 177765bfe869..7e86297ede89 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -51,7 +51,7 @@ if !libmxnet_detected `cp make/config.mk config.mk` @osx_only `cp make/osx.mk config.mk` `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` - `make USE_BLAS=openblas MSHADOW_LDFLAGS=-L$(basename(openblas_path)) -j` + `make USE_BLAS=openblas MSHADOW_LDFLAGS="$openblas_path" -j` `cp lib/libmxnet.so $_libdir` end) end From 7be95f60df18f13ebb8557c1d2977030035022ca Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Mon, 18 Apr 2016 12:28:39 -0700 Subject: [PATCH 304/630] Bundle generic cblas.h header for users that don't have libblas-dev installed already --- deps/build.jl | 1 + deps/cblas.h | 580 ++++++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 581 insertions(+) create mode 100644 deps/cblas.h diff --git a/deps/build.jl b/deps/build.jl index 7e86297ede89..5a4073537bf2 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -51,6 +51,7 @@ if !libmxnet_detected `cp make/config.mk config.mk` @osx_only `cp make/osx.mk config.mk` `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` + `cp ../../cblas.h include/cblas.h` `make USE_BLAS=openblas MSHADOW_LDFLAGS="$openblas_path" -j` `cp lib/libmxnet.so $_libdir` end) diff 
--git a/deps/cblas.h b/deps/cblas.h new file mode 100644 index 000000000000..941b570c78de --- /dev/null +++ b/deps/cblas.h @@ -0,0 +1,580 @@ +#ifndef CBLAS_H +#define CBLAS_H +#include + +// This header file copied from the Netlib libblas distribution package + +/* Allow the use in C++ code. */ +#ifdef __cplusplus +extern "C" +{ +#endif + +/* + * Enumerated and derived types + */ +#define CBLAS_INDEX size_t /* this may vary between platforms */ + +enum CBLAS_ORDER {CblasRowMajor=101, CblasColMajor=102}; +enum CBLAS_TRANSPOSE {CblasNoTrans=111, CblasTrans=112, CblasConjTrans=113}; +enum CBLAS_UPLO {CblasUpper=121, CblasLower=122}; +enum CBLAS_DIAG {CblasNonUnit=131, CblasUnit=132}; +enum CBLAS_SIDE {CblasLeft=141, CblasRight=142}; + +/* + * =========================================================================== + * Prototypes for level 1 BLAS functions (complex are recast as routines) + * =========================================================================== + */ +float cblas_sdsdot(const int N, const float alpha, const float *X, + const int incX, const float *Y, const int incY); +double cblas_dsdot(const int N, const float *X, const int incX, const float *Y, + const int incY); +float cblas_sdot(const int N, const float *X, const int incX, + const float *Y, const int incY); +double cblas_ddot(const int N, const double *X, const int incX, + const double *Y, const int incY); + +/* + * Functions having prefixes Z and C only + */ +void cblas_cdotu_sub(const int N, const void *X, const int incX, + const void *Y, const int incY, void *dotu); +void cblas_cdotc_sub(const int N, const void *X, const int incX, + const void *Y, const int incY, void *dotc); + +void cblas_zdotu_sub(const int N, const void *X, const int incX, + const void *Y, const int incY, void *dotu); +void cblas_zdotc_sub(const int N, const void *X, const int incX, + const void *Y, const int incY, void *dotc); + + +/* + * Functions having prefixes S D SC DZ + */ +float cblas_snrm2(const int N, const 
float *X, const int incX); +float cblas_sasum(const int N, const float *X, const int incX); + +double cblas_dnrm2(const int N, const double *X, const int incX); +double cblas_dasum(const int N, const double *X, const int incX); + +float cblas_scnrm2(const int N, const void *X, const int incX); +float cblas_scasum(const int N, const void *X, const int incX); + +double cblas_dznrm2(const int N, const void *X, const int incX); +double cblas_dzasum(const int N, const void *X, const int incX); + + +/* + * Functions having standard 4 prefixes (S D C Z) + */ +CBLAS_INDEX cblas_isamax(const int N, const float *X, const int incX); +CBLAS_INDEX cblas_idamax(const int N, const double *X, const int incX); +CBLAS_INDEX cblas_icamax(const int N, const void *X, const int incX); +CBLAS_INDEX cblas_izamax(const int N, const void *X, const int incX); + +/* + * =========================================================================== + * Prototypes for level 1 BLAS routines + * =========================================================================== + */ + +/* + * Routines with standard 4 prefixes (s, d, c, z) + */ +void cblas_sswap(const int N, float *X, const int incX, + float *Y, const int incY); +void cblas_scopy(const int N, const float *X, const int incX, + float *Y, const int incY); +void cblas_saxpy(const int N, const float alpha, const float *X, + const int incX, float *Y, const int incY); + +void cblas_dswap(const int N, double *X, const int incX, + double *Y, const int incY); +void cblas_dcopy(const int N, const double *X, const int incX, + double *Y, const int incY); +void cblas_daxpy(const int N, const double alpha, const double *X, + const int incX, double *Y, const int incY); + +void cblas_cswap(const int N, void *X, const int incX, + void *Y, const int incY); +void cblas_ccopy(const int N, const void *X, const int incX, + void *Y, const int incY); +void cblas_caxpy(const int N, const void *alpha, const void *X, + const int incX, void *Y, const int incY); + +void 
cblas_zswap(const int N, void *X, const int incX, + void *Y, const int incY); +void cblas_zcopy(const int N, const void *X, const int incX, + void *Y, const int incY); +void cblas_zaxpy(const int N, const void *alpha, const void *X, + const int incX, void *Y, const int incY); + + +/* + * Routines with S and D prefix only + */ +void cblas_srotg(float *a, float *b, float *c, float *s); +void cblas_srotmg(float *d1, float *d2, float *b1, const float b2, float *P); +void cblas_srot(const int N, float *X, const int incX, + float *Y, const int incY, const float c, const float s); +void cblas_srotm(const int N, float *X, const int incX, + float *Y, const int incY, const float *P); + +void cblas_drotg(double *a, double *b, double *c, double *s); +void cblas_drotmg(double *d1, double *d2, double *b1, const double b2, double *P); +void cblas_drot(const int N, double *X, const int incX, + double *Y, const int incY, const double c, const double s); +void cblas_drotm(const int N, double *X, const int incX, + double *Y, const int incY, const double *P); + + +/* + * Routines with S D C Z CS and ZD prefixes + */ +void cblas_sscal(const int N, const float alpha, float *X, const int incX); +void cblas_dscal(const int N, const double alpha, double *X, const int incX); +void cblas_cscal(const int N, const void *alpha, void *X, const int incX); +void cblas_zscal(const int N, const void *alpha, void *X, const int incX); +void cblas_csscal(const int N, const float alpha, void *X, const int incX); +void cblas_zdscal(const int N, const double alpha, void *X, const int incX); + +/* + * =========================================================================== + * Prototypes for level 2 BLAS + * =========================================================================== + */ + +/* + * Routines with standard 4 prefixes (S, D, C, Z) + */ +void cblas_sgemv(const enum CBLAS_ORDER order, + const enum CBLAS_TRANSPOSE TransA, const int M, const int N, + const float alpha, const float *A, const int 
lda, + const float *X, const int incX, const float beta, + float *Y, const int incY); +void cblas_sgbmv(const enum CBLAS_ORDER order, + const enum CBLAS_TRANSPOSE TransA, const int M, const int N, + const int KL, const int KU, const float alpha, + const float *A, const int lda, const float *X, + const int incX, const float beta, float *Y, const int incY); +void cblas_strmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const float *A, const int lda, + float *X, const int incX); +void cblas_stbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const int K, const float *A, const int lda, + float *X, const int incX); +void cblas_stpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const float *Ap, float *X, const int incX); +void cblas_strsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const float *A, const int lda, float *X, + const int incX); +void cblas_stbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const int K, const float *A, const int lda, + float *X, const int incX); +void cblas_stpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const float *Ap, float *X, const int incX); + +void cblas_dgemv(const enum CBLAS_ORDER order, + const enum CBLAS_TRANSPOSE TransA, const int M, const int N, + const double alpha, const double *A, const int lda, + const double *X, const int incX, const double beta, + double *Y, const int incY); +void cblas_dgbmv(const enum CBLAS_ORDER order, + const enum CBLAS_TRANSPOSE TransA, const int M, 
const int N, + const int KL, const int KU, const double alpha, + const double *A, const int lda, const double *X, + const int incX, const double beta, double *Y, const int incY); +void cblas_dtrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const double *A, const int lda, + double *X, const int incX); +void cblas_dtbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const int K, const double *A, const int lda, + double *X, const int incX); +void cblas_dtpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const double *Ap, double *X, const int incX); +void cblas_dtrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const double *A, const int lda, double *X, + const int incX); +void cblas_dtbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const int K, const double *A, const int lda, + double *X, const int incX); +void cblas_dtpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const double *Ap, double *X, const int incX); + +void cblas_cgemv(const enum CBLAS_ORDER order, + const enum CBLAS_TRANSPOSE TransA, const int M, const int N, + const void *alpha, const void *A, const int lda, + const void *X, const int incX, const void *beta, + void *Y, const int incY); +void cblas_cgbmv(const enum CBLAS_ORDER order, + const enum CBLAS_TRANSPOSE TransA, const int M, const int N, + const int KL, const int KU, const void *alpha, + const void *A, const int lda, const void *X, + const int incX, const void *beta, void *Y, const int incY); +void 
cblas_ctrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const void *A, const int lda, + void *X, const int incX); +void cblas_ctbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const int K, const void *A, const int lda, + void *X, const int incX); +void cblas_ctpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const void *Ap, void *X, const int incX); +void cblas_ctrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const void *A, const int lda, void *X, + const int incX); +void cblas_ctbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const int K, const void *A, const int lda, + void *X, const int incX); +void cblas_ctpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const void *Ap, void *X, const int incX); + +void cblas_zgemv(const enum CBLAS_ORDER order, + const enum CBLAS_TRANSPOSE TransA, const int M, const int N, + const void *alpha, const void *A, const int lda, + const void *X, const int incX, const void *beta, + void *Y, const int incY); +void cblas_zgbmv(const enum CBLAS_ORDER order, + const enum CBLAS_TRANSPOSE TransA, const int M, const int N, + const int KL, const int KU, const void *alpha, + const void *A, const int lda, const void *X, + const int incX, const void *beta, void *Y, const int incY); +void cblas_ztrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const void *A, const int lda, + void *X, const int incX); 
+void cblas_ztbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const int K, const void *A, const int lda, + void *X, const int incX); +void cblas_ztpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const void *Ap, void *X, const int incX); +void cblas_ztrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const void *A, const int lda, void *X, + const int incX); +void cblas_ztbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const int K, const void *A, const int lda, + void *X, const int incX); +void cblas_ztpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, + const int N, const void *Ap, void *X, const int incX); + + +/* + * Routines with S and D prefixes only + */ +void cblas_ssymv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const float alpha, const float *A, + const int lda, const float *X, const int incX, + const float beta, float *Y, const int incY); +void cblas_ssbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const int K, const float alpha, const float *A, + const int lda, const float *X, const int incX, + const float beta, float *Y, const int incY); +void cblas_sspmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const float alpha, const float *Ap, + const float *X, const int incX, + const float beta, float *Y, const int incY); +void cblas_sger(const enum CBLAS_ORDER order, const int M, const int N, + const float alpha, const float *X, const int incX, + const float *Y, const int incY, float *A, const int lda); +void cblas_ssyr(const enum 
CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const float alpha, const float *X, + const int incX, float *A, const int lda); +void cblas_sspr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const float alpha, const float *X, + const int incX, float *Ap); +void cblas_ssyr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const float alpha, const float *X, + const int incX, const float *Y, const int incY, float *A, + const int lda); +void cblas_sspr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const float alpha, const float *X, + const int incX, const float *Y, const int incY, float *A); + +void cblas_dsymv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const double alpha, const double *A, + const int lda, const double *X, const int incX, + const double beta, double *Y, const int incY); +void cblas_dsbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const int K, const double alpha, const double *A, + const int lda, const double *X, const int incX, + const double beta, double *Y, const int incY); +void cblas_dspmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const double alpha, const double *Ap, + const double *X, const int incX, + const double beta, double *Y, const int incY); +void cblas_dger(const enum CBLAS_ORDER order, const int M, const int N, + const double alpha, const double *X, const int incX, + const double *Y, const int incY, double *A, const int lda); +void cblas_dsyr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const double alpha, const double *X, + const int incX, double *A, const int lda); +void cblas_dspr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const double alpha, const double *X, + const int incX, double *Ap); +void cblas_dsyr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const double alpha, 
const double *X, + const int incX, const double *Y, const int incY, double *A, + const int lda); +void cblas_dspr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const double alpha, const double *X, + const int incX, const double *Y, const int incY, double *A); + + +/* + * Routines with C and Z prefixes only + */ +void cblas_chemv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const void *alpha, const void *A, + const int lda, const void *X, const int incX, + const void *beta, void *Y, const int incY); +void cblas_chbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const int K, const void *alpha, const void *A, + const int lda, const void *X, const int incX, + const void *beta, void *Y, const int incY); +void cblas_chpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const void *alpha, const void *Ap, + const void *X, const int incX, + const void *beta, void *Y, const int incY); +void cblas_cgeru(const enum CBLAS_ORDER order, const int M, const int N, + const void *alpha, const void *X, const int incX, + const void *Y, const int incY, void *A, const int lda); +void cblas_cgerc(const enum CBLAS_ORDER order, const int M, const int N, + const void *alpha, const void *X, const int incX, + const void *Y, const int incY, void *A, const int lda); +void cblas_cher(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const float alpha, const void *X, const int incX, + void *A, const int lda); +void cblas_chpr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const float alpha, const void *X, + const int incX, void *A); +void cblas_cher2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const int N, + const void *alpha, const void *X, const int incX, + const void *Y, const int incY, void *A, const int lda); +void cblas_chpr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const int N, + const void *alpha, const 
void *X, const int incX, + const void *Y, const int incY, void *Ap); + +void cblas_zhemv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const void *alpha, const void *A, + const int lda, const void *X, const int incX, + const void *beta, void *Y, const int incY); +void cblas_zhbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const int K, const void *alpha, const void *A, + const int lda, const void *X, const int incX, + const void *beta, void *Y, const int incY); +void cblas_zhpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const void *alpha, const void *Ap, + const void *X, const int incX, + const void *beta, void *Y, const int incY); +void cblas_zgeru(const enum CBLAS_ORDER order, const int M, const int N, + const void *alpha, const void *X, const int incX, + const void *Y, const int incY, void *A, const int lda); +void cblas_zgerc(const enum CBLAS_ORDER order, const int M, const int N, + const void *alpha, const void *X, const int incX, + const void *Y, const int incY, void *A, const int lda); +void cblas_zher(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const double alpha, const void *X, const int incX, + void *A, const int lda); +void cblas_zhpr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, + const int N, const double alpha, const void *X, + const int incX, void *A); +void cblas_zher2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const int N, + const void *alpha, const void *X, const int incX, + const void *Y, const int incY, void *A, const int lda); +void cblas_zhpr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const int N, + const void *alpha, const void *X, const int incX, + const void *Y, const int incY, void *Ap); + +/* + * =========================================================================== + * Prototypes for level 3 BLAS + * =========================================================================== + 
*/ + +/* + * Routines with standard 4 prefixes (S, D, C, Z) + */ +void cblas_sgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_TRANSPOSE TransB, const int M, const int N, + const int K, const float alpha, const float *A, + const int lda, const float *B, const int ldb, + const float beta, float *C, const int ldc); +void cblas_ssymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const int M, const int N, + const float alpha, const float *A, const int lda, + const float *B, const int ldb, const float beta, + float *C, const int ldc); +void cblas_ssyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const float alpha, const float *A, const int lda, + const float beta, float *C, const int ldc); +void cblas_ssyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const float alpha, const float *A, const int lda, + const float *B, const int ldb, const float beta, + float *C, const int ldc); +void cblas_strmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_DIAG Diag, const int M, const int N, + const float alpha, const float *A, const int lda, + float *B, const int ldb); +void cblas_strsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_DIAG Diag, const int M, const int N, + const float alpha, const float *A, const int lda, + float *B, const int ldb); + +void cblas_dgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_TRANSPOSE TransB, const int M, const int N, + const int K, const double alpha, const double *A, + const int lda, const double *B, const int ldb, + const double beta, double *C, const int ldc); +void cblas_dsymm(const 
enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const int M, const int N, + const double alpha, const double *A, const int lda, + const double *B, const int ldb, const double beta, + double *C, const int ldc); +void cblas_dsyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const double alpha, const double *A, const int lda, + const double beta, double *C, const int ldc); +void cblas_dsyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const double alpha, const double *A, const int lda, + const double *B, const int ldb, const double beta, + double *C, const int ldc); +void cblas_dtrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_DIAG Diag, const int M, const int N, + const double alpha, const double *A, const int lda, + double *B, const int ldb); +void cblas_dtrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_DIAG Diag, const int M, const int N, + const double alpha, const double *A, const int lda, + double *B, const int ldb); + +void cblas_cgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_TRANSPOSE TransB, const int M, const int N, + const int K, const void *alpha, const void *A, + const int lda, const void *B, const int ldb, + const void *beta, void *C, const int ldc); +void cblas_csymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const int M, const int N, + const void *alpha, const void *A, const int lda, + const void *B, const int ldb, const void *beta, + void *C, const int ldc); +void cblas_csyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const 
int K, + const void *alpha, const void *A, const int lda, + const void *beta, void *C, const int ldc); +void cblas_csyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const void *alpha, const void *A, const int lda, + const void *B, const int ldb, const void *beta, + void *C, const int ldc); +void cblas_ctrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_DIAG Diag, const int M, const int N, + const void *alpha, const void *A, const int lda, + void *B, const int ldb); +void cblas_ctrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_DIAG Diag, const int M, const int N, + const void *alpha, const void *A, const int lda, + void *B, const int ldb); + +void cblas_zgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_TRANSPOSE TransB, const int M, const int N, + const int K, const void *alpha, const void *A, + const int lda, const void *B, const int ldb, + const void *beta, void *C, const int ldc); +void cblas_zsymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const int M, const int N, + const void *alpha, const void *A, const int lda, + const void *B, const int ldb, const void *beta, + void *C, const int ldc); +void cblas_zsyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const void *alpha, const void *A, const int lda, + const void *beta, void *C, const int ldc); +void cblas_zsyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const void *alpha, const void *A, const int lda, + const void *B, const int ldb, const void *beta, + void *C, const int ldc); +void cblas_ztrmm(const enum 
CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_DIAG Diag, const int M, const int N, + const void *alpha, const void *A, const int lda, + void *B, const int ldb); +void cblas_ztrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, + const enum CBLAS_DIAG Diag, const int M, const int N, + const void *alpha, const void *A, const int lda, + void *B, const int ldb); + + +/* + * Routines with prefixes C and Z only + */ +void cblas_chemm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const int M, const int N, + const void *alpha, const void *A, const int lda, + const void *B, const int ldb, const void *beta, + void *C, const int ldc); +void cblas_cherk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const float alpha, const void *A, const int lda, + const float beta, void *C, const int ldc); +void cblas_cher2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const void *alpha, const void *A, const int lda, + const void *B, const int ldb, const float beta, + void *C, const int ldc); + +void cblas_zhemm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, + const enum CBLAS_UPLO Uplo, const int M, const int N, + const void *alpha, const void *A, const int lda, + const void *B, const int ldb, const void *beta, + void *C, const int ldc); +void cblas_zherk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const double alpha, const void *A, const int lda, + const double beta, void *C, const int ldc); +void cblas_zher2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, + const enum CBLAS_TRANSPOSE Trans, const int N, const int K, + const void *alpha, const 
void *A, const int lda, + const void *B, const int ldb, const double beta, + void *C, const int ldc); + +void cblas_xerbla(int p, const char *rout, const char *form, ...); + +#ifdef __cplusplus +} +#endif + +#endif From 0ec6dca56a70a4399de369973b29e14f74bd98df Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Mon, 18 Apr 2016 12:35:56 -0700 Subject: [PATCH 305/630] Oh, it really does call itself `libmxnet.so` on non-linux platforms too --- deps/build.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 5a4073537bf2..ed77726f7051 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -6,7 +6,7 @@ libmxnet_detected = false if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") info("Trying to load existing libmxnet...") - lib = Libdl.find_library(["libmxnet"], ["$(ENV["MXNET_HOME"])/lib"]) + lib = Libdl.find_library(["libmxnet", "libmxnet.so"], ["$(ENV["MXNET_HOME"])/lib"]) if !isempty(lib) info("Existing libmxnet detected at $lib, skip building...") libmxnet_detected = true @@ -32,7 +32,7 @@ if !libmxnet_detected #-------------------------------------------------------------------------------- # Build libmxnet - mxnet = library_dependency("mxnet", aliases=["libmxnet"]) + mxnet = library_dependency("mxnet", aliases=["libmxnet", "libmxnet.so"]) _prefix = joinpath(BinDeps.depsdir(mxnet), "usr") _srcdir = joinpath(BinDeps.depsdir(mxnet),"src") From 60c16e22840ec5cac8f2df0e5049326034994e44 Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Mon, 18 Apr 2016 14:42:50 -0700 Subject: [PATCH 306/630] Cut down cblas.h to only the stuff we need, make this work on ILP64 --- deps/build.jl | 6 + deps/cblas.h | 605 +++++--------------------------------------------- 2 files changed, 58 insertions(+), 553 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index ed77726f7051..bddecb135dde 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -30,6 +30,11 @@ if !libmxnet_detected openblas_path = 
Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) + ilp64 = "" + if Base.blas_vendor() == :openblas64 + ilp64 = "-DINTERFACE64" + end + #-------------------------------------------------------------------------------- # Build libmxnet mxnet = library_dependency("mxnet", aliases=["libmxnet", "libmxnet.so"]) @@ -51,6 +56,7 @@ if !libmxnet_detected `cp make/config.mk config.mk` @osx_only `cp make/osx.mk config.mk` `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` + `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` `cp ../../cblas.h include/cblas.h` `make USE_BLAS=openblas MSHADOW_LDFLAGS="$openblas_path" -j` `cp lib/libmxnet.so $_libdir` diff --git a/deps/cblas.h b/deps/cblas.h index 941b570c78de..c08fb5f6af9d 100644 --- a/deps/cblas.h +++ b/deps/cblas.h @@ -1,580 +1,79 @@ #ifndef CBLAS_H #define CBLAS_H -#include <stddef.h> - -// This header file copied from the Netlib libblas distribution package - -/* Allow the use in C++ code. */ -#ifdef __cplusplus -extern "C" -{ -#endif /* - * Enumerated and derived types - */ -#define CBLAS_INDEX size_t /* this may vary between platforms */ - -enum CBLAS_ORDER {CblasRowMajor=101, CblasColMajor=102}; -enum CBLAS_TRANSPOSE {CblasNoTrans=111, CblasTrans=112, CblasConjTrans=113}; -enum CBLAS_UPLO {CblasUpper=121, CblasLower=122}; -enum CBLAS_DIAG {CblasNonUnit=131, CblasUnit=132}; -enum CBLAS_SIDE {CblasLeft=141, CblasRight=142}; - -/* - * =========================================================================== - * Prototypes for level 1 BLAS functions (complex are recast as routines) - * =========================================================================== - */ -float cblas_sdsdot(const int N, const float alpha, const float *X, - const int incX, const float *Y, const int incY); -double cblas_dsdot(const int N, const float *X, const int incX, const float *Y, - const int incY); -float cblas_sdot(const int N, const float *X, const int incX, - const float *Y, const int incY); -double 
cblas_ddot(const int N, const double *X, const int incX, - const double *Y, const int incY); - -/* - * Functions having prefixes Z and C only - */ -void cblas_cdotu_sub(const int N, const void *X, const int incX, - const void *Y, const int incY, void *dotu); -void cblas_cdotc_sub(const int N, const void *X, const int incX, - const void *Y, const int incY, void *dotc); - -void cblas_zdotu_sub(const int N, const void *X, const int incX, - const void *Y, const int incY, void *dotu); -void cblas_zdotc_sub(const int N, const void *X, const int incX, - const void *Y, const int incY, void *dotc); - - -/* - * Functions having prefixes S D SC DZ - */ -float cblas_snrm2(const int N, const float *X, const int incX); -float cblas_sasum(const int N, const float *X, const int incX); - -double cblas_dnrm2(const int N, const double *X, const int incX); -double cblas_dasum(const int N, const double *X, const int incX); - -float cblas_scnrm2(const int N, const void *X, const int incX); -float cblas_scasum(const int N, const void *X, const int incX); - -double cblas_dznrm2(const int N, const void *X, const int incX); -double cblas_dzasum(const int N, const void *X, const int incX); - - -/* - * Functions having standard 4 prefixes (S D C Z) - */ -CBLAS_INDEX cblas_isamax(const int N, const float *X, const int incX); -CBLAS_INDEX cblas_idamax(const int N, const double *X, const int incX); -CBLAS_INDEX cblas_icamax(const int N, const void *X, const int incX); -CBLAS_INDEX cblas_izamax(const int N, const void *X, const int incX); - -/* - * =========================================================================== - * Prototypes for level 1 BLAS routines - * =========================================================================== - */ - -/* - * Routines with standard 4 prefixes (s, d, c, z) + * This file modified from the OpenBLAS repository, */ -void cblas_sswap(const int N, float *X, const int incX, - float *Y, const int incY); -void cblas_scopy(const int N, const float *X, const 
int incX, - float *Y, const int incY); -void cblas_saxpy(const int N, const float alpha, const float *X, - const int incX, float *Y, const int incY); -void cblas_dswap(const int N, double *X, const int incX, - double *Y, const int incY); -void cblas_dcopy(const int N, const double *X, const int incX, - double *Y, const int incY); -void cblas_daxpy(const int N, const double alpha, const double *X, - const int incX, double *Y, const int incY); - -void cblas_cswap(const int N, void *X, const int incX, - void *Y, const int incY); -void cblas_ccopy(const int N, const void *X, const int incX, - void *Y, const int incY); -void cblas_caxpy(const int N, const void *alpha, const void *X, - const int incX, void *Y, const int incY); - -void cblas_zswap(const int N, void *X, const int incX, - void *Y, const int incY); -void cblas_zcopy(const int N, const void *X, const int incX, - void *Y, const int incY); -void cblas_zaxpy(const int N, const void *alpha, const void *X, - const int incX, void *Y, const int incY); - - -/* - * Routines with S and D prefix only - */ -void cblas_srotg(float *a, float *b, float *c, float *s); -void cblas_srotmg(float *d1, float *d2, float *b1, const float b2, float *P); -void cblas_srot(const int N, float *X, const int incX, - float *Y, const int incY, const float c, const float s); -void cblas_srotm(const int N, float *X, const int incX, - float *Y, const int incY, const float *P); - -void cblas_drotg(double *a, double *b, double *c, double *s); -void cblas_drotmg(double *d1, double *d2, double *b1, const double b2, double *P); -void cblas_drot(const int N, double *X, const int incX, - double *Y, const int incY, const double c, const double s); -void cblas_drotm(const int N, double *X, const int incX, - double *Y, const int incY, const double *P); +#include <stddef.h> +#ifdef __cplusplus +extern "C" { + /* Assume C declarations for C++ */ +#endif /* __cplusplus */ -/* - * Routines with S D C Z CS and ZD prefixes - */ -void cblas_sscal(const int N, const float
alpha, float *X, const int incX); -void cblas_dscal(const int N, const double alpha, double *X, const int incX); -void cblas_cscal(const int N, const void *alpha, void *X, const int incX); -void cblas_zscal(const int N, const void *alpha, void *X, const int incX); -void cblas_csscal(const int N, const float alpha, void *X, const int incX); -void cblas_zdscal(const int N, const double alpha, void *X, const int incX); /* - * =========================================================================== - * Prototypes for level 2 BLAS - * =========================================================================== - */ - -/* - * Routines with standard 4 prefixes (S, D, C, Z) - */ -void cblas_sgemv(const enum CBLAS_ORDER order, - const enum CBLAS_TRANSPOSE TransA, const int M, const int N, - const float alpha, const float *A, const int lda, - const float *X, const int incX, const float beta, - float *Y, const int incY); -void cblas_sgbmv(const enum CBLAS_ORDER order, - const enum CBLAS_TRANSPOSE TransA, const int M, const int N, - const int KL, const int KU, const float alpha, - const float *A, const int lda, const float *X, - const int incX, const float beta, float *Y, const int incY); -void cblas_strmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const float *A, const int lda, - float *X, const int incX); -void cblas_stbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const int K, const float *A, const int lda, - float *X, const int incX); -void cblas_stpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const float *Ap, float *X, const int incX); -void cblas_strsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, 
const float *A, const int lda, float *X, - const int incX); -void cblas_stbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const int K, const float *A, const int lda, - float *X, const int incX); -void cblas_stpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const float *Ap, float *X, const int incX); - -void cblas_dgemv(const enum CBLAS_ORDER order, - const enum CBLAS_TRANSPOSE TransA, const int M, const int N, - const double alpha, const double *A, const int lda, - const double *X, const int incX, const double beta, - double *Y, const int incY); -void cblas_dgbmv(const enum CBLAS_ORDER order, - const enum CBLAS_TRANSPOSE TransA, const int M, const int N, - const int KL, const int KU, const double alpha, - const double *A, const int lda, const double *X, - const int incX, const double beta, double *Y, const int incY); -void cblas_dtrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const double *A, const int lda, - double *X, const int incX); -void cblas_dtbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const int K, const double *A, const int lda, - double *X, const int incX); -void cblas_dtpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const double *Ap, double *X, const int incX); -void cblas_dtrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const double *A, const int lda, double *X, - const int incX); -void cblas_dtbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, 
const enum CBLAS_DIAG Diag, - const int N, const int K, const double *A, const int lda, - double *X, const int incX); -void cblas_dtpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const double *Ap, double *X, const int incX); - -void cblas_cgemv(const enum CBLAS_ORDER order, - const enum CBLAS_TRANSPOSE TransA, const int M, const int N, - const void *alpha, const void *A, const int lda, - const void *X, const int incX, const void *beta, - void *Y, const int incY); -void cblas_cgbmv(const enum CBLAS_ORDER order, - const enum CBLAS_TRANSPOSE TransA, const int M, const int N, - const int KL, const int KU, const void *alpha, - const void *A, const int lda, const void *X, - const int incX, const void *beta, void *Y, const int incY); -void cblas_ctrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const void *A, const int lda, - void *X, const int incX); -void cblas_ctbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const int K, const void *A, const int lda, - void *X, const int incX); -void cblas_ctpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const void *Ap, void *X, const int incX); -void cblas_ctrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const void *A, const int lda, void *X, - const int incX); -void cblas_ctbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const int K, const void *A, const int lda, - void *X, const int incX); -void cblas_ctpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const 
enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const void *Ap, void *X, const int incX); - -void cblas_zgemv(const enum CBLAS_ORDER order, - const enum CBLAS_TRANSPOSE TransA, const int M, const int N, - const void *alpha, const void *A, const int lda, - const void *X, const int incX, const void *beta, - void *Y, const int incY); -void cblas_zgbmv(const enum CBLAS_ORDER order, - const enum CBLAS_TRANSPOSE TransA, const int M, const int N, - const int KL, const int KU, const void *alpha, - const void *A, const int lda, const void *X, - const int incX, const void *beta, void *Y, const int incY); -void cblas_ztrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const void *A, const int lda, - void *X, const int incX); -void cblas_ztbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const int K, const void *A, const int lda, - void *X, const int incX); -void cblas_ztpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const void *Ap, void *X, const int incX); -void cblas_ztrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const void *A, const int lda, void *X, - const int incX); -void cblas_ztbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const int K, const void *A, const int lda, - void *X, const int incX); -void cblas_ztpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE TransA, const enum CBLAS_DIAG Diag, - const int N, const void *Ap, void *X, const int incX); - - -/* - * Routines with S and D prefixes only - */ -void cblas_ssymv(const enum CBLAS_ORDER 
order, const enum CBLAS_UPLO Uplo, - const int N, const float alpha, const float *A, - const int lda, const float *X, const int incX, - const float beta, float *Y, const int incY); -void cblas_ssbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const int K, const float alpha, const float *A, - const int lda, const float *X, const int incX, - const float beta, float *Y, const int incY); -void cblas_sspmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const float alpha, const float *Ap, - const float *X, const int incX, - const float beta, float *Y, const int incY); -void cblas_sger(const enum CBLAS_ORDER order, const int M, const int N, - const float alpha, const float *X, const int incX, - const float *Y, const int incY, float *A, const int lda); -void cblas_ssyr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const float alpha, const float *X, - const int incX, float *A, const int lda); -void cblas_sspr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const float alpha, const float *X, - const int incX, float *Ap); -void cblas_ssyr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const float alpha, const float *X, - const int incX, const float *Y, const int incY, float *A, - const int lda); -void cblas_sspr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const float alpha, const float *X, - const int incX, const float *Y, const int incY, float *A); - -void cblas_dsymv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const double alpha, const double *A, - const int lda, const double *X, const int incX, - const double beta, double *Y, const int incY); -void cblas_dsbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const int K, const double alpha, const double *A, - const int lda, const double *X, const int incX, - const double beta, double *Y, const int incY); -void 
cblas_dspmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const double alpha, const double *Ap, - const double *X, const int incX, - const double beta, double *Y, const int incY); -void cblas_dger(const enum CBLAS_ORDER order, const int M, const int N, - const double alpha, const double *X, const int incX, - const double *Y, const int incY, double *A, const int lda); -void cblas_dsyr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const double alpha, const double *X, - const int incX, double *A, const int lda); -void cblas_dspr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const double alpha, const double *X, - const int incX, double *Ap); -void cblas_dsyr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const double alpha, const double *X, - const int incX, const double *Y, const int incY, double *A, - const int lda); -void cblas_dspr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const double alpha, const double *X, - const int incX, const double *Y, const int incY, double *A); - - -/* - * Routines with C and Z prefixes only + * Since all of GotoBlas was written without const, + * we disable it at build time. 
*/ -void cblas_chemv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const void *alpha, const void *A, - const int lda, const void *X, const int incX, - const void *beta, void *Y, const int incY); -void cblas_chbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const int K, const void *alpha, const void *A, - const int lda, const void *X, const int incX, - const void *beta, void *Y, const int incY); -void cblas_chpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const void *alpha, const void *Ap, - const void *X, const int incX, - const void *beta, void *Y, const int incY); -void cblas_cgeru(const enum CBLAS_ORDER order, const int M, const int N, - const void *alpha, const void *X, const int incX, - const void *Y, const int incY, void *A, const int lda); -void cblas_cgerc(const enum CBLAS_ORDER order, const int M, const int N, - const void *alpha, const void *X, const int incX, - const void *Y, const int incY, void *A, const int lda); -void cblas_cher(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const float alpha, const void *X, const int incX, - void *A, const int lda); -void cblas_chpr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const float alpha, const void *X, - const int incX, void *A); -void cblas_cher2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const int N, - const void *alpha, const void *X, const int incX, - const void *Y, const int incY, void *A, const int lda); -void cblas_chpr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const int N, - const void *alpha, const void *X, const int incX, - const void *Y, const int incY, void *Ap); - -void cblas_zhemv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const void *alpha, const void *A, - const int lda, const void *X, const int incX, - const void *beta, void *Y, const int incY); -void cblas_zhbmv(const enum CBLAS_ORDER order, 
const enum CBLAS_UPLO Uplo, - const int N, const int K, const void *alpha, const void *A, - const int lda, const void *X, const int incX, - const void *beta, void *Y, const int incY); -void cblas_zhpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const void *alpha, const void *Ap, - const void *X, const int incX, - const void *beta, void *Y, const int incY); -void cblas_zgeru(const enum CBLAS_ORDER order, const int M, const int N, - const void *alpha, const void *X, const int incX, - const void *Y, const int incY, void *A, const int lda); -void cblas_zgerc(const enum CBLAS_ORDER order, const int M, const int N, - const void *alpha, const void *X, const int incX, - const void *Y, const int incY, void *A, const int lda); -void cblas_zher(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const double alpha, const void *X, const int incX, - void *A, const int lda); -void cblas_zhpr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, - const int N, const double alpha, const void *X, - const int incX, void *A); -void cblas_zher2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const int N, - const void *alpha, const void *X, const int incX, - const void *Y, const int incY, void *A, const int lda); -void cblas_zhpr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const int N, - const void *alpha, const void *X, const int incX, - const void *Y, const int incY, void *Ap); +#ifndef OPENBLAS_CONST +# define OPENBLAS_CONST const +#endif /* - * =========================================================================== - * Prototypes for level 3 BLAS - * =========================================================================== + * Add definitions for BLASLONG and blasint */ -/* - * Routines with standard 4 prefixes (S, D, C, Z) - */ -void cblas_sgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_TRANSPOSE TransB, const int M, const int N, - const int K, const 
float alpha, const float *A, - const int lda, const float *B, const int ldb, - const float beta, float *C, const int ldc); -void cblas_ssymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const int M, const int N, - const float alpha, const float *A, const int lda, - const float *B, const int ldb, const float beta, - float *C, const int ldc); -void cblas_ssyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const float alpha, const float *A, const int lda, - const float beta, float *C, const int ldc); -void cblas_ssyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const float alpha, const float *A, const int lda, - const float *B, const int ldb, const float beta, - float *C, const int ldc); -void cblas_strmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_DIAG Diag, const int M, const int N, - const float alpha, const float *A, const int lda, - float *B, const int ldb); -void cblas_strsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_DIAG Diag, const int M, const int N, - const float alpha, const float *A, const int lda, - float *B, const int ldb); +#if defined(OS_WINDOWS) && defined(__64BIT__) +typedef long long BLASLONG; +typedef unsigned long long BLASULONG; +#else +typedef long BLASLONG; +typedef unsigned long BLASULONG; +#endif -void cblas_dgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_TRANSPOSE TransB, const int M, const int N, - const int K, const double alpha, const double *A, - const int lda, const double *B, const int ldb, - const double beta, double *C, const int ldc); -void cblas_dsymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE 
Side, - const enum CBLAS_UPLO Uplo, const int M, const int N, - const double alpha, const double *A, const int lda, - const double *B, const int ldb, const double beta, - double *C, const int ldc); -void cblas_dsyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const double alpha, const double *A, const int lda, - const double beta, double *C, const int ldc); -void cblas_dsyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const double alpha, const double *A, const int lda, - const double *B, const int ldb, const double beta, - double *C, const int ldc); -void cblas_dtrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_DIAG Diag, const int M, const int N, - const double alpha, const double *A, const int lda, - double *B, const int ldb); -void cblas_dtrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_DIAG Diag, const int M, const int N, - const double alpha, const double *A, const int lda, - double *B, const int ldb); +#ifdef INTERFACE64 +typedef BLASLONG blasint; +#else +typedef int blasint; +#endif -void cblas_cgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_TRANSPOSE TransB, const int M, const int N, - const int K, const void *alpha, const void *A, - const int lda, const void *B, const int ldb, - const void *beta, void *C, const int ldc); -void cblas_csymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const int M, const int N, - const void *alpha, const void *A, const int lda, - const void *B, const int ldb, const void *beta, - void *C, const int ldc); -void cblas_csyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum 
CBLAS_TRANSPOSE Trans, const int N, const int K, - const void *alpha, const void *A, const int lda, - const void *beta, void *C, const int ldc); -void cblas_csyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const void *alpha, const void *A, const int lda, - const void *B, const int ldb, const void *beta, - void *C, const int ldc); -void cblas_ctrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_DIAG Diag, const int M, const int N, - const void *alpha, const void *A, const int lda, - void *B, const int ldb); -void cblas_ctrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_DIAG Diag, const int M, const int N, - const void *alpha, const void *A, const int lda, - void *B, const int ldb); +#ifdef INTERFACE64 +#define cblas_sgemm cblas_sgemm64_ +#define cblas_sgemv cblas_sgemv64_ +#define cblas_sger cblas_sger64_ +#define cblas_dgemm cblas_dgemm64_ +#define cblas_dgemv cblas_dgemv64_ +#define cblas_dger cblas_dger64_ +#define dblas_sdot cblas_sdot64_ +#define dblas_ddot cblas_ddot64_ +#endif -void cblas_zgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_TRANSPOSE TransB, const int M, const int N, - const int K, const void *alpha, const void *A, - const int lda, const void *B, const int ldb, - const void *beta, void *C, const int ldc); -void cblas_zsymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const int M, const int N, - const void *alpha, const void *A, const int lda, - const void *B, const int ldb, const void *beta, - void *C, const int ldc); -void cblas_zsyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const void *alpha, const void *A, const 
int lda, - const void *beta, void *C, const int ldc); -void cblas_zsyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const void *alpha, const void *A, const int lda, - const void *B, const int ldb, const void *beta, - void *C, const int ldc); -void cblas_ztrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_DIAG Diag, const int M, const int N, - const void *alpha, const void *A, const int lda, - void *B, const int ldb); -void cblas_ztrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE TransA, - const enum CBLAS_DIAG Diag, const int M, const int N, - const void *alpha, const void *A, const int lda, - void *B, const int ldb); +typedef enum CBLAS_ORDER {CblasRowMajor=101, CblasColMajor=102} CBLAS_ORDER; +typedef enum CBLAS_TRANSPOSE {CblasNoTrans=111, CblasTrans=112, CblasConjTrans=113, CblasConjNoTrans=114} CBLAS_TRANSPOSE; +typedef enum CBLAS_UPLO {CblasUpper=121, CblasLower=122} CBLAS_UPLO; +typedef enum CBLAS_DIAG {CblasNonUnit=131, CblasUnit=132} CBLAS_DIAG; +typedef enum CBLAS_SIDE {CblasLeft=141, CblasRight=142} CBLAS_SIDE; -/* - * Routines with prefixes C and Z only - */ -void cblas_chemm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const int M, const int N, - const void *alpha, const void *A, const int lda, - const void *B, const int ldb, const void *beta, - void *C, const int ldc); -void cblas_cherk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const float alpha, const void *A, const int lda, - const float beta, void *C, const int ldc); -void cblas_cher2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const void *alpha, const void 
*A, const int lda, - const void *B, const int ldb, const float beta, - void *C, const int ldc); +float cblas_sdot(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *y, OPENBLAS_CONST blasint incy); +double cblas_ddot(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double *y, OPENBLAS_CONST blasint incy); -void cblas_zhemm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, - const enum CBLAS_UPLO Uplo, const int M, const int N, - const void *alpha, const void *A, const int lda, - const void *B, const int ldb, const void *beta, - void *C, const int ldc); -void cblas_zherk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const double alpha, const void *A, const int lda, - const double beta, void *C, const int ldc); -void cblas_zher2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, - const enum CBLAS_TRANSPOSE Trans, const int N, const int K, - const void *alpha, const void *A, const int lda, - const void *B, const int ldb, const double beta, - void *C, const int ldc); +void cblas_sgemv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE trans, OPENBLAS_CONST blasint m, OPENBLAS_CONST blasint n, + OPENBLAS_CONST float alpha, OPENBLAS_CONST float *a, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float beta, float *y, OPENBLAS_CONST blasint incy); +void cblas_dgemv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE trans, OPENBLAS_CONST blasint m, OPENBLAS_CONST blasint n, + OPENBLAS_CONST double alpha, OPENBLAS_CONST double *a, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double beta, double *y, OPENBLAS_CONST blasint incy); +void cblas_sger (OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, 
OPENBLAS_CONST float alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *Y, OPENBLAS_CONST blasint incY, float *A, OPENBLAS_CONST blasint lda); +void cblas_dger (OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *Y, OPENBLAS_CONST blasint incY, double *A, OPENBLAS_CONST blasint lda); -void cblas_xerbla(int p, const char *rout, const char *form, ...); +void cblas_sgemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_dgemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double beta, double *C, OPENBLAS_CONST blasint ldc); #ifdef __cplusplus } -#endif +#endif /* __cplusplus */ #endif From 7f445b907443800cb24765cea3fbad272de1d8ae Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Mon, 18 Apr 2016 14:52:27 -0700 Subject: [PATCH 307/630] Fix typo --- deps/cblas.h | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/deps/cblas.h b/deps/cblas.h index c08fb5f6af9d..a99c8fc9920f 100644 --- a/deps/cblas.h +++ b/deps/cblas.h @@ -46,8 +46,8 @@ typedef int blasint; #define cblas_dgemm cblas_dgemm64_ #define cblas_dgemv cblas_dgemv64_ #define cblas_dger cblas_dger64_ -#define dblas_sdot cblas_sdot64_ -#define dblas_ddot 
cblas_ddot64_ +#define cblas_sdot cblas_sdot64_ +#define cblas_ddot cblas_ddot64_ #endif From 9474561cb95765410e9f5bacd5c4ad8b412ae30f Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Mon, 18 Apr 2016 14:56:43 -0700 Subject: [PATCH 308/630] More intelligent parallelized build --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index bddecb135dde..50fd0a907ae7 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -58,7 +58,7 @@ if !libmxnet_detected `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` `cp ../../cblas.h include/cblas.h` - `make USE_BLAS=openblas MSHADOW_LDFLAGS="$openblas_path" -j` + `make USE_BLAS=openblas MSHADOW_LDFLAGS="$openblas_path" -j$(max(1, CPU_CORES - 1))` `cp lib/libmxnet.so $_libdir` end) end From 39786c5904ec9ee912488eeb136682f9427afe08 Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Mon, 18 Apr 2016 15:58:57 -0700 Subject: [PATCH 309/630] Just remove parallel build, it's making Travis angry --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 50fd0a907ae7..e0e0a0e1388f 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -58,7 +58,7 @@ if !libmxnet_detected `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` `cp ../../cblas.h include/cblas.h` - `make USE_BLAS=openblas MSHADOW_LDFLAGS="$openblas_path" -j$(max(1, CPU_CORES - 1))` + `make USE_BLAS=openblas MSHADOW_LDFLAGS="$openblas_path"` `cp lib/libmxnet.so $_libdir` end) end From b38e2ccae4183b861f591db9f5a26b8ab1b94fc8 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 21 Apr 2016 09:35:35 -0400 Subject: [PATCH 310/630] update docs --- docs/api/io.rst | 4 +- docs/api/metric.rst | 10 ++ docs/api/ndarray.rst | 69 ++++++++++--- docs/api/symbolic-node.rst | 199 
+++++++++++++++++++++++++++++-------- 4 files changed, 229 insertions(+), 53 deletions(-) diff --git a/docs/api/io.rst b/docs/api/io.rst index 8ec67cf6d073..e5cb3ffb32e5 100644 --- a/docs/api/io.rst +++ b/docs/api/io.rst @@ -351,7 +351,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :param rand_crop: Augmentation Param: Whether to random crop on the image @@ -514,7 +514,7 @@ libmxnet data providers :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: long (non-negative), optional, default=4 + :type prefetch_buffer: , optional, default=4 :return: the constructed :class:`MXDataProvider`. diff --git a/docs/api/metric.rst b/docs/api/metric.rst index 966d682ba2b7..0f3cc2d81358 100644 --- a/docs/api/metric.rst +++ b/docs/api/metric.rst @@ -65,3 +65,13 @@ set. + +.. class:: MultiACE + + Averaged cross-entropy for classification. This is also known as logloss. + This variant keeps track of the different losses per class. + + Calculates the averaged cross entropy for multi-dimensional output. + + + diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst index b72f0faa5cfe..b94232b25e50 100644 --- a/docs/api/ndarray.rst +++ b/docs/api/ndarray.rst @@ -748,13 +748,13 @@ Internal APIs .. function:: _div(...) + Divide lhs by rhs - - :param lhs: Left operand to the function. + :param lhs: Left operand to the function :type lhs: NDArray - :param rhs: Right operand to the function. + :param rhs: Right operand to the function :type rhs: NDArray @@ -815,15 +815,45 @@ Internal APIs -.. function:: _minus(...) +.. function:: _maximum(...) + Elementwise max of lhs by rhs + :param lhs: Left operand to the function + :type lhs: NDArray - :param lhs: Left operand to the function. + + :param rhs: Right operand to the function + :type rhs: NDArray + + + + + +.. function:: _minimum(...)
+ + Elementwise min of lhs by rhs + + :param lhs: Left operand to the function :type lhs: NDArray - :param rhs: Right operand to the function. + :param rhs: Right operand to the function + :type rhs: NDArray + + + + + +.. function:: _minus(...) + + Minus lhs and rhs + + :param lhs: Left operand to the function + :type lhs: NDArray + + + :param rhs: Right operand to the function :type rhs: NDArray @@ -847,13 +877,13 @@ Internal APIs .. function:: _mul(...) + Multiply lhs and rhs - - :param lhs: Left operand to the function. + :param lhs: Left operand to the function :type lhs: NDArray - :param rhs: Right operand to the function. + :param rhs: Right operand to the function :type rhs: NDArray @@ -892,13 +922,13 @@ Internal APIs .. function:: _plus(...) + Add lhs and rhs - - :param lhs: Left operand to the function. + :param lhs: Left operand to the function :type lhs: NDArray - :param rhs: Right operand to the function. + :param rhs: Right operand to the function :type rhs: NDArray @@ -920,6 +950,21 @@ Internal APIs +.. function:: _power(...) + + Elementwise power(lhs, rhs) + + :param lhs: Left operand to the function + :type lhs: NDArray + + + :param rhs: Right operand to the function + :type rhs: NDArray + + + + + .. function:: _random_gaussian(...) diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst index e303afba21dc..125b391046cb 100644 --- a/docs/api/symbolic-node.rst +++ b/docs/api/symbolic-node.rst @@ -498,7 +498,7 @@ Public APIs .. function:: Embedding(...) - Get embedding for one-hot input + Get embedding for one-hot input. An n-dimensional input tensor will be transformed into a (n+1)-dimensional tensor, where a new dimension is added for the embedding results. :param data: Input data to the EmbeddingOp. :type data: SymbolicNode @@ -800,6 +800,10 @@ Public APIs :param axis: Dimension along which to slice. :type axis: int, optional, default='1' + + :param squeeze_axis: If true AND the sliced dimension becomes 1, squeeze that dimension. 
+ :type squeeze_axis: boolean, optional, default=False + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -963,8 +967,12 @@ Public APIs Take absolute value of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -979,8 +987,12 @@ Public APIs Take ceil value of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -995,8 +1007,12 @@ Public APIs Take cos of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. 
@@ -1011,8 +1027,12 @@ Public APIs Take exp of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -1027,8 +1047,12 @@ Public APIs Take floor value of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -1043,8 +1067,12 @@ Public APIs Take log of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -1059,8 +1087,12 @@ Public APIs Take round value of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. 
@@ -1075,8 +1107,12 @@ Public APIs Take rsqrt of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -1091,8 +1127,12 @@ Public APIs Take sign value of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -1107,8 +1147,12 @@ Public APIs Take sin of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -1123,8 +1167,12 @@ Public APIs Take sqrt of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. 
@@ -1139,8 +1187,32 @@ Public APIs Take square of the src - :param src: Source symbolic input to the function - :type src: SymbolicNode + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode + + :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. + :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. + + :return: . + + + + + +.. function:: transpose(...) + + Transpose the input matrix and return a new one + + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. @@ -1172,12 +1244,19 @@ Internal APIs .. function:: _Div(...) - Perform an elementwise div. + Multiply lhs by rhs + + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: SymbolicNode. + :return: . @@ -1209,12 +1288,19 @@ Internal APIs .. function:: _Maximum(...) - Perform an elementwise power. + Elementwise max of lhs by rhs + + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: SymbolicNode. + :return: . 
@@ -1246,12 +1332,19 @@ Internal APIs .. function:: _Minimum(...) - Perform an elementwise power. + Elementwise min of lhs by rhs + + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: SymbolicNode. + :return: . @@ -1283,12 +1376,19 @@ Internal APIs .. function:: _Minus(...) - Perform an elementwise minus. + Minus lhs and rhs + + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: SymbolicNode. + :return: . @@ -1320,12 +1420,19 @@ Internal APIs .. function:: _Mul(...) - Perform an elementwise mul. + Multiply lhs and rhs + + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: SymbolicNode. + :return: . @@ -1393,12 +1500,19 @@ Internal APIs .. function:: _Plus(...) - Perform an elementwise plus. + Add lhs and rhs + + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. 
- :return: SymbolicNode. + :return: . @@ -1430,12 +1544,19 @@ Internal APIs .. function:: _Power(...) - Perform an elementwise power. + Elementwise power(lhs, rhs) + + :param lhs: Left symbolic input to the function + :type lhs: SymbolicNode + + + :param rhs: Left symbolic input to the function + :type rhs: SymbolicNode :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - :return: SymbolicNode. + :return: . From bbe31513ade7cdf1db04ead6c7195d679e56d99e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sat, 23 Apr 2016 10:03:54 -0400 Subject: [PATCH 311/630] fix for upstream changes dmlc/mxnet#1857 --- src/symbolic-node.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index e83b94aeefa4..da0833242def 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -330,7 +330,7 @@ function .-(self :: SymbolicNode, arg :: Real) end function -(arg :: Real, self :: SymbolicNode) - _MinusScalar(self, scalar=arg, scalar_on_left=true) + _RMinusScalar(self, scalar=arg) end function .-(arg :: Real, self :: SymbolicNode) -(arg, self) @@ -373,7 +373,7 @@ function /(self :: SymbolicNode, arg :: Real) ./(self, arg) end function ./(arg :: Real, self :: SymbolicNode) - _DivScalar(self, scalar=arg, scalar_on_left=true) + _RDivScalar(self, scalar=arg) end import Base: .^, ^ From 4bf4037bc2344d507950216d74561c801970a6fe Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Mon, 25 Apr 2016 21:58:28 +0900 Subject: [PATCH 312/630] check if there are predefined weights and use them --- src/model.jl | 45 ++++++++++++++++++++++++++++++++------------- 1 file changed, 32 insertions(+), 13 deletions(-) diff --git a/src/model.jl b/src/model.jl index b823a342b529..3458e6a579fa 100644 --- a/src/model.jl +++ b/src/model.jl @@ -92,32 +92,51 @@ function init_model(self :: FeedForward, 
initializer :: AbstractInitializer; ove param_names = setdiff(arg_names, input_names) aux_names = list_auxiliary_states(self.arch) - arg_defined = true - aux_defined = true - arg_shapes, out_shapes, aux_shapes = infer_shape(self.arch; input_shapes...) + + # If target dict is not yet defined set a temporary one if !isdefined(self, :arg_params) - param_name_shapes = filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) - self.arg_params = Dict([name => empty(shape) for (name,shape) in param_name_shapes]) - arg_defined = false + self.arg_params = Dict{Symbol, NDArray}() end if !isdefined(self, :aux_params) - self.aux_params = Dict([name => empty(shape) for (name,shape) in zip(aux_names,aux_shapes)]) - aux_defined = false + self.aux_params = Dict{Symbol, NDArray}() + end + + arg_params = Dict{Symbol, NDArray}() + aux_params = Dict{Symbol, NDArray}() + + for (name, shape) in filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) + if haskey(self.arg_params, name) + shape == size(self.arg_params[name]) || error("Shape mismatch for $name.") + arg_params[name] = self.arg_params[name] + else + arg_params[name] = empty(shape) + end end - # initialize the contents of the parameters - if !arg_defined || overwrite - for (k,v) in self.arg_params + for (name, shape) in zip(aux_names, aux_shapes) + if haskey(self.aux_params, name) + shape == size(self.arg_params[name]) || error("Shape mismatch for $name.") + aux_params[name] = self.aux_params[name] + else + aux_params[name] = empty(shape) + end + end + + for (k,v) in arg_params + if overwrite || !haskey(self.arg_params, k) init(initializer, k, v) end end - if !aux_defined || overwrite - for (k,v) in self.aux_params + for (k,v) in aux_params + if overwrite || !haskey(self.aux_params, k) init(initializer, k, v) end end + self.arg_params = arg_params + self.aux_params = aux_params + return (arg_names, param_names, aux_names) end From 4c7a066ce4469479b96eb39ecbf7d0504bd6acbd Mon Sep 17 00:00:00 2001 From: Valentin 
Churavy Date: Mon, 25 Apr 2016 23:23:45 +0900 Subject: [PATCH 313/630] be more lenient in model loading --- src/model.jl | 24 ++++++++++++++++-------- 1 file changed, 16 insertions(+), 8 deletions(-) diff --git a/src/model.jl b/src/model.jl index 3458e6a579fa..683510b13854 100644 --- a/src/model.jl +++ b/src/model.jl @@ -107,20 +107,28 @@ function init_model(self :: FeedForward, initializer :: AbstractInitializer; ove for (name, shape) in filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) if haskey(self.arg_params, name) - shape == size(self.arg_params[name]) || error("Shape mismatch for $name.") - arg_params[name] = self.arg_params[name] - else - arg_params[name] = empty(shape) + if shape == size(self.arg_params[name]) + arg_params[name] = self.arg_params[name] + continue + else + warn("Shape mismatch for $name. Overwriting with new one.") + delete!(self.arg_params, name) + end end + arg_params[name] = empty(shape) end for (name, shape) in zip(aux_names, aux_shapes) if haskey(self.aux_params, name) - shape == size(self.arg_params[name]) || error("Shape mismatch for $name.") - aux_params[name] = self.aux_params[name] - else - aux_params[name] = empty(shape) + if shape == size(self.auxg_params[name]) + aux_params[name] = self.aux_params[name] + continue + else + warn("Shape mismatch for $name. 
Overwriting with new one.") + delete!(self.aux_params, name) + end end + aux_params[name] = empty(shape) end for (k,v) in arg_params From 98b7cf2341f3045e0babf1d274aec5cdb3c7df76 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 26 Apr 2016 12:54:40 +0900 Subject: [PATCH 314/630] add SymbolListAttr --- src/symbolic-node.jl | 25 ++++++++++++++++++++++++- test/unittest/symbolic-node.jl | 1 + 2 files changed, 25 insertions(+), 1 deletion(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index da0833242def..1ddc5e682319 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -132,7 +132,8 @@ function get_attr(self :: SymbolicNode, key :: Symbol) key_s = bytestring(string(key)) ref_out = Ref{Cstring}() ref_success = Ref{Cint}(-1) - @mxcall(:MXSymbolGetAttr, (MX_handle, Cstring, Ref{Cstring}, Ref{Cint}), self, key_s, ref_out, ref_success) + @mxcall(:MXSymbolGetAttr, (MX_handle, Cstring, Ref{Cstring}, Ref{Cint}), + self, key_s, ref_out, ref_success) if ref_success[] == 1 return Nullable{ByteString}(bytestring(ref_out[])) else @@ -140,6 +141,28 @@ function get_attr(self :: SymbolicNode, key :: Symbol) end end +#=doc +.. function: list_attr(self :: SymbolicNode) + + Get all attributes from symbol. + :return: Dictionary of attributes. +=# +function list_attr(self :: SymbolicNode) + ref_sz = Ref{MX_uint}(0) + ref_strings = Ref{char_pp}(0) + @mxcall(:MXSymbolListAttr, (MX_handle, Ref{MX_uint}, Ref{char_pp}), + self, ref_sz, ref_strings) + narg = 2*ref_sz[] + strings = pointer_to_array(ref_strings[], narg) + out = Dict{Symbol, ByteString}() + for i in 1:2:narg + key = symbol(bytestring(strings[i])) + value = bytestring(strings[i+1]) + out[key] = value + end + return out +end + #=doc .. 
function:: set_attr(self:: SymbolicNode, key :: Symbol, value :: AbstractString) diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index e5a5531845ec..825602723151 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -100,6 +100,7 @@ function test_attrs() @test isnull(mx.get_attr(conv, :b)) @test get(mx.get_attr(conv, :a)) == "a" @test get(mx.get_attr(conv, :π)) == "π" + @test mx.list_attr(conv) == Dict(:a => "a", :π => "π") @test_throws MethodError mx.Variable(:data3, attrs = Dict(:test => "1.0", :test2 => 1.0)) @test_throws MethodError mx.Convolution(data=data2, kernel = (1,1), num_filter = 1, attrs = Dict(:test => "1.0", :test2 => 1.0)) From b0fc16f117b1c6e12d5a5bab6550b0d298384c06 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 26 Apr 2016 15:16:42 +0900 Subject: [PATCH 315/630] get idx that need to be frozen --- src/model.jl | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/src/model.jl b/src/model.jl index 683510b13854..da54614ac935 100644 --- a/src/model.jl +++ b/src/model.jl @@ -430,6 +430,16 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # invoke callbacks on epoch 0 _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) + # get grad attribute to allow for freezing + freeze_names = Symbol[] + for (attr, value) in list_attr(self.arch) + sattr = string(attr) + if endswith(sattr, "grad") && value == "freeze" + push!(freeze_names, symbol(sattr[1:end-5])) + end + end + freeze_idx = filter(i -> in(arg_names[i], freeze_names), 1:length(arg_names)) + info("Start training...") for i_epoch = 1:opts.n_epoch time_start = time() From ce599a969e76c6dfeefed32c03e89b9b046d2b8d Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 26 Apr 2016 15:20:57 +0900 Subject: [PATCH 316/630] skip parameter update on frozen weights --- src/model.jl | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/model.jl b/src/model.jl index 
da54614ac935..7dede8d05206 100644 --- a/src/model.jl +++ b/src/model.jl @@ -473,6 +473,10 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # update parameters for idx = 1:length(param_names) + if in(idx, freeze_idx) + continue # Skip parameter update entirely + end + # gradient synchronization if !isa(kvstore, Void) # push gradient, priority is negative index From 9880bdf57b350b2602684446d3bfe0f3a2a0094b Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 26 Apr 2016 18:02:17 +0900 Subject: [PATCH 317/630] set GRAD_NOP for all frozen params --- src/executor.jl | 29 +++++++++++++++++++---------- src/model.jl | 32 +++++++++++++++++++++----------- 2 files changed, 40 insertions(+), 21 deletions(-) diff --git a/src/executor.jl b/src/executor.jl index 4c72589ae966..e4b943c0c764 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -128,22 +128,31 @@ function bind(self :: SymbolicNode; kwargs...) bind(self, context, args; kwargs...) end -function simple_bind(self :: SymbolicNode, ctx :: Context; grad_req :: GRAD_REQ=GRAD_WRITE, kwargs...) +function simple_bind(self :: SymbolicNode, ctx :: Context; + grad_req :: Union{GRAD_REQ, Dict{Symbol, GRAD_REQ}}=GRAD_WRITE, + kwargs...) arg_shapes, out_shapes, aux_shapes = infer_shape(self; kwargs...) 
@assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") arg_arrays = NDArray[zeros(shape, ctx) for shape in arg_shapes] arg_names = list_arguments(self) - if grad_req == GRAD_NOP - grad_arrays = Dict{Base.Symbol,NDArray}() - else + + grad_arrays = Dict{Symbol,NDArray}() + + if grad_req != GRAD_NOP + shapes = zip(arg_names, arg_shapes) + + # if not in provided data, should be parameters provided_data_names = [x[1] for x in kwargs] - grad_arrays = Dict{Base.Symbol,NDArray}() - for (name, shape) in zip(arg_names, arg_shapes) - # if not in provided data, should be parameters - if !in(name, provided_data_names) - grad_arrays[name] = zeros(shape, ctx) - end + shapes = filter(x -> !in(x[1], provided_data_names), shapes) + + # Remove all gradients for nop params + # if isa(grad_req, Dict{Symbol, GRAD_REQ}) + # shapes = filter(x -> grad_req[x[1]] != GRAD_NOP,shapes) + # end + + for (name, shape) in shapes + grad_arrays[name] = zeros(shape, ctx) end end diff --git a/src/model.jl b/src/model.jl index 7dede8d05206..f5dffc457bc6 100644 --- a/src/model.jl +++ b/src/model.jl @@ -369,11 +369,31 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra kvstore, update_on_kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params) end + # get grad attribute to allow for freezing + freeze_names = Symbol[] + for (attr, value) in list_attr(self.arch) + sattr = string(attr) + if endswith(sattr, "grad") && value == "freeze" + push!(freeze_names, symbol(sattr[1:end-5])) + end + end + freeze_idx = filter(i -> in(arg_names[i], freeze_names), 1:length(arg_names)) + + # Setup grad_req as a dictionary + grad_req = Dict{Symbol, GRAD_REQ}() + for param in param_names + if in(param, freeze_names) + grad_req[param] = GRAD_NOP + else + grad_req[param] = GRAD_WRITE + end + end + train_execs = Array(Executor, num_dev) for i = 1:num_dev data_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)] 
label_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)] - train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=GRAD_WRITE, data_shapes..., label_shapes...) + train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=grad_req, data_shapes..., label_shapes...) dbg_str = mx.debug_str(train_execs[i]) info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[i])) @@ -430,16 +450,6 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # invoke callbacks on epoch 0 _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) - # get grad attribute to allow for freezing - freeze_names = Symbol[] - for (attr, value) in list_attr(self.arch) - sattr = string(attr) - if endswith(sattr, "grad") && value == "freeze" - push!(freeze_names, symbol(sattr[1:end-5])) - end - end - freeze_idx = filter(i -> in(arg_names[i], freeze_names), 1:length(arg_names)) - info("Start training...") for i_epoch = 1:opts.n_epoch time_start = time() From 68180f75fd411dd62301b848e8299aeaa9b8c68e Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 26 Apr 2016 18:54:29 +0900 Subject: [PATCH 318/630] ids derived from arg_names and param_names are not relatable. --- src/model.jl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/model.jl b/src/model.jl index f5dffc457bc6..c025dc17091c 100644 --- a/src/model.jl +++ b/src/model.jl @@ -377,7 +377,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra push!(freeze_names, symbol(sattr[1:end-5])) end end - freeze_idx = filter(i -> in(arg_names[i], freeze_names), 1:length(arg_names)) + # Needs to correspond to the correct id in the update loop layer idx=1:length(param_names). 
+ freeze_idx = filter(i -> in(param_names[i], freeze_names), 1:length(param_names)) # Setup grad_req as a dictionary grad_req = Dict{Symbol, GRAD_REQ}() From deb021dab22f1ed1790ce8a74642cbc23d52dc85 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 26 Apr 2016 14:13:40 -0400 Subject: [PATCH 319/630] (temporarily) disable Julia nightly test --- .travis.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.travis.yml b/.travis.yml index 9f08e176eed2..df63021f35aa 100644 --- a/.travis.yml +++ b/.travis.yml @@ -6,7 +6,7 @@ os: - osx julia: - 0.4 - - nightly + #- nightly # dependent apt packages addons: From c948dc39c77f3cf1846aaaea6c6d6234aa9547cf Mon Sep 17 00:00:00 2001 From: Michael Wallace Louwrens Date: Mon, 9 May 2016 01:18:10 +0200 Subject: [PATCH 320/630] Added 7z alternative for mnist Added try catch around the unzip and added 7z extraction alternative. --- src/util.jl | 20 ++++++++++++++++++-- 1 file changed, 18 insertions(+), 2 deletions(-) diff --git a/src/util.jl b/src/util.jl index 1e9b0853dc5b..d6ce97a3e5ca 100644 --- a/src/util.jl +++ b/src/util.jl @@ -19,7 +19,15 @@ function get_mnist_ubyte() if !all(isfile, values(filenames)) cd(mnist_dir) do mnist_dir = download("http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip", "mnist.zip") - run(`unzip -u $mnist_dir`) + try + run(`unzip -u $mnist_dir`) + catch + try + run(pipe(`7z x $mnist_dir`,stdout=DevNull)) + catch + error("Extraction Failed:No extraction program found in path") + end + end end end return filenames @@ -34,7 +42,15 @@ function get_cifar10() if !all(isfile, values(filenames)) cd(cifar10_dir) do run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/cifar10.zip`) - run(`unzip -u cifar10.zip`) + try + run(`unzip -u cifar10.zip`) + catch + try + run(pipe(`7z x cifar10.zip`,stdout=DevNull)) + catch + error("Extraction Failed:No extraction program found in path") + end + end end end From 013b88b8c7580f057fcdf3aeac3777a57ca8a04d Mon Sep 17 00:00:00 2001 From: Michael Wallace 
Louwrens Date: Mon, 9 May 2016 01:38:14 +0200 Subject: [PATCH 321/630] Change where set_attr is called in _define_atomic_symbol_creator MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Where `set_attr` was originally called in `_define_atomic_symbol_creator` would cause `list_attr` to return a dictionary with extra bias and weight fields as seen here: ` Dict{Symbol,ByteString}(:convolution0_a=>"a",:convolution0_π=>"π",:convolution0_bias_a=>"a",:convolution0_weight_π=>"π",:convolution0_bias_π=>"π",:convolution0_weight_a=>"a",:data2_test=>"hallo!") ` The test still fails however as `list_attr` still contains the name of the source before the key. --- src/symbolic-node.jl | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 1ddc5e682319..0bc3b593da8a 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -591,17 +591,17 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) hint = lowercase($func_name_s) name = get!(DEFAULT_NAME_MANAGER, name, hint) - # set attrs - for (k, v) in attrs - set_attr(node, k, v) - end - if length(args) != 0 _compose!(node, name, args...) else _compose!(node; name=name, symbol_kws...) 
end + # set attrs + for (k, v) in attrs + set_attr(node, k, v) + end + return node end From 463f202e6fa4ad6eaaa2f82e93ddd2d4ec782981 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Mon, 9 May 2016 11:52:24 +0900 Subject: [PATCH 322/630] add support for ListAttrShallow --- src/model.jl | 2 +- src/symbolic-node.jl | 24 +++++++++++++++++++++++- 2 files changed, 24 insertions(+), 2 deletions(-) diff --git a/src/model.jl b/src/model.jl index c025dc17091c..3984eb9d1389 100644 --- a/src/model.jl +++ b/src/model.jl @@ -371,7 +371,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # get grad attribute to allow for freezing freeze_names = Symbol[] - for (attr, value) in list_attr(self.arch) + for (attr, value) in list_all_attr(self.arch) sattr = string(attr) if endswith(sattr, "grad") && value == "freeze" push!(freeze_names, symbol(sattr[1:end-5])) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 0bc3b593da8a..dcaae9bd5dc6 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -144,10 +144,32 @@ end #=doc .. function: list_attr(self :: SymbolicNode) - Get all attributes from symbol. + Get all attributes from a symbol. :return: Dictionary of attributes. =# function list_attr(self :: SymbolicNode) + ref_sz = Ref{MX_uint}(0) + ref_strings = Ref{char_pp}(0) + @mxcall(:MXSymbolListAttrShallow, (MX_handle, Ref{MX_uint}, Ref{char_pp}), + self, ref_sz, ref_strings) + narg = 2*ref_sz[] + strings = pointer_to_array(ref_strings[], narg) + out = Dict{Symbol, ByteString}() + for i in 1:2:narg + key = symbol(bytestring(strings[i])) + value = bytestring(strings[i+1]) + out[key] = value + end + return out +end + +#=doc +.. function: list_all_attr(self :: SymbolicNode) + + Get all attributes from the symbol graph. + :return: Dictionary of attributes. 
+=# +function list_all_attr(self :: SymbolicNode) ref_sz = Ref{MX_uint}(0) ref_strings = Ref{char_pp}(0) @mxcall(:MXSymbolListAttr, (MX_handle, Ref{MX_uint}, Ref{char_pp}), From baa9c2a98749b465edafeaed51e41e2bdf221d32 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Sun, 8 May 2016 23:22:42 -0400 Subject: [PATCH 323/630] revert #91 --- src/symbolic-node.jl | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index dcaae9bd5dc6..4ce5b59a18ea 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -613,17 +613,17 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) hint = lowercase($func_name_s) name = get!(DEFAULT_NAME_MANAGER, name, hint) + # set attrs + for (k, v) in attrs + set_attr(node, k, v) + end + if length(args) != 0 _compose!(node, name, args...) else _compose!(node; name=name, symbol_kws...) end - # set attrs - for (k, v) in attrs - set_attr(node, k, v) - end - return node end From 64a63f7797b946e334e38fbb08bd7ddd79634c12 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 11 May 2016 14:15:54 +0900 Subject: [PATCH 324/630] Deduplicate and generalise metric update! MXNet allows for the design of networks that use the same label for multiple outputs. Instead of failing for these kinds of networks, warn the user and try to proceed. --- src/metric.jl | 40 +++++++++++++--------------------------- 1 file changed, 13 insertions(+), 27 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 7916d45b639c..7e76b969d0a0 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -36,6 +36,19 @@ set. =# abstract AbstractEvalMetric +# Generic update! version +function update!{T <: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + if length(labels) != length(preds) + Base.warn_once( + "The number of labels ($(length(labels))) does not correspond to the\ + number of outputs ($(length(preds))). 
The calculated metric might not be accuracte.") + end + for (label, pred) in zip(labels, preds) + _update_single_output(metric, label, pred) + end +end + + #=doc .. class:: Accuracy @@ -85,13 +98,6 @@ function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDA end end -function update!(metric :: Accuracy, labels :: Vector{NDArray}, preds :: Vector{NDArray}) - @assert length(labels) == length(preds) - for i = 1:length(labels) - _update_single_output(metric, labels[i], preds[i]) - end -end - import Base: get function get(metric :: Accuracy) return [(:accuracy, metric.acc_sum / metric.n_sample)] @@ -129,13 +135,6 @@ function _update_single_output(metric :: MSE, label :: NDArray, pred :: NDArray) end end -function update!(metric :: MSE, labels :: Vector{NDArray}, preds :: Vector{NDArray}) - @assert length(labels) == length(preds) - for i = 1:length(labels) - _update_single_output(metric, labels[i], preds[i]) - end -end - function get(metric :: MSE) return [(:MSE, metric.mse_sum / metric.n_sample)] end @@ -193,13 +192,6 @@ function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) end end -function update!(metric :: ACE, labels :: Vector{NDArray}, preds :: Vector{NDArray}) - @assert length(labels) == length(preds) - for i = 1:length(labels) - _update_single_output(metric, labels[i], preds[i]) - end -end - #=doc .. 
class:: MultiACE @@ -251,9 +243,3 @@ function _update_single_output(metric :: MultiACE, label :: NDArray, pred :: NDA end end -function update!(metric :: MultiACE, labels :: Vector{NDArray}, preds :: Vector{NDArray}) - @assert length(labels) == length(preds) - for i = 1:length(labels) - _update_single_output(metric, labels[i], preds[i]) - end -end From 3a013b889a923b6aaaa27caead707ab64f830b36 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 25 May 2016 14:03:17 +0900 Subject: [PATCH 325/630] fixup expr check for v0.5 --- src/base.jl | 13 +++++++++++-- 1 file changed, 11 insertions(+), 2 deletions(-) diff --git a/src/base.jl b/src/base.jl index de48241ac7e9..2dc570147b61 100644 --- a/src/base.jl +++ b/src/base.jl @@ -189,10 +189,19 @@ function _defstruct_impl(is_immutable, name, fields) if isa(name, Symbol) name = esc(name) super_name = :Any + elseif VERSION >= v"0.5-" + @assert(isa(name, Expr) && name.head == :(<:) && length(name.args) == 2 && + isa(name.args[1], Symbol) && isa(name.args[2], Symbol), + "name must be of form 'Name <: SuperType'") + + super_name = esc(name.args[2]) + name = esc(name.args[1]) else - @assert(isa(name, Expr) && name.head == :comparison && length(name.args) == 3 && name.args[2] == :(<:), + @assert(isa(name, Expr) && name.head == :comparison && + length(name.args) == 3 && name.args[2] == :(<:) && + isa(name.args[1], Symbol) && isa(name.args[3], Symbol), "name must be of form 'Name <: SuperType'") - @assert(isa(name.args[1], Symbol) && isa(name.args[3], Symbol)) + super_name = esc(name.args[3]) name = esc(name.args[1]) end From e6d07f0268d1ae84fd874ca40306ccf99ecd0c57 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 25 May 2016 14:25:34 +0900 Subject: [PATCH 326/630] fix deprecations on v0.5 --- REQUIRE | 3 ++- src/MXNet.jl | 3 +++ src/base.jl | 2 +- src/executor.jl | 2 +- src/io.jl | 6 +++--- src/kvstore.jl | 2 +- src/metric.jl | 2 +- src/model.jl | 8 ++++---- src/name.jl | 10 +++++----- src/ndarray.jl | 26 
+++++++++++++------------- src/nn-factory.jl | 4 ++-- src/symbolic-node.jl | 38 +++++++++++++++++++------------------- src/util.jl | 6 +++--- src/visualize.jl | 4 ++-- 14 files changed, 60 insertions(+), 56 deletions(-) diff --git a/REQUIRE b/REQUIRE index fea260919fbc..d97c567e15db 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,4 +1,5 @@ -julia 0.4 +julia 0.4+ +Compat Formatting BinDeps JSON diff --git a/src/MXNet.jl b/src/MXNet.jl index 16ad415efe52..31618b795ed5 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -6,6 +6,9 @@ module MXNet # functions with the same names as built-in utilities like "zeros", etc. export mx module mx + +using Compat + using Formatting # Functions from base that we can safely extend and that are defined by libmxnet. diff --git a/src/base.jl b/src/base.jl index 2dc570147b61..bd67a7c2ac52 100644 --- a/src/base.jl +++ b/src/base.jl @@ -42,7 +42,7 @@ function mx_get_last_error() if msg == C_NULL throw(MXError("Failed to get last error message")) end - return bytestring(msg) + return @compat String(msg) end "Utility macro to call MXNet API functions" diff --git a/src/executor.jl b/src/executor.jl index e4b943c0c764..86f3f65921f4 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -221,5 +221,5 @@ Can be used to get an estimated about the memory cost. 
function debug_str(self :: Executor) s_ref = Ref{Cstring}() @mxcall(:MXExecutorPrint, (MX_handle, Ptr{Cstring}), self.handle, s_ref) - bytestring(s_ref[]) + @compat String(s_ref[]) end diff --git a/src/io.jl b/src/io.jl index 99fcd8516c6b..46fbcfe86a2d 100644 --- a/src/io.jl +++ b/src/io.jl @@ -584,7 +584,7 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) - iter_name = symbol(bytestring(ref_name[])) + iter_name = Symbol(String(ref_name[])) if gen_docs if endswith(string(iter_name), "Iter") @@ -592,7 +592,7 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) else f_desc = "" end - f_desc *= bytestring(ref_desc[]) * "\n\n" + f_desc *= String(ref_desc[]) * "\n\n" f_desc *= ":param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data.\n" f_desc *= ":param Base.Symbol label_name: keyword argument, default ``:softmax_label``. " * "The name of the label. 
Could be ``nothing`` if no label is presented in this dataset.\n\n" @@ -617,7 +617,7 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) # add an alias XXXProvider => XXXIter if endswith(string(iter_name), "Iter") - alias_name = symbol(string(iter_name)[1:end-4] * "Provider") + alias_name = Symbol(string(iter_name)[1:end-4] * "Provider") eval(:($alias_name = $iter_name)) end end diff --git a/src/kvstore.jl b/src/kvstore.jl index d52433f567b2..bc2e65c6fdd3 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -87,7 +87,7 @@ end function get_type(self :: KVStore) type_ref = Ref{char_p}(0) @mxcall(:MXKVStoreGetType, (MX_handle, Ref{char_p}), self, type_ref) - return symbol(bytestring(type_ref[])) + return Symbol(@compat String(type_ref[])) end function get_num_workers(self :: KVStore) diff --git a/src/metric.jl b/src/metric.jl index 7e76b969d0a0..1f601980ad13 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -208,7 +208,7 @@ type MultiACE <: AbstractEvalMetric end function get(metric :: MultiACE) - aces = [(symbol("ACE_$(i-0)"), - metric.aces[i] / metric.counts[i]) for i in 1:length(metric.aces)] + aces = [(Symbol("ACE_$(i-0)"), - metric.aces[i] / metric.counts[i]) for i in 1:length(metric.aces)] push!(aces, (:ACE, - Base.sum(metric.aces) / Base.sum(metric.counts))) return aces end diff --git a/src/model.jl b/src/model.jl index 3984eb9d1389..d9b81d02f3d9 100644 --- a/src/model.jl +++ b/src/model.jl @@ -374,7 +374,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra for (attr, value) in list_all_attr(self.arch) sattr = string(attr) if endswith(sattr, "grad") && value == "freeze" - push!(freeze_names, symbol(sattr[1:end-5])) + push!(freeze_names, Symbol(sattr[1:end-5])) end end # Needs to correspond to the correct id in the update loop layer idx=1:length(param_names). 
@@ -582,8 +582,8 @@ end function save_checkpoint(sym :: SymbolicNode, arg_params :: Dict{Base.Symbol, NDArray}, aux_params :: Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) save("$prefix-symbol.json", sym) - save_dict = merge(Dict([symbol("arg:$k") => v for (k,v) in arg_params]), - Dict([symbol("aux:$k") => v for (k,v) in aux_params])) + save_dict = merge(Dict([Symbol("arg:$k") => v for (k,v) in arg_params]), + Dict([Symbol("aux:$k") => v for (k,v) in aux_params])) save_filename = format("{1}-{2:04d}.params", prefix, epoch) save(save_filename, save_dict) info("Saved checkpoint to '$save_filename'") @@ -596,7 +596,7 @@ function load_checkpoint(prefix :: AbstractString, epoch :: Int) aux_params = Dict{Base.Symbol, NDArray}() for (k,v) in saved_dict tp, name = split(string(k), ':') - name = symbol(name) + name = Symbol(name) if tp == "arg" arg_params[name] = v else diff --git a/src/name.jl b/src/name.jl index 5ebf10917ce6..2ec531834232 100644 --- a/src/name.jl +++ b/src/name.jl @@ -9,14 +9,14 @@ import Base: get! # is automatically generated based on the hint string. 
function _default_get_name!(counter :: NameCounter, name :: NameType, hint :: NameType) if isa(name, Base.Symbol) || !isempty(name) - return symbol(name) + return Symbol(name) end - hint = symbol(hint) + hint = Symbol(hint) if !haskey(counter, hint) counter[hint] = 0 end - name = symbol("$hint$(counter[hint])") + name = Symbol("$hint$(counter[hint])") counter[hint] += 1 return name end @@ -34,11 +34,11 @@ type PrefixNameManager <: AbstractNameManager prefix :: Base.Symbol counter :: NameCounter end -PrefixNameManager(prefix :: NameType) = PrefixNameManager(symbol(prefix), NameCounter()) +PrefixNameManager(prefix :: NameType) = PrefixNameManager(Symbol(prefix), NameCounter()) function get!(manager :: PrefixNameManager, name :: NameType, hint :: NameType) name = _default_get_name!(manager.counter, name, hint) - return symbol("$(manager.prefix)$name") + return Symbol("$(manager.prefix)$name") end DEFAULT_NAME_MANAGER = BasicNameManager() diff --git a/src/ndarray.jl b/src/ndarray.jl index 9c4836e60771..1ed620d800e5 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -788,7 +788,7 @@ function load(filename::AbstractString, ::Type{NDArray}) return [NDArray(MX_NDArrayHandle(hdr)) for hdr in pointer_to_array(out_hdrs[], out_size)] else @assert out_size == out_name_size - return Dict([(symbol(bytestring(k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in + return Dict([(Symbol(@compat String(k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in zip(pointer_to_array(out_names[], out_size), pointer_to_array(out_hdrs[], out_size))]) end end @@ -903,11 +903,11 @@ function _import_ndarray_functions(;gen_docs=false) func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs, ref_ret_type) - func_name = symbol(bytestring(ref_name[])) + func_name = Symbol(@compat String(ref_name[])) if gen_docs # generate document only - f_desc = bytestring(ref_desc[]) * "\n\n" + f_desc = @compat String(ref_desc[]) * "\n\n" f_desc *= _format_docstring(Int(ref_narg[]), 
ref_arg_names, ref_arg_types, ref_arg_descs) docs[func_name] = f_desc else @@ -932,18 +932,18 @@ function _import_ndarray_functions(;gen_docs=false) # general ndarray function if arg_before_scalar - args = vcat([Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) + args = vcat([Expr(:(::), Symbol("in$i"), NDArray) for i=1:n_used_vars], + [Expr(:(::), Symbol("sca$i"), Real) for i=1:n_scalars], + [Expr(:(::), Symbol("out$i"), NDArray) for i=1:n_mutate_vars]) else - args = vcat([Expr(:(::), symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), symbol("out$i"), NDArray) for i=1:n_mutate_vars]) + args = vcat([Expr(:(::), Symbol("sca$i"), Real) for i=1:n_scalars], + [Expr(:(::), Symbol("in$i"), NDArray) for i=1:n_used_vars], + [Expr(:(::), Symbol("out$i"), NDArray) for i=1:n_mutate_vars]) end - _use_vars = Expr(:ref, :MX_handle, [symbol("in$i") for i=1:n_used_vars]...) - _scalars = Expr(:ref, :MX_float, [symbol("sca$i") for i=1:n_scalars]...) - _mut_vars = Expr(:ref, :MX_handle, [symbol("out$i") for i=1:n_mutate_vars]...) + _use_vars = Expr(:ref, :MX_handle, [Symbol("in$i") for i=1:n_used_vars]...) + _scalars = Expr(:ref, :MX_float, [Symbol("sca$i") for i=1:n_scalars]...) + _mut_vars = Expr(:ref, :MX_handle, [Symbol("out$i") for i=1:n_mutate_vars]...) 
# XXX: hacky way of solving the problem that the arguments of `dot` should be swapped # See https://github.com/dmlc/MXNet.jl/issues/55 @@ -955,7 +955,7 @@ function _import_ndarray_functions(;gen_docs=false) if n_mutate_vars == 1 stmt_ret = :(return out1) else - stmt_ret = Expr(:return, Expr(:tuple, [symbol("out$i") for i=1:n_mutate_vars]...)) + stmt_ret = Expr(:return, Expr(:tuple, [Symbol("out$i") for i=1:n_mutate_vars]...)) end func_body = Expr(:block, stmt_call, stmt_ret) diff --git a/src/nn-factory.jl b/src/nn-factory.jl index 984f50a5f782..3725587f37a1 100644 --- a/src/nn-factory.jl +++ b/src/nn-factory.jl @@ -39,10 +39,10 @@ function MLP(input, spec; hidden_activation::Base.Symbol=:relu, prefix=gensym()) n_unit = s act_type = hidden_activation end - input = FullyConnected(input, name=symbol(prefix, "fc$i"), num_hidden=n_unit) + input = FullyConnected(input, name=Symbol(prefix, "fc$i"), num_hidden=n_unit) if i < n_layer || isa(s, Tuple) # will not add activation unless the user explicitly specified - input = Activation(input, name=symbol(prefix, "$act_type$i"), act_type=act_type) + input = Activation(input, name=Symbol(prefix, "$act_type$i"), act_type=act_type) end end diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 4ce5b59a18ea..2b9d466c8e95 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -62,7 +62,7 @@ macro _list_symbol_info(self, func_name) $self, ref_sz, ref_names) narg = ref_sz[] names = pointer_to_array(ref_names[], narg) - names = [symbol(bytestring(x)) for x in names] + names = [Symbol(@compat String(x)) for x in names] return names end end @@ -129,13 +129,13 @@ end :return: The value belonging to key as a :class:`Nullable`. 
=# function get_attr(self :: SymbolicNode, key :: Symbol) - key_s = bytestring(string(key)) + key_s = @compat String(string(key)) ref_out = Ref{Cstring}() ref_success = Ref{Cint}(-1) @mxcall(:MXSymbolGetAttr, (MX_handle, Cstring, Ref{Cstring}, Ref{Cint}), self, key_s, ref_out, ref_success) if ref_success[] == 1 - return Nullable{ByteString}(bytestring(ref_out[])) + return Nullable{ByteString}(@compat String(ref_out[])) else return Nullable{ByteString}() end @@ -156,8 +156,8 @@ function list_attr(self :: SymbolicNode) strings = pointer_to_array(ref_strings[], narg) out = Dict{Symbol, ByteString}() for i in 1:2:narg - key = symbol(bytestring(strings[i])) - value = bytestring(strings[i+1]) + key = Symbol(@compat String(strings[i])) + value = @compat String(strings[i+1]) out[key] = value end return out @@ -178,8 +178,8 @@ function list_all_attr(self :: SymbolicNode) strings = pointer_to_array(ref_strings[], narg) out = Dict{Symbol, ByteString}() for i in 1:2:narg - key = symbol(bytestring(strings[i])) - value = bytestring(strings[i+1]) + key = Symbol(@compat String(strings[i])) + value = @compat String(strings[i+1]) out[key] = value end return out @@ -198,8 +198,8 @@ end cause unexpected behavior and inconsistency. =# function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) - key_s = bytestring(string(key)) - value_s = bytestring(value) + key_s = @compat String(string(key)) + value_s = @compat String(value) @mxcall(:MXSymbolSetAttr, (MX_handle, Cstring, Cstring), self, key_s, value_s) end @@ -325,7 +325,7 @@ end indicating the index, as in the list of :func:`list_outputs`. 
=# function Base.getindex(self :: SymbolicNode, idx :: Union{Base.Symbol, AbstractString}) - idx = symbol(idx) + idx = Symbol(idx) i_idx = find(idx .== list_outputs(self)) @assert(length(i_idx) > 0, "Cannot find output with name '$idx'") @assert(length(i_idx) < 2, "Found duplicated output with name '$idx'") @@ -474,7 +474,7 @@ end function to_json(self :: SymbolicNode) ref_json = Ref{char_p}(0) @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json) - return bytestring(ref_json[]) + return @compat String(ref_json[]) end #=doc @@ -533,20 +533,20 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, ref_kv_nargs, ref_ret_type) - func_name_s= bytestring(ref_name[]) - func_name = symbol(func_name_s) - kv_nargs_s = bytestring(ref_kv_nargs[]) - kv_nargs = symbol(kv_nargs_s) + func_name_s= @compat String(ref_name[]) + func_name = Symbol(func_name_s) + kv_nargs_s = @compat String(ref_kv_nargs[]) + kv_nargs = Symbol(kv_nargs_s) if gen_docs - f_desc = bytestring(ref_desc[]) * "\n\n" + f_desc = @compat String(ref_desc[]) * "\n\n" if !isempty(kv_nargs_s) f_desc *= "This function support variable length positional :class:`SymbolicNode` inputs.\n\n" end f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) f_desc *= ":param Symbol name: The name of the :class:`SymbolicNode`. (e.g. 
`:my_symbol`), optional.\n" f_desc *= ":param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`.\n\n" - f_desc *= ":return: $(_format_typestring(bytestring(ref_ret_type[]))).\n\n" + f_desc *= ":return: $(_format_typestring(@compat String(ref_ret_type[]))).\n\n" return (func_name, f_desc) end @@ -565,7 +565,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) symbol_kws = Dict{Symbol, SymbolicNode}() attrs = Dict{Symbol, AbstractString}() - $(if kv_nargs != symbol("") + $(if kv_nargs != Symbol("") quote if !in($kv_nargs_s, param_keys) push!(param_keys, $kv_nargs_s) @@ -593,7 +593,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) if length(args) != 0 && length(symbol_kws) != 0 @assert(false, $func_name_s * " only accepts Symbols either as positional or keyword arguments, not both.") end - $(if kv_nargs != symbol("") + $(if kv_nargs != Symbol("") quote if length(symbol_kws) > 0 @assert(false, $func_name_s * " takes variable number of SymbolicNode arguments, " * diff --git a/src/util.jl b/src/util.jl index d6ce97a3e5ca..73c3316fa9f7 100644 --- a/src/util.jl +++ b/src/util.jl @@ -75,14 +75,14 @@ function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{ch docstrings = AbstractString[] for i = 1:narg - arg_name = bytestring(arg_names[i]) + arg_name = @compat String(arg_names[i]) if arg_name ∈ param_keys && remove_dup continue end push!(param_keys, arg_name) - arg_type = _format_typestring(bytestring(arg_types[i])) - arg_desc = bytestring(arg_descs[i]) + arg_type = _format_typestring(@compat String(arg_types[i])) + arg_desc = @compat String(arg_descs[i]) push!(docstrings, ":param $arg_name: $arg_desc\n:type $arg_name: $arg_type\n\n") end return join(docstrings, "\n") diff --git a/src/visualize.jl b/src/visualize.jl index b1fa90ff3851..3d46b9c38cb3 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -117,10 +117,10 @@ function to_graphviz(network :: 
SymbolicNode; title="Network Visualization", inp attr = Dict(:dir => :back, :arrowtail => :open, :color => "#737373") if draw_shape if input_node["op"] != "null" - key = symbol(input_name, "_output") + key = Symbol(input_name, "_output") shape = shape_dict[key][1:end-1] else - key = symbol(input_name) + key = Symbol(input_name) shape = shape_dict[key][1:end-1] end label = "(" * join([string(x) for x in shape], ",") * ")" From 55f2a42dfaaf67e27fd08ffda5f48abee445dbfc Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 25 May 2016 14:28:08 +0900 Subject: [PATCH 327/630] fix overwriting of inner function --- src/initializer.jl | 12 +++++------- 1 file changed, 5 insertions(+), 7 deletions(-) diff --git a/src/initializer.jl b/src/initializer.jl index 00e71b19c3cd..8be33bdf66d2 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -138,12 +138,6 @@ function _init_weight(self :: XavierInitializer, name :: Base.Symbol, array :: N fan_in = prod(dims[2:end]) fan_out = dims[1] - if self.distribution == xv_uniform - func(σ, data) = rand!(-σ, σ, data) - elseif self.distribution == xv_normal - func(σ, data) = randn!(0.0, σ, data) - end - if self.regularization == xv_avg factor = (fan_in + fan_out) / 2 elseif self.regularization == xv_in @@ -154,5 +148,9 @@ function _init_weight(self :: XavierInitializer, name :: Base.Symbol, array :: N σ = √(self.magnitude / factor) - func(σ, array) + if self.distribution == xv_uniform + rand!(-σ, σ, array) + elseif self.distribution == xv_normal + randn!(0.0, σ, array) + end end From 48b723a96d3a1f90149c01e62be38fccff315bdd Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 25 May 2016 14:34:28 +0900 Subject: [PATCH 328/630] fix ByteString deprecation and deprecations in tests --- src/MXNet.jl | 1 + src/symbolic-node.jl | 8 ++++---- test/unittest/name.jl | 8 ++++---- test/unittest/ndarray.jl | 2 +- 4 files changed, 10 insertions(+), 9 deletions(-) diff --git a/src/MXNet.jl b/src/MXNet.jl index 31618b795ed5..cdbacbe64be0 
100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -8,6 +8,7 @@ export mx module mx using Compat +import Compat.String using Formatting diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 2b9d466c8e95..da251e4cc74f 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -135,9 +135,9 @@ function get_attr(self :: SymbolicNode, key :: Symbol) @mxcall(:MXSymbolGetAttr, (MX_handle, Cstring, Ref{Cstring}, Ref{Cint}), self, key_s, ref_out, ref_success) if ref_success[] == 1 - return Nullable{ByteString}(@compat String(ref_out[])) + return Nullable{String}(@compat String(ref_out[])) else - return Nullable{ByteString}() + return Nullable{String}() end end @@ -154,7 +154,7 @@ function list_attr(self :: SymbolicNode) self, ref_sz, ref_strings) narg = 2*ref_sz[] strings = pointer_to_array(ref_strings[], narg) - out = Dict{Symbol, ByteString}() + out = Dict{Symbol, String}() for i in 1:2:narg key = Symbol(@compat String(strings[i])) value = @compat String(strings[i+1]) @@ -176,7 +176,7 @@ function list_all_attr(self :: SymbolicNode) self, ref_sz, ref_strings) narg = 2*ref_sz[] strings = pointer_to_array(ref_strings[], narg) - out = Dict{Symbol, ByteString}() + out = Dict{Symbol, String}() for i in 1:2:narg key = Symbol(@compat String(strings[i])) value = @compat String(strings[i+1]) diff --git a/test/unittest/name.jl b/test/unittest/name.jl index a7dd6f7bfc35..aca039670286 100644 --- a/test/unittest/name.jl +++ b/test/unittest/name.jl @@ -10,8 +10,8 @@ function test_default() @test get!(mx.DEFAULT_NAME_MANAGER, string(name), "") == name hint = name - @test get!(mx.DEFAULT_NAME_MANAGER, "", hint) == symbol("$(hint)0") - @test get!(mx.DEFAULT_NAME_MANAGER, "", string(hint)) == symbol("$(hint)1") + @test get!(mx.DEFAULT_NAME_MANAGER, "", hint) == Symbol("$(hint)0") + @test get!(mx.DEFAULT_NAME_MANAGER, "", string(hint)) == Symbol("$(hint)1") end function test_prefix() @@ -21,8 +21,8 @@ function test_prefix() prefix = :_____foobar_____ prefix_manager = 
mx.PrefixNameManager(prefix) - @test get!(prefix_manager, name, "") == symbol("$prefix$name") - @test get!(prefix_manager, "", name) == symbol("$prefix$(name)0") + @test get!(prefix_manager, name, "") == Symbol("$prefix$name") + @test get!(prefix_manager, "", name) == Symbol("$prefix$(name)0") end test_default() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 67bff2959c8a..444aa90616fe 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -202,7 +202,7 @@ function test_saveload() end # save and load dictionary of ndarrays - names = [symbol("array$i") for i = 1:n_arrays] + names = [Symbol("array$i") for i = 1:n_arrays] dict = Dict([n => v for (n,v) in zip(names, nd_arrays)]) mx.save(fname, dict) data = mx.load(fname, mx.NDArray) From afd9baa1b614768502821a0d8f43803d400eb417 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 May 2016 10:10:28 +0900 Subject: [PATCH 329/630] enable travis for 0.5 --- .travis.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.travis.yml b/.travis.yml index df63021f35aa..9f08e176eed2 100644 --- a/.travis.yml +++ b/.travis.yml @@ -6,7 +6,7 @@ os: - osx julia: - 0.4 - #- nightly + - nightly # dependent apt packages addons: From 9c9e762947fff926cd040743c367b91403429f35 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 24 May 2016 10:45:22 +0900 Subject: [PATCH 330/630] Initial support for DType and TypeFlags This also adds MXNDArrayCreateEx and rewrites eltype to get the DType from mxnet --- src/ndarray.jl | 67 ++++++++++++++++++++++++++++++++++++++++++++++---- 1 file changed, 62 insertions(+), 5 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 1ed620d800e5..3987c7f5bbbd 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -3,6 +3,42 @@ NDArray API =========== =# +# All the types supported by mshadow. 
+typealias DType Union{Float32, Float64, Float16, UInt8, Int32} +@enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 + +function toTypeFlag{T <: DType}(:: Type{T}) + if T == Float32 + return kFloat32 + elseif T == Float64 + return kFloat64 + elseif T == Float16 + return kFloat16 + elseif T == UInt8 + return kUint8 + elseif T == Int32 + return kInt32 + else + throw(ArgumentError("Can't convert $T to Dtype.")) + end +end + +function fromTypeFlag(T :: TypeFlag) + if T == kFloat32 + return Float32 + elseif T == kFloat64 + return Float64 + elseif T == kFloat16 + return Float16 + elseif T == kUint8 + return UInt8 + elseif T == kInt32 + return Int32 + else + throw(ArgumentError("Can't convert Dtype $T.")) + end +end + # create a NDArray handle of specific shape function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) h_ref = Ref{MX_handle}(0) @@ -13,6 +49,17 @@ function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc return handle end +# create a NDArray handle of specific shape type +function _ndarray_alloc{T <: DType,N}(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) + h_ref = Ref{MX_handle}(0) + shape = flipdim(MX_uint[shape...],1) + dtype = toTypeFlag(T) + @mxcall(:MXNDArrayCreateEx, (Ptr{MX_uint}, MX_uint, Cint, Cint, Cint, Cint, Ref{MX_handle}), + shape, length(shape), ctx.device_type, ctx.device_id, delay_alloc, dtype, h_ref) + handle = MX_NDArrayHandle(h_ref[]) + return handle +end + # create a handle to an empty NDArray, this handle can be used to hold # results returned by libmx API calls function _ndarray_alloc() @@ -51,7 +98,7 @@ type NDArray end function Base.show(io :: IO, arr :: NDArray) - print(io, "mx.NDArray$(size(arr))") + print(io, "mx.NDArray{$(eltype(arr))}$(size(arr))") end function NDArray{T<:Real}(data :: Array{T}) @@ -185,10 +232,20 @@ end #=doc .. function:: eltype(arr :: NDArray) - Get the element type of an :class:`NDArray`. 
Currently the element type is always ``mx.MX_float``. + Get the element type of an :class:`NDArray`. =# -function eltype(arr :: NDArray) - MX_float +function eltype{T <: Union{NDArray, MX_NDArrayHandle}}(arr :: T) + dtype_ref = Ref{Cint}(0) + @mxcall(:MXNDArrayGetDType, (MX_handle, Ptr{Cint}), arr, dtype_ref) + + if dtype_ref[] == -1 # arr->is_none() + warn("Eltype of $arr is not defined") + Base.show_backtrace(STDOUT,backtrace()) + println() + return Float32 + else + return fromTypeFlag(TypeFlag(dtype_ref[])) + end end @@ -499,7 +556,7 @@ function .-(arg0 :: Real, arg1 :: NDArray) end function -(arg0 :: NDArray) - _mul_scalar(arg0, -1.0) + _mul_scalar(arg0, -one(eltype(arg0))) end #=doc From a282586232a65ca05311f99a40c46eb4e6ee1985 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 May 2016 12:06:14 +0900 Subject: [PATCH 331/630] add typed empty, ones, zeros --- src/ndarray.jl | 62 +++++++++++++++++++++++++++++++++++++++- test/unittest/ndarray.jl | 14 +++++++++ 2 files changed, 75 insertions(+), 1 deletion(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 3987c7f5bbbd..f903a797fb66 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -6,6 +6,7 @@ NDArray API # All the types supported by mshadow. typealias DType Union{Float32, Float64, Float16, UInt8, Int32} @enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 +typealias DEFAULT_DTYPE Float32 function toTypeFlag{T <: DType}(:: Type{T}) if T == Float32 @@ -127,13 +128,32 @@ function context(arr :: NDArray) return Context(ref_typeid[], ref_devid[]) end + +#=doc +.. function:: + empty(DType, shape :: Tuple, ctx :: Context) + empty(DType, shape :: Tuple) + empty(DType, dim1, dim2, ...) + + Allocate memory for an uninitialized :class:`NDArray` with a specified type. 
+=# +function empty{N,T<:DType}(::Type{T}, shape :: NTuple{N, Int}) + empty(T, shape, cpu()) +end +function empty{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) + NDArray(_ndarray_alloc(T, shape, ctx, false)) +end +function empty{T<:DType}(:: Type{T}, shape :: Int...) + empty(T, shape) +end + #=doc .. function:: empty(shape :: Tuple, ctx :: Context) empty(shape :: Tuple) empty(dim1, dim2, ...) - Allocate memory for an uninitialized :class:`NDArray` with specific shape. + Allocate memory for an uninitialized :class:`NDArray` with specific shape of type Float32. =# function empty{N}(shape :: NTuple{N, Int}) empty(shape, cpu()) @@ -150,6 +170,26 @@ Interface functions similar to Julia Arrays ------------------------------------------- =# +#=doc +.. function:: + zeros(DType, shape :: Tuple, ctx :: Context) + zeros(DType, shape :: Tuple) + zeros(DType, dim1, dim2, ...) + + Create zero-ed :class:`NDArray` with specific shape and type +=# +function zeros{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}) + zeros(T, shape, cpu()) +end +function zeros{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) + arr = empty(T, shape, ctx) + arr[:] = zero(T) + return arr +end +function zeros{T<:DType}(:: Type{T}, shape :: Int...) + zeros(T, shape) +end + #=doc .. function:: zeros(shape :: Tuple, ctx :: Context) @@ -170,6 +210,26 @@ function zeros(shape :: Int...) zeros(shape) end +#=doc +.. function:: + ones(DType, shape :: Tuple, ctx :: Context) + ones(DType, shape :: Tuple) + ones(DType, dim1, dim2, ...) + + Create an :class:`NDArray` with specific shape & type, and initialize with 1. +=# +function ones{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}) + ones(T, shape, cpu()) +end +function ones{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) + arr = empty(T, shape, ctx) + arr[:] = one(T) + return arr +end +function ones{T<:DType}(:: Type{T}, shape :: Int...) + ones(T, shape) +end + #=doc .. 
function:: ones(shape :: Tuple, ctx :: Context) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 444aa90616fe..6750e9eb5914 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -271,6 +271,19 @@ function test_dot() @test size(z) == (2, 8) end +function test_eltype() + info("NDArray::eltype") + dims1 = (3,3) + + x = mx.empty(dims1) + @test eltype(x) == mx.DEFAULT_DTYPE + + for TF in instances(mx.TypeFlag) + T = mx.fromTypeFlag(TF) + x = mx.empty(T, dims1) + @test eltype(x) == T + end +end ################################################################################ # Run tests @@ -286,6 +299,7 @@ test_gd() test_saveload() test_clip() test_sqrt() +test_eltype() test_nd_as_jl() test_dot() From c161fe16c204685bf96aa58008066ab15ea3f940 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 May 2016 13:56:10 +0900 Subject: [PATCH 332/630] make arithmetic work with DType and extend arithmetic tests on all types --- src/ndarray.jl | 41 ++++++++++++++++++++------------------- test/unittest/bind.jl | 24 ++++++++++++----------- test/unittest/ndarray.jl | 13 +++++++++++++ test/unittest/operator.jl | 2 +- 4 files changed, 48 insertions(+), 32 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index f903a797fb66..1c34c45d0c33 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -20,7 +20,7 @@ function toTypeFlag{T <: DType}(:: Type{T}) elseif T == Int32 return kInt32 else - throw(ArgumentError("Can't convert $T to Dtype.")) + throw(ArgumentError("Can't convert $T to DType.")) end end @@ -36,7 +36,7 @@ function fromTypeFlag(T :: TypeFlag) elseif T == kInt32 return Int32 else - throw(ArgumentError("Can't convert Dtype $T.")) + throw(ArgumentError("Can't convert DType $T.")) end end @@ -353,7 +353,7 @@ import Base: setindex! 
=# function setindex!(arr :: NDArray, val :: Real, ::Colon) @assert(arr.writable) - _set_value(val, arr) + _set_value(convert(eltype(arr), val), arr) return arr end function setindex!{T<:Real}(arr :: NDArray, val :: Array{T}, ::Colon) @@ -426,9 +426,10 @@ function copy!(dst :: NDArray, src :: NDArray) return dst end -function copy!(dst :: Array{MX_float}, src :: NDArray) +function copy!{T<:DType}(dst :: Array{T}, src :: NDArray) + @assert T == eltype(src) @assert size(dst) == size(src) - @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{MX_float}, Csize_t), + @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{Void}, Csize_t), src, pointer(dst), length(dst)) return dst end @@ -439,8 +440,8 @@ end function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) @assert dst.writable @assert size(dst) == size(src) - src = convert(Array{MX_float}, src) # this might involve copying - @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t), + src = convert(Array{eltype(dst)}, src) # this might involve copying + @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{Void}, Csize_t), dst.handle, pointer(src), length(src)) return dst end @@ -448,8 +449,8 @@ end function copy_ignore_shape!{T<:Real}(dst :: NDArray, src :: Array{T}) @assert dst.writable @assert length(dst) == length(src) - src = convert(Array{MX_float}, src) # this might involve copying - @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{MX_float}, Csize_t), + src = convert(Array{eltype(dst)}, src) # this might involve copying + @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{Void}, Csize_t), dst.handle, pointer(src), length(src)) return dst end @@ -466,19 +467,19 @@ end =# # Create copy: NDArray -> Julia Array function copy(arr :: NDArray) - j_arr = Array(MX_float, size(arr)) + j_arr = Array{eltype(arr)}(size(arr)) copy!(j_arr, arr) end # Create copy: NDArray -> NDArray in a given context function copy(arr :: NDArray, ctx :: Context) - dst = NDArray(_ndarray_alloc(size(arr), ctx, true)) + dst = 
NDArray(_ndarray_alloc(eltype(arr), size(arr), ctx, true)) copy!(dst, arr) end # Create copy: Julia Array -> NDArray in a given context -function copy{T<:Real}(arr :: Array{T}, ctx :: Context) - dst = empty(size(arr), ctx) +function copy{T<:DType}(arr :: Array{T}, ctx :: Context) + dst = empty(T, size(arr), ctx) copy!(dst, arr) end @@ -543,7 +544,7 @@ function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) @assert dst.writable for arg in args if isa(arg, Real) - _plus_scalar(dst, arg, dst) + _plus_scalar(dst, convert(eltype(dst), arg), dst) else _plus(dst, arg, dst) end @@ -583,7 +584,7 @@ end function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) - _minus_scalar(dst, arg, dst) + _minus_scalar(dst, convert(eltype(dst), arg), dst) else _minus(dst, arg, dst) end @@ -628,7 +629,7 @@ end function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) - _mul_scalar(dst, arg, dst) + _mul_scalar(dst, convert(eltype(dst), arg), dst) else _mul(dst, arg, dst) end @@ -673,7 +674,7 @@ end function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) - _div_scalar(dst, arg, dst) + _div_scalar(dst, convert(eltype(dst), arg), dst) else _div(dst, arg, dst) end @@ -821,7 +822,7 @@ import Base.pointer function pointer(arr :: NDArray) pdata = Ref{Ptr{MX_float}}(0) @mxcall(:MXNDArrayGetData, (MX_handle, Ref{Ptr{MX_float}}), arr, pdata) - return pdata[] + return convert(Ptr{eltype(arr)}, pdata[]) end function _wait_to_read(arr :: NDArray) @mxcall(:MXNDArrayWaitToRead, (MX_handle,), arr) @@ -861,10 +862,10 @@ end :param Array j_arr: the Julia Array. :param NDArray arr: the :class:`NDArray`. 
=# -function is_shared{T}(j_arr :: Array{T}, arr :: NDArray) +function is_shared(j_arr :: Array, arr :: NDArray) false end -function is_shared(j_arr :: Array{MX_float}, arr :: NDArray) +function is_shared{T<:DType}(j_arr :: Array{T}, arr :: NDArray) if length(j_arr) != length(arr) return false end diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index 760e261fe581..6e1b821aa418 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -7,19 +7,19 @@ using ..Main: rand_dims, reldiff ################################################################################ # Test Implementations ################################################################################ -function test_arithmetic(uf, gf) +function test_arithmetic{T <: mx.DType}(::Type{T}, uf, gf) shape = rand_dims() - info("Bind::arithmetic::$uf::dims = $shape") + info("Bind::arithmetic::$T::$uf::dims = $shape") lhs = mx.Variable(:lhs) rhs = mx.Variable(:rhs) ret = uf(lhs, rhs) @test mx.list_arguments(ret) == [:lhs, :rhs] - lhs_arr = mx.NDArray(rand(shape)) - rhs_arr = mx.NDArray(rand(shape)) - lhs_grad = mx.empty(shape) - rhs_grad = mx.empty(shape) + lhs_arr = mx.NDArray(rand(T, shape)) + rhs_arr = mx.NDArray(rand(T, shape)) + lhs_grad = mx.empty(T, shape) + rhs_grad = mx.empty(T, shape) exec2 = mx.bind(ret, mx.Context(mx.CPU), [lhs_arr, rhs_arr], args_grad=[lhs_grad, rhs_grad]) exec3 = mx.bind(ret, mx.Context(mx.CPU), [lhs_arr, rhs_arr]) @@ -39,7 +39,7 @@ function test_arithmetic(uf, gf) @test reldiff(out1, out4) < 1e-6 # test gradients - out_grad = mx.NDArray(ones(shape)) + out_grad = mx.NDArray(ones(T, shape)) lhs_grad2, rhs_grad2 = gf(copy(out_grad), copy(lhs_arr), copy(rhs_arr)) mx.backward(exec2, out_grad) @test reldiff(copy(lhs_grad), lhs_grad2) < 1e-6 @@ -55,10 +55,12 @@ function test_arithmetic(uf, gf) end function test_arithmetic() - test_arithmetic(.+, (g,x,y) -> (g,g)) - test_arithmetic(.-, (g,x,y) -> (g,-g)) - test_arithmetic(.*, (g,x,y) -> (y.*g, x.*g)) - 
test_arithmetic(./, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) + for T in [mx.fromTypeFlag(TF) for TF in instances(mx.TypeFlag)] + test_arithmetic(T, .+, (g,x,y) -> (g,g)) + test_arithmetic(T, .-, (g,x,y) -> (g,-g)) + test_arithmetic(T, .*, (g,x,y) -> (y.*g, x.*g)) + test_arithmetic(T, ./, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) + end end ################################################################################ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 6750e9eb5914..f76d8cd95b59 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -44,11 +44,24 @@ function test_assign() array2 = mx.zeros(size(tensor)) @test reldiff(zeros(size(tensor)), copy(array2)) < 1e-6 + array3 = mx.zeros(Float16, size(tensor)) + @test reldiff(zeros(Float16, size(tensor)), copy(array2)) < 1e-6 + # scalar -> NDArray assignment scalar = rand() array2[:] = scalar @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < 1e-6 + scalar = rand(Float16) + array2[:] = scalar + @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < 1e-6 + + scalar = rand(Float64) + array2[:] = scalar + array3[:] = scalar + @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < 1e-6 + @test reldiff(zeros(Float16,size(tensor))+scalar, copy(array3)) < 1e-6 + # NDArray -> NDArray assignment array[:] = array2 @test reldiff(zeros(size(tensor))+scalar, copy(array)) < 1e-6 diff --git a/test/unittest/operator.jl b/test/unittest/operator.jl index 2284b1080c7e..f4332582428c 100644 --- a/test/unittest/operator.jl +++ b/test/unittest/operator.jl @@ -9,7 +9,7 @@ function test_scalar_op() shape = rand_dims() info("Operator::scalar_op::dims = $shape") - data_jl = 5ones(shape) + data_jl = 5ones(Float32, shape) arr_data = mx.copy(data_jl, mx.cpu()) arr_grad = mx.zeros(shape) From 2916a8f5da0f31a4ca8d66afbc86c97cf3791a51 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 May 2016 16:49:47 +0900 Subject: [PATCH 333/630] turn macro into helper function --- 
src/symbolic-node.jl | 87 ++++++++++++++++++++++---------------------- 1 file changed, 43 insertions(+), 44 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index da251e4cc74f..dbc3eb7dd26d 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -236,53 +236,52 @@ function Group(nodes :: SymbolicNode...) SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -macro _infer_shape(self, keys, indptr, sdata) - quote - ref_arg_shape_size = Ref{MX_uint}(0) - ref_arg_shape_ndim = Ref{Ptr{MX_uint}}(0) - ref_arg_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) - ref_out_shape_size = Ref{MX_uint}(0) - ref_out_shape_ndim = Ref{Ptr{MX_uint}}(0) - ref_out_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) - ref_aux_shape_size = Ref{MX_uint}(0) - ref_aux_shape_ndim = Ref{Ptr{MX_uint}}(0) - ref_aux_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) - ref_complete = Ref{Cint}(0) - @mxcall(:MXSymbolInferShape, - (MX_handle, MX_uint, char_pp, Ptr{MX_uint}, Ptr{MX_uint}, - Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, - Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, - Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, - Ref{Cint}), - self, length(indptr)-1, keys, indptr, sdata, - ref_arg_shape_size, ref_arg_shape_ndim, ref_arg_shape_data, - ref_out_shape_size, ref_out_shape_ndim, ref_out_shape_data, - ref_aux_shape_size, ref_aux_shape_ndim, ref_aux_shape_data, - ref_complete) - if ref_complete[] == 0 - return (nothing, nothing, nothing) - else - function build_shapes(shape_size::MX_uint, shape_ndim::Ptr{MX_uint}, shape_data::Ptr{Ptr{MX_uint}}) - shape_ndim = pointer_to_array(shape_ndim, shape_size) - shape_data = pointer_to_array(shape_data, shape_size) - shapes = map(1:shape_size) do i - my_shape = pointer_to_array(shape_data[i], shape_ndim[i]) - tuple(flipdim(Int[my_shape...],1)...) 
- end - convert(Vector{Tuple}, shapes) - end - return ( - build_shapes(ref_arg_shape_size[], ref_arg_shape_ndim[], ref_arg_shape_data[]), - build_shapes(ref_out_shape_size[], ref_out_shape_ndim[], ref_out_shape_data[]), - build_shapes(ref_aux_shape_size[], ref_aux_shape_ndim[], ref_aux_shape_data[]) - ) - end +function _build_shapes(shape_size::MX_uint, shape_ndim::Ptr{MX_uint}, shape_data::Ptr{Ptr{MX_uint}}) + shape_ndim = pointer_to_array(shape_ndim, shape_size) + shape_data = pointer_to_array(shape_data, shape_size) + shapes = map(1:shape_size) do i + my_shape = pointer_to_array(shape_data[i], shape_ndim[i]) + tuple(flipdim(Int[my_shape...],1)...) + end + convert(Vector{Tuple}, shapes) +end + +function _infer_shape(self, keys, indptr, sdata) + ref_arg_shape_size = Ref{MX_uint}(0) + ref_arg_shape_ndim = Ref{Ptr{MX_uint}}(0) + ref_arg_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) + ref_out_shape_size = Ref{MX_uint}(0) + ref_out_shape_ndim = Ref{Ptr{MX_uint}}(0) + ref_out_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) + ref_aux_shape_size = Ref{MX_uint}(0) + ref_aux_shape_ndim = Ref{Ptr{MX_uint}}(0) + ref_aux_shape_data = Ref{Ptr{Ptr{MX_uint}}}(0) + ref_complete = Ref{Cint}(0) + @mxcall(:MXSymbolInferShape, + (MX_handle, MX_uint, char_pp, Ptr{MX_uint}, Ptr{MX_uint}, + Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, + Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, + Ref{MX_uint}, Ref{Ptr{MX_uint}}, Ref{Ptr{Ptr{MX_uint}}}, + Ref{Cint}), + self, length(indptr)-1, keys, indptr, sdata, + ref_arg_shape_size, ref_arg_shape_ndim, ref_arg_shape_data, + ref_out_shape_size, ref_out_shape_ndim, ref_out_shape_data, + ref_aux_shape_size, ref_aux_shape_ndim, ref_aux_shape_data, + ref_complete) + if ref_complete[] == 0 + return (nothing, nothing, nothing) + else + return ( + _build_shapes(ref_arg_shape_size[], ref_arg_shape_ndim[], ref_arg_shape_data[]), + _build_shapes(ref_out_shape_size[], ref_out_shape_ndim[], ref_out_shape_data[]), + _build_shapes(ref_aux_shape_size[], 
ref_aux_shape_ndim[], ref_aux_shape_data[]) + ) end end #=doc .. function:: - infer_shape(self :: SymbolicNode; args...) + infer_shape(self :: SymbolicNode, args...) infer_shape(self :: SymbolicNode; kwargs...) Do shape inference according to the input shapes. The input shapes could be provided @@ -302,7 +301,7 @@ function infer_shape(self :: SymbolicNode; kwargs...) push!(indptr, length(sdata)) end keys = AbstractString[string(x[1]) for x in kwargs] - @_infer_shape(self, keys, indptr, sdata) + _infer_shape(self, keys, indptr, sdata) end function infer_shape(self :: SymbolicNode, args :: Union{Tuple, Void}...) sdata = MX_uint[] @@ -313,7 +312,7 @@ function infer_shape(self :: SymbolicNode, args :: Union{Tuple, Void}...) push!(indptr, length(sdata)) end keys = Ptr{char_p}(0) - @_infer_shape(self, keys, indptr, sdata) + _infer_shape(self, keys, indptr, sdata) end #=doc From dc405e73fd6558c2944edbe76c03c6d91bbb4033 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 May 2016 17:57:43 +0900 Subject: [PATCH 334/630] add type_infer --- src/symbolic-node.jl | 64 ++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 64 insertions(+) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index dbc3eb7dd26d..94e45188038a 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -315,6 +315,70 @@ function infer_shape(self :: SymbolicNode, args :: Union{Tuple, Void}...) 
_infer_shape(self, keys, indptr, sdata) end +function _infer_type(self, keys, arg_type_data) + ref_in_type_size = Ref{MX_uint}() + ref_in_type_data = Ref{Ptr{Cint}}() + ref_out_type_size = Ref{MX_uint}() + ref_out_type_data = Ref{Ptr{Cint}}() + ref_aux_type_size = Ref{MX_uint}() + ref_aux_type_data = Ref{Ptr{Cint}}() + ref_complete = Ref{Cint}() + + @mxcall(:MXSymbolInferType, + (MX_handle, MX_uint, char_pp, Ptr{Cint}, + Ref{MX_uint}, Ref{Ptr{Cint}}, + Ref{MX_uint}, Ref{Ptr{Cint}}, + Ref{MX_uint}, Ref{Ptr{Cint}}, + Ref{Cint}), + self, length(arg_type_data)-1, keys, arg_type_data, + ref_in_type_size, ref_in_type_data, + ref_out_type_size, ref_out_type_data, + ref_aux_type_size, ref_aux_type_data, + ref_complete) + + if ref_complete[] == 0 + return (nothing, nothing, nothing) + else + in_type = pointer_to_array(ref_in_type_data[], ref_in_type_size[]) + out_type = pointer_to_array(ref_out_type_data[], ref_out_type_size[]) + aux_type = pointer_to_array(ref_aux_type_data[], ref_aux_type_size[]) + return ([fromTypeFlag(TypeFlag(t)) for t in in_type], + [fromTypeFlag(TypeFlag(t)) for t in out_type], + [fromTypeFlag(TypeFlag(t)) for t in aux_type]) + end +end + +#=doc +.. function:: + infer_type(self :: SymbolicNode; kwargs...) + infer_type(self :: SymbolicNode, args...) + + Do type inference according to the input types. The input types could be provided + as a list of types, which should specify the types of inputs in the same order as + the arguments returned by :func:`list_arguments`. Alternatively, the type information + could be specified via keyword arguments. + + :return: A 3-tuple containing types of all the arguments, types of all the outputs and + types of all the auxiliary variables. If type inference failed due to incomplete + or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. +=# +function infer_type(self :: SymbolicNode; kwargs...) 
+ types = Cint[toTypeFlag(x[2]) for x in kwargs] + keys = AbstractString[string(x[1]) for x in kwargs] + _infer_type(self, keys, types) +end + +function infer_type(self :: SymbolicNode, args :: Union{Tuple, Void}...) + types = Cint[] + keys = Ptr{char_p}(0) + + for arg in args + if isa(arg, Void); continue; end + push!(types, toTypeFlag(arg)) + end + _infer_type(self, keys, types) +end + #=doc .. function:: getindex(self :: SymbolicNode, idx :: Union{Int, Base.Symbol, AbstractString}) From 4a4ea61d08f2eb77fa8aef781ca25dad2a5b8229 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Mon, 30 May 2016 12:51:38 +0900 Subject: [PATCH 335/630] make bind tests use isapprox and don't run division tests for Integer types --- test/unittest/bind.jl | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index 6e1b821aa418..64ae2cd95592 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -34,24 +34,24 @@ function test_arithmetic{T <: mx.DType}(::Type{T}, uf, gf) out2 = copy(exec2.outputs[1]) out3 = copy(exec3.outputs[1]) out4 = copy(exec4.outputs[1]) - @test reldiff(out1, out2) < 1e-6 - @test reldiff(out1, out3) < 1e-6 - @test reldiff(out1, out4) < 1e-6 + @test isapprox(out1, out2) + @test isapprox(out1, out3) + @test isapprox(out1, out4) # test gradients out_grad = mx.NDArray(ones(T, shape)) lhs_grad2, rhs_grad2 = gf(copy(out_grad), copy(lhs_arr), copy(rhs_arr)) mx.backward(exec2, out_grad) - @test reldiff(copy(lhs_grad), lhs_grad2) < 1e-6 - @test reldiff(copy(rhs_grad), rhs_grad2) < 1e-6 + @test isapprox(copy(lhs_grad), lhs_grad2) + @test isapprox(copy(rhs_grad), rhs_grad2) # reset grads lhs_grad[:] = 0 rhs_grad[:] = 0 # compute using another binding mx.backward(exec4, out_grad) - @test reldiff(copy(lhs_grad), lhs_grad2) < 1e-6 - @test reldiff(copy(rhs_grad), rhs_grad2) < 1e-6 + @test isapprox(copy(lhs_grad), lhs_grad2) + @test isapprox(copy(rhs_grad), rhs_grad2) end function 
test_arithmetic() @@ -59,7 +59,7 @@ function test_arithmetic() test_arithmetic(T, .+, (g,x,y) -> (g,g)) test_arithmetic(T, .-, (g,x,y) -> (g,-g)) test_arithmetic(T, .*, (g,x,y) -> (y.*g, x.*g)) - test_arithmetic(T, ./, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) + T <: Integer || test_arithmetic(T, ./, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) end end From affebe675eaa4761475768ed5386439f5d828dd1 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 7 Jun 2016 11:35:32 +0900 Subject: [PATCH 336/630] Exclude division test for Float16 --- test/unittest/bind.jl | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index 64ae2cd95592..c764435d5a9c 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -59,7 +59,11 @@ function test_arithmetic() test_arithmetic(T, .+, (g,x,y) -> (g,g)) test_arithmetic(T, .-, (g,x,y) -> (g,-g)) test_arithmetic(T, .*, (g,x,y) -> (y.*g, x.*g)) - T <: Integer || test_arithmetic(T, ./, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) + if T <: Integer || T == Float16 + warn("Not running division test for $T") + else + test_arithmetic(T, ./, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) + end end end From 9a827f796a2d574c68d87f359c679c1ccc1a50ad Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 7 Jun 2016 11:43:52 +0900 Subject: [PATCH 337/630] fix blas_vendor for v0.5 --- deps/build.jl | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index e0e0a0e1388f..9449c6337102 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -30,8 +30,14 @@ if !libmxnet_detected openblas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) + if VERSION >= v"0.5.0-dev+4338" + blas_vendor = Base.BLAS.vendor() + else + blas_vendor = Base.blas_vendor() + end + ilp64 = "" - if Base.blas_vendor() == :openblas64 + if blas_vendor == :openblas64 ilp64 = "-DINTERFACE64" end From 5e70cb96e9de4a7a18d347d5f15bd42ea46e3e99 Mon Sep 17 00:00:00 2001 From: Valentin 
Churavy Date: Tue, 5 Jul 2016 09:23:15 +0900 Subject: [PATCH 338/630] start transitioning to Documenter.jl --- .gitignore | 2 ++ docs/make.jl | 3 +++ docs/src/index.md | 0 3 files changed, 5 insertions(+) create mode 100644 docs/make.jl create mode 100644 docs/src/index.md diff --git a/.gitignore b/.gitignore index e2b2ea70b3fc..3325a370ecaf 100644 --- a/.gitignore +++ b/.gitignore @@ -8,3 +8,5 @@ deps/src deps/usr deps/deps.jl docs/_build +docs/build/ +docs/site/ diff --git a/docs/make.jl b/docs/make.jl new file mode 100644 index 000000000000..1a20e2b93826 --- /dev/null +++ b/docs/make.jl @@ -0,0 +1,3 @@ +using Documenter, MXNet + +makedocs() diff --git a/docs/src/index.md b/docs/src/index.md new file mode 100644 index 000000000000..e69de29bb2d1 From ce16bfe76d0aee40d7c157de2f7718a9b5ab4739 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 5 Jul 2016 23:41:16 +0900 Subject: [PATCH 339/630] split import_ndarry functions up --- src/ndarray.jl | 192 ++++++++++++++++++++++++++----------------------- 1 file changed, 104 insertions(+), 88 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 1c34c45d0c33..82b421651a4f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -988,110 +988,126 @@ object (:class:`NDArray`) is returned. 
Otherwise, a tuple containing all the out **autogen:EMBED:ndarray:EMBED:autogen** =# -function _import_ndarray_functions(;gen_docs=false) - n_ref = Ref{MX_uint}(0) - h_ref = Ref{Ptr{MX_handle}}(0) - @mxcall(:MXListFunctions, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) - n_funcs = n_ref[] - h_funcs = pointer_to_array(h_ref[], n_funcs) +function _get_ndarray_functions() + n = Ref{MX_uint}(0) + handles = Ref{Ptr{MX_handle}}(0) - if gen_docs - docs = Dict{Base.Symbol, AbstractString}() - end + @mxcall(:MXListFunctions, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n, handles) - for i = 1:n_funcs - func_handle = h_funcs[i] + funcs = unsafe_wrap(Array, handles[], n[]) + return funcs +end - #---------------------------------------- - # get function information (human readable) - ref_name = Ref{char_p}(0) - ref_desc = Ref{char_p}(0) - ref_narg = Ref{MX_uint}(0) +function _get_function_description(handle :: MX_handle) + # get function information (human readable) + ref_name = Ref{char_p}(0) + ref_desc = Ref{char_p}(0) + ref_narg = Ref{MX_uint}(0) - ref_arg_names = Ref{char_pp}(0) - ref_arg_types = Ref{char_pp}(0) - ref_arg_descs = Ref{char_pp}(0) + ref_arg_names = Ref{char_pp}(0) + ref_arg_types = Ref{char_pp}(0) + ref_arg_descs = Ref{char_pp}(0) - ref_ret_type = Ref{char_p}(0) + ref_ret_type = Ref{char_p}(0) - @mxcall(:MXFuncGetInfo, - (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, - Ref{char_pp}, Ref{char_pp}, Ref{char_p}), - func_handle, ref_name, ref_desc, ref_narg, ref_arg_names, - ref_arg_types, ref_arg_descs, ref_ret_type) + @mxcall(:MXFuncGetInfo, + (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, + Ref{char_pp}, Ref{char_pp}, Ref{char_p}), + handle, ref_name, ref_desc, ref_narg, ref_arg_names, + ref_arg_types, ref_arg_descs, ref_ret_type) - func_name = Symbol(@compat String(ref_name[])) + name = Symbol(unsafe_wrap(String, ref_name[])) - if gen_docs - # generate document only - f_desc = @compat String(ref_desc[]) * "\n\n" - f_desc 
*= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) - docs[func_name] = f_desc - else - #---------------------------------------- - # get function specification - ref_n_use_vars = Ref{MX_uint}(0) - ref_n_scalars = Ref{MX_uint}(0) - ref_n_mut_vars = Ref{MX_uint}(0) - ref_type_mask = Ref{Cint}(0) - @mxcall(:MXFuncDescribe, - (MX_handle, Ref{MX_uint}, Ref{MX_uint}, Ref{MX_uint}, Ref{Cint}), - func_handle, ref_n_use_vars, ref_n_scalars, ref_n_mut_vars, ref_type_mask) - - #---------------------------------------- - # prepare function definition - n_used_vars = ref_n_use_vars[] - n_scalars = ref_n_scalars[] - n_mutate_vars = ref_n_mut_vars[] - type_mask = ref_type_mask[] - accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 - arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 - - # general ndarray function - if arg_before_scalar - args = vcat([Expr(:(::), Symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), Symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), Symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - else - args = vcat([Expr(:(::), Symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), Symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), Symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - end + desc = unsafe_wrap(String, ref_desc[]) * "\n\n" + desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) + return name, desc +end - _use_vars = Expr(:ref, :MX_handle, [Symbol("in$i") for i=1:n_used_vars]...) - _scalars = Expr(:ref, :MX_float, [Symbol("sca$i") for i=1:n_scalars]...) - _mut_vars = Expr(:ref, :MX_handle, [Symbol("out$i") for i=1:n_mutate_vars]...) 
+function _get_function_expressions(handle :: MX_handle, name) + # get function specification + ref_n_use_vars = Ref{MX_uint}(0) + ref_n_scalars = Ref{MX_uint}(0) + ref_n_mut_vars = Ref{MX_uint}(0) + ref_type_mask = Ref{Cint}(0) + @mxcall(:MXFuncDescribe, + (MX_handle, Ref{MX_uint}, Ref{MX_uint}, Ref{MX_uint}, Ref{Cint}), + handle, ref_n_use_vars, ref_n_scalars, ref_n_mut_vars, ref_type_mask) - # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped - # See https://github.com/dmlc/MXNet.jl/issues/55 - if func_name == :dot - _use_vars.args[2:end] = flipdim(_use_vars.args[2:end], 1) - end + n_used_vars = ref_n_use_vars[] + n_scalars = ref_n_scalars[] + n_mutate_vars = ref_n_mut_vars[] + type_mask = ref_type_mask[] + accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 + arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 - stmt_call = Expr(:call, :_invoke_mxfunction, func_handle, _use_vars, _scalars, _mut_vars) - if n_mutate_vars == 1 - stmt_ret = :(return out1) - else - stmt_ret = Expr(:return, Expr(:tuple, [Symbol("out$i") for i=1:n_mutate_vars]...)) - end + # general ndarray function + if arg_before_scalar + args = vcat([Expr(:(::), Symbol("in$i"), NDArray) for i=1:n_used_vars], + [Expr(:(::), Symbol("sca$i"), Real) for i=1:n_scalars], + [Expr(:(::), Symbol("out$i"), NDArray) for i=1:n_mutate_vars]) + else + args = vcat([Expr(:(::), Symbol("sca$i"), Real) for i=1:n_scalars], + [Expr(:(::), Symbol("in$i"), NDArray) for i=1:n_used_vars], + [Expr(:(::), Symbol("out$i"), NDArray) for i=1:n_mutate_vars]) + end + + _use_vars = Expr(:ref, :MX_handle, [Symbol("in$i") for i=1:n_used_vars]...) + _scalars = Expr(:ref, :MX_float, [Symbol("sca$i") for i=1:n_scalars]...) + _mut_vars = Expr(:ref, :MX_handle, [Symbol("out$i") for i=1:n_mutate_vars]...) 
+ + # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped + # See https://github.com/dmlc/MXNet.jl/issues/55 + if name == :dot + _use_vars.args[2:end] = flipdim(_use_vars.args[2:end], 1) + end - func_body = Expr(:block, stmt_call, stmt_ret) - func_head = Expr(:call, func_name, args...) + stmt_call = Expr(:call, :_invoke_mxfunction, handle, _use_vars, _scalars, _mut_vars) + if n_mutate_vars == 1 + stmt_ret = :(return out1) + else + stmt_ret = Expr(:return, Expr(:tuple, [Symbol("out$i") for i=1:n_mutate_vars]...)) + end + + func_body = Expr(:block, stmt_call, stmt_ret) + func_head = Expr(:call, name, args...) + + func_def = Expr(:function, func_head, func_body) + exprs = Expr[func_def] + + if accept_empty_mutate + args0 = args[1:n_used_vars+n_scalars] + func_head0 = Expr(:call, name, args0...) + _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] + stmt_call0 = Expr(:call, name, args0..., _mut_vars0...) + func_body0 = Expr(:block, stmt_call0) + func_head0 = Expr(:call, name, args0...) + + func_def0 = Expr(:function, func_head0, func_body0) + push!(exprs, func_def0) + end + return exprs +end - func_def = Expr(:function, func_head, func_body) - eval(func_def) +function _import_ndarray_functions(;gen_docs=false) + funcs = _get_ndarray_functions() + + if gen_docs + docs = Dict{Symbol, String}() + end - if accept_empty_mutate - args0 = args[1:n_used_vars+n_scalars] - func_head0 = Expr(:call, func_name, args0...) - _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] - stmt_call0 = Expr(:call, func_name, args0..., _mut_vars0...) - func_body0 = Expr(:block, stmt_call0) - func_head0 = Expr(:call, func_name, args0...) 
+ for i = 1:length(funcs) + handle = funcs[i] - func_def0 = Expr(:function, func_head0, func_body0) - eval(func_def0) + name, desc = _get_function_description(handle) + + if gen_docs + # generate document only + docs[name] = desc + else + exprs = _get_function_expressions(handle, name) + for expr in exprs + eval(expr) end end end From f09362c92c2ea93289badcc992ae520047251f54 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Jul 2016 00:36:05 +0900 Subject: [PATCH 340/630] add mxnet.so as a dependency --- src/base.jl | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/base.jl b/src/base.jl index bd67a7c2ac52..ba1fda2e258c 100644 --- a/src/base.jl +++ b/src/base.jl @@ -24,6 +24,8 @@ if isempty(MXNET_LIB) # MXNet.ji will be re-compiled to get MXNET_LIB properly. touch(@__FILE__) error("Cannot find or load libmxnet.so. Please see the document on how to build it.") +else + include_dependency(MXNET_LIB) end function __init__() From 411a08bca644253fff7acb7125fdc933af932fc8 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Jul 2016 00:36:53 +0900 Subject: [PATCH 341/630] simplify _import_ndarray --- src/ndarray.jl | 24 +++++++----------------- 1 file changed, 7 insertions(+), 17 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 82b421651a4f..b82787c18c97 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1089,31 +1089,21 @@ function _get_function_expressions(handle :: MX_handle, name) return exprs end -function _import_ndarray_functions(;gen_docs=false) +function _import_ndarray_functions() funcs = _get_ndarray_functions() - - if gen_docs - docs = Dict{Symbol, String}() - end + func_exprs = Expr[] for i = 1:length(funcs) handle = funcs[i] name, desc = _get_function_description(handle) + exprs = _get_function_expressions(handle, name) - if gen_docs - # generate document only - docs[name] = desc - else - exprs = _get_function_expressions(handle, name) - for expr in exprs - eval(expr) - end + expr = quote + $(exprs...) 
+ @doc $desc $name end - end - - if gen_docs - return docs + eval(expr) end end From 7b65547780e1868b4944423847e18e9a77e19559 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Jul 2016 00:59:46 +0900 Subject: [PATCH 342/630] implement _import_ndarray functions as macro --- src/MXNet.jl | 2 +- src/base.jl | 1 - src/ndarray.jl | 23 +++++++++++++++++++---- 3 files changed, 20 insertions(+), 6 deletions(-) diff --git a/src/MXNet.jl b/src/MXNet.jl index cdbacbe64be0..c447617e7fbf 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -18,6 +18,7 @@ import Base: round, ceil, floor, cos, sin, abs, sign, exp, sqrt, exp, log, norm, include("base.jl") include("context.jl") +include("util.jl") include("ndarray.jl") include("random.jl") @@ -36,7 +37,6 @@ include("kvstore.jl") include("callback.jl") include("model.jl") -include("util.jl") include("visualize.jl") include("nn-factory.jl") diff --git a/src/base.jl b/src/base.jl index ba1fda2e258c..578647e30486 100644 --- a/src/base.jl +++ b/src/base.jl @@ -29,7 +29,6 @@ else end function __init__() - _import_ndarray_functions() _import_atomic_symbol_creators() _import_io_iterators() diff --git a/src/ndarray.jl b/src/ndarray.jl index b82787c18c97..a555e201725b 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -999,6 +999,13 @@ function _get_ndarray_functions() return funcs end +function _get_function(name :: String) + handle = Ref{MX_handle}(0) + + @mxcall(:MXGetFunction, (Cstring, Ref{MX_handle}), name, handle) + return handle[] +end + function _get_function_description(handle :: MX_handle) # get function information (human readable) ref_name = Ref{char_p}(0) @@ -1061,8 +1068,10 @@ function _get_function_expressions(handle :: MX_handle, name) if name == :dot _use_vars.args[2:end] = flipdim(_use_vars.args[2:end], 1) end - - stmt_call = Expr(:call, :_invoke_mxfunction, handle, _use_vars, _scalars, _mut_vars) + stmt_call = quote + local handle = _get_function($(string(name))) + _invoke_mxfunction(handle, $_use_vars, $_scalars, 
$_mut_vars) + end if n_mutate_vars == 1 stmt_ret = :(return out1) else @@ -1089,7 +1098,7 @@ function _get_function_expressions(handle :: MX_handle, name) return exprs end -function _import_ndarray_functions() +macro _import_ndarray_functions() funcs = _get_ndarray_functions() func_exprs = Expr[] @@ -1103,7 +1112,13 @@ function _import_ndarray_functions() $(exprs...) @doc $desc $name end - eval(expr) + + push!(func_exprs, expr) end + + esc(quote + $(func_exprs...) + end) end +@_import_ndarray_functions() From 89e2c8e9c7ce5c1d5da7674fcf831457fa889b7a Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Jul 2016 02:06:07 +0900 Subject: [PATCH 343/630] implement a function cache --- src/ndarray.jl | 18 ++++++++++++------ 1 file changed, 12 insertions(+), 6 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index a555e201725b..d78d647fe185 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -999,11 +999,17 @@ function _get_ndarray_functions() return funcs end -function _get_function(name :: String) - handle = Ref{MX_handle}(0) - - @mxcall(:MXGetFunction, (Cstring, Ref{MX_handle}), name, handle) - return handle[] +const _function_cache = Dict{Symbol, MX_handle}() +function _get_function(name :: Symbol) + if !haskey(_function_cache, name) + handle = Ref{MX_handle}(0) + + @mxcall(:MXGetFunction, (Cstring, Ref{MX_handle}), name, handle) + _function_cache[name] = handle[] + return handle[] + else + return _function_cache[name] + end end function _get_function_description(handle :: MX_handle) @@ -1069,7 +1075,7 @@ function _get_function_expressions(handle :: MX_handle, name) _use_vars.args[2:end] = flipdim(_use_vars.args[2:end], 1) end stmt_call = quote - local handle = _get_function($(string(name))) + local handle = _get_function($(QuoteNode(name))) _invoke_mxfunction(handle, $_use_vars, $_scalars, $_mut_vars) end if n_mutate_vars == 1 From 5b2bd3ee8948d57305eb950f6fb14fe7a383e7a5 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Jul 2016 02:57:18 
+0900 Subject: [PATCH 344/630] Refactor _import_atomic_symbol to be a macro --- src/base.jl | 2 +- src/symbolic-node.jl | 87 +++++++++++++++++++++++++++----------------- 2 files changed, 54 insertions(+), 35 deletions(-) diff --git a/src/base.jl b/src/base.jl index 578647e30486..32968ea0afb6 100644 --- a/src/base.jl +++ b/src/base.jl @@ -29,7 +29,7 @@ else end function __init__() - _import_atomic_symbol_creators() + _populate_symbol_creator_cache!() _import_io_iterators() atexit() do diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 94e45188038a..5bd1a6120f0e 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -580,7 +580,7 @@ libmxnet APIs ################################################################################ # Atomic SymbolicNode functions dynamically imported from libmxnet ################################################################################ -function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) +function _define_atomic_symbol_creator(hdr :: MX_handle) ref_name = Ref{char_p}(0) ref_desc = Ref{char_p}(0) ref_kv_nargs = Ref{char_p}(0) @@ -596,22 +596,19 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, ref_kv_nargs, ref_ret_type) - func_name_s= @compat String(ref_name[]) - func_name = Symbol(func_name_s) - kv_nargs_s = @compat String(ref_kv_nargs[]) - kv_nargs = Symbol(kv_nargs_s) + func_name_s = unsafe_wrap(String, ref_name[]) + func_name = Symbol(func_name_s) + kv_nargs_s = unsafe_wrap(String, ref_kv_nargs[]) + kv_nargs = Symbol(kv_nargs_s) - if gen_docs - f_desc = @compat String(ref_desc[]) * "\n\n" - if !isempty(kv_nargs_s) - f_desc *= "This function support variable length positional :class:`SymbolicNode` inputs.\n\n" - end - f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param Symbol name: The name of the :class:`SymbolicNode`. 
(e.g. `:my_symbol`), optional.\n" - f_desc *= ":param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`.\n\n" - f_desc *= ":return: $(_format_typestring(@compat String(ref_ret_type[]))).\n\n" - return (func_name, f_desc) + f_desc = unsafe_wrap(String, ref_desc[]) * "\n\n" + if !isempty(kv_nargs_s) + f_desc *= "This function support variable length positional :class:`SymbolicNode` inputs.\n\n" end + f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) + f_desc *= ":param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional.\n" + f_desc *= ":param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`.\n\n" + f_desc *= ":return: $(_format_typestring(unsafe_wrap(String, ref_ret_type[]))).\n\n" # function $func_name(args...; kwargs...) func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) @@ -623,10 +620,10 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) name = "" end - param_keys = AbstractString[] - param_vals = AbstractString[] + param_keys = String[] + param_vals = String[] symbol_kws = Dict{Symbol, SymbolicNode}() - attrs = Dict{Symbol, AbstractString}() + attrs = Dict{Symbol, String}() $(if kv_nargs != Symbol("") quote @@ -665,11 +662,13 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) end end) + local hdr = _get_symbol_creator($(QuoteNode(func_name))) + # create the SymbolicNode ref_sym_hdr = Ref{MX_handle}() @mxcall(:MXSymbolCreateAtomicSymbol, (MX_handle, MX_uint, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}), - $hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr) + hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr) sym_hdr = ref_sym_hdr[] node = SymbolicNode(MX_SymbolHandle(sym_hdr)) @@ -691,34 +690,54 @@ function _define_atomic_symbol_creator(hdr :: MX_handle; gen_docs=false) end func_def = 
Expr(:function, func_head, Expr(:block, func_body)) - eval(func_def) + quote + $func_def + @doc $f_desc $func_name + end end -function _import_atomic_symbol_creators(;gen_docs=false) +function _get_atomic_symbol_creators() n_ref = Ref{MX_uint}(0) h_ref = Ref{Ptr{MX_handle}}(0) @mxcall(:MXSymbolListAtomicSymbolCreators, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) - n_creators = n_ref[] - h_creators = pointer_to_array(h_ref[], n_creators) + return unsafe_wrap(Array, h_ref[], n_ref[]) +end - if gen_docs - docs = Dict{Base.Symbol, AbstractString}() - end +function _get_atomic_symbol_name(handle :: MX_handle) + name_r = Ref{char_p}(0) + @mxcall(:MXSymbolGetAtomicSymbolName, (MX_handle, Ref{char_p}), handle, name_r) + return unsafe_wrap(String, name_r[]) +end - for i = 1:n_creators - creator_hdr = h_creators[i] - ret = _define_atomic_symbol_creator(creator_hdr, gen_docs=gen_docs) - if gen_docs - docs[ret[1]] = ret[2] - end +const _symbol_creator_cache = Dict{Symbol, MX_handle}() +function _populate_symbol_creator_cache!() + empty!(_symbol_creator_cache) + h_creators = _get_atomic_symbol_creators() + for handle in h_creators + name = Symbol(_get_atomic_symbol_name(handle)) + _symbol_creator_cache[name] = handle end +end + +_get_symbol_creator(name :: Symbol) = _symbol_creator_cache[name] - if gen_docs - return docs +macro _import_atomic_symbol_creators() + h_creators = _get_atomic_symbol_creators() + + exprs = Expr[] + for creator_hdr in h_creators + expr = _define_atomic_symbol_creator(creator_hdr) + push!(exprs, expr) end + + esc(quote + $(exprs...) 
+ end) end +@_import_atomic_symbol_creators() + ################################################################################ # Utility macros to chain up symbols ################################################################################ From 1ad9a1a7a38e676e7e01df040c904e708c918daa Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Jul 2016 03:54:36 +0900 Subject: [PATCH 345/630] transition context to see how it turns out --- docs/src/api/context.md | 7 +++++++ src/context.jl | 36 +++++++++++++++++------------------- 2 files changed, 24 insertions(+), 19 deletions(-) create mode 100644 docs/src/api/context.md diff --git a/docs/src/api/context.md b/docs/src/api/context.md new file mode 100644 index 000000000000..2c2ac8f7d7ac --- /dev/null +++ b/docs/src/api/context.md @@ -0,0 +1,7 @@ +# Context + +```@docs +mx.Context +mx.cpu +mx.gpu +``` diff --git a/src/context.jl b/src/context.jl index 1e96c305fb04..908d542f5ba3 100644 --- a/src/context.jl +++ b/src/context.jl @@ -1,14 +1,10 @@ -#=doc -Context -======= -=# @enum CONTEXT_TYPE CPU=1 GPU=2 CPU_PINNED=3 -#=doc -.. class:: Context +""" + Context(dev_type, dev_id) - A context describes the device type and id on which computation should be carried on. -=# +A context describes the device type and id on which computation should be carried on. +""" immutable Context device_type :: CONTEXT_TYPE device_id :: Int @@ -20,25 +16,27 @@ function Base.show(io :: IO, ctx :: Context) print(io, "$(ctx.device_type)$(ctx.device_id)") end -#=doc -.. function:: cpu(dev_id=0) +""" + cpu(dev_id) - :param Int dev_id: the CPU id. +Get a CPU context with a specific id. ``cpu()`` is usually the default context for many +operations when no context is specified. - Get a CPU context with a specific id. ``cpu()`` is usually the default context for many - operations when no context is specified. -=# +# Arguments +* `dev_id::Int = 0`: the CPU id. +""" function cpu(dev_id::Int=0) return Context(CPU, dev_id) end -#=doc -.. 
function:: gpu(dev_id=0) +""" + gpu(dev_id) - :param Int dev_id: the GPU device id. +Get a GPU context with a specific id. The K GPUs on a node is typically numbered as 0,...,K-1. - Get a GPU context with a specific id. The K GPUs on a node is typically numbered as 0,...,K-1. -=# +# Arguments +* `dev_id :: Int = 0` the GPU device id. +""" function gpu(dev_id::Int=0) return Context(GPU, dev_id) end From ca949d73b5b90c81eda2e021dfaa20a973e271a4 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Jul 2016 03:57:42 +0900 Subject: [PATCH 346/630] get rid of the most of the old docs --- docs/Makefile | 180 -- docs/api/callback.rst | 92 - docs/api/context.rst | 32 - docs/api/executor.rst | 32 - docs/api/initializer.rst | 81 - docs/api/io.rst | 525 ------ docs/api/metric.rst | 77 - docs/api/model.rst | 133 -- docs/api/ndarray.rst | 1027 ----------- docs/api/nn-factory.rst | 33 - docs/api/optimizer.rst | 194 -- docs/api/symbolic-node.rst | 1591 ----------------- docs/api/visualize.rst | 19 - docs/build-api.jl | 98 - docs/conf.py | 277 --- docs/index.rst | 55 - docs/sphinx/julia.py | 23 - docs/src/index.md | 55 + docs/{ => src}/tutorial/char-lstm.rst | 0 .../{ => src}/tutorial/images/LSTM3-chain.png | Bin .../tutorial/images/char-lstm-vis.svg | 0 docs/{ => src}/tutorial/mnist.rst | 0 docs/{ => src}/user-guide/faq.rst | 0 docs/{ => src}/user-guide/install.rst | 0 docs/{ => src}/user-guide/overview.rst | 0 25 files changed, 55 insertions(+), 4469 deletions(-) delete mode 100644 docs/Makefile delete mode 100644 docs/api/callback.rst delete mode 100644 docs/api/context.rst delete mode 100644 docs/api/executor.rst delete mode 100644 docs/api/initializer.rst delete mode 100644 docs/api/io.rst delete mode 100644 docs/api/metric.rst delete mode 100644 docs/api/model.rst delete mode 100644 docs/api/ndarray.rst delete mode 100644 docs/api/nn-factory.rst delete mode 100644 docs/api/optimizer.rst delete mode 100644 docs/api/symbolic-node.rst delete mode 100644 
docs/api/visualize.rst delete mode 100644 docs/build-api.jl delete mode 100644 docs/conf.py delete mode 100644 docs/index.rst delete mode 100644 docs/sphinx/julia.py rename docs/{ => src}/tutorial/char-lstm.rst (100%) rename docs/{ => src}/tutorial/images/LSTM3-chain.png (100%) rename docs/{ => src}/tutorial/images/char-lstm-vis.svg (100%) rename docs/{ => src}/tutorial/mnist.rst (100%) rename docs/{ => src}/user-guide/faq.rst (100%) rename docs/{ => src}/user-guide/install.rst (100%) rename docs/{ => src}/user-guide/overview.rst (100%) diff --git a/docs/Makefile b/docs/Makefile deleted file mode 100644 index e1763e330fc7..000000000000 --- a/docs/Makefile +++ /dev/null @@ -1,180 +0,0 @@ -# Makefile for Sphinx documentation -# - -# You can set these variables from the command line. -SPHINXOPTS = -SPHINXBUILD = sphinx-build -PAPER = -BUILDDIR = _build - -# User-friendly check for sphinx-build -ifeq ($(shell which $(SPHINXBUILD) >/dev/null 2>&1; echo $$?), 1) -$(error The '$(SPHINXBUILD)' command was not found. Make sure you have Sphinx installed, then set the SPHINXBUILD environment variable to point to the full path of the '$(SPHINXBUILD)' executable. Alternatively you can add the directory with the executable to your PATH. If you don't have Sphinx installed, grab it from http://sphinx-doc.org/) -endif - -# Internal variables. -PAPEROPT_a4 = -D latex_paper_size=a4 -PAPEROPT_letter = -D latex_paper_size=letter -ALLSPHINXOPTS = -d $(BUILDDIR)/doctrees $(PAPEROPT_$(PAPER)) $(SPHINXOPTS) . -# the i18n builder cannot share the environment and doctrees with the others -I18NSPHINXOPTS = $(PAPEROPT_$(PAPER)) $(SPHINXOPTS) . 
- -.PHONY: help clean html dirhtml singlehtml pickle json htmlhelp qthelp devhelp epub latex latexpdf text man changes linkcheck doctest gettext - -help: - @echo "Please use \`make ' where is one of" - @echo " html to make standalone HTML files" - @echo " dirhtml to make HTML files named index.html in directories" - @echo " singlehtml to make a single large HTML file" - @echo " pickle to make pickle files" - @echo " json to make JSON files" - @echo " htmlhelp to make HTML files and a HTML help project" - @echo " qthelp to make HTML files and a qthelp project" - @echo " devhelp to make HTML files and a Devhelp project" - @echo " epub to make an epub" - @echo " latex to make LaTeX files, you can set PAPER=a4 or PAPER=letter" - @echo " latexpdf to make LaTeX files and run them through pdflatex" - @echo " latexpdfja to make LaTeX files and run them through platex/dvipdfmx" - @echo " text to make text files" - @echo " man to make manual pages" - @echo " texinfo to make Texinfo files" - @echo " info to make Texinfo files and run them through makeinfo" - @echo " gettext to make PO message catalogs" - @echo " changes to make an overview of all changed/added/deprecated items" - @echo " xml to make Docutils-native XML files" - @echo " pseudoxml to make pseudoxml-XML files for display purposes" - @echo " linkcheck to check all external links for integrity" - @echo " doctest to run all doctests embedded in the documentation (if enabled)" - -clean: - rm -rf $(BUILDDIR)/* - -livehtml: - sphinx-autobuild -b html $(ALLSPHINXOPTS) $(BUILDDIR)/html - -html: - $(SPHINXBUILD) -b html $(ALLSPHINXOPTS) $(BUILDDIR)/html - @echo - @echo "Build finished. The HTML pages are in $(BUILDDIR)/html." - -dirhtml: - $(SPHINXBUILD) -b dirhtml $(ALLSPHINXOPTS) $(BUILDDIR)/dirhtml - @echo - @echo "Build finished. The HTML pages are in $(BUILDDIR)/dirhtml." - -singlehtml: - $(SPHINXBUILD) -b singlehtml $(ALLSPHINXOPTS) $(BUILDDIR)/singlehtml - @echo - @echo "Build finished. 
The HTML page is in $(BUILDDIR)/singlehtml." - -pickle: - $(SPHINXBUILD) -b pickle $(ALLSPHINXOPTS) $(BUILDDIR)/pickle - @echo - @echo "Build finished; now you can process the pickle files." - -json: - $(SPHINXBUILD) -b json $(ALLSPHINXOPTS) $(BUILDDIR)/json - @echo - @echo "Build finished; now you can process the JSON files." - -htmlhelp: - $(SPHINXBUILD) -b htmlhelp $(ALLSPHINXOPTS) $(BUILDDIR)/htmlhelp - @echo - @echo "Build finished; now you can run HTML Help Workshop with the" \ - ".hhp project file in $(BUILDDIR)/htmlhelp." - -qthelp: - $(SPHINXBUILD) -b qthelp $(ALLSPHINXOPTS) $(BUILDDIR)/qthelp - @echo - @echo "Build finished; now you can run "qcollectiongenerator" with the" \ - ".qhcp project file in $(BUILDDIR)/qthelp, like this:" - @echo "# qcollectiongenerator $(BUILDDIR)/qthelp/Mocha.qhcp" - @echo "To view the help file:" - @echo "# assistant -collectionFile $(BUILDDIR)/qthelp/Mocha.qhc" - -devhelp: - $(SPHINXBUILD) -b devhelp $(ALLSPHINXOPTS) $(BUILDDIR)/devhelp - @echo - @echo "Build finished." - @echo "To view the help file:" - @echo "# mkdir -p $$HOME/.local/share/devhelp/Mocha" - @echo "# ln -s $(BUILDDIR)/devhelp $$HOME/.local/share/devhelp/Mocha" - @echo "# devhelp" - -epub: - $(SPHINXBUILD) -b epub $(ALLSPHINXOPTS) $(BUILDDIR)/epub - @echo - @echo "Build finished. The epub file is in $(BUILDDIR)/epub." - -latex: - $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex - @echo - @echo "Build finished; the LaTeX files are in $(BUILDDIR)/latex." - @echo "Run \`make' in that directory to run these through (pdf)latex" \ - "(use \`make latexpdf' here to do that automatically)." - -latexpdf: - $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex - @echo "Running LaTeX files through pdflatex..." - $(MAKE) -C $(BUILDDIR)/latex all-pdf - @echo "pdflatex finished; the PDF files are in $(BUILDDIR)/latex." - -latexpdfja: - $(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(BUILDDIR)/latex - @echo "Running LaTeX files through platex and dvipdfmx..." 
- $(MAKE) -C $(BUILDDIR)/latex all-pdf-ja - @echo "pdflatex finished; the PDF files are in $(BUILDDIR)/latex." - -text: - $(SPHINXBUILD) -b text $(ALLSPHINXOPTS) $(BUILDDIR)/text - @echo - @echo "Build finished. The text files are in $(BUILDDIR)/text." - -man: - $(SPHINXBUILD) -b man $(ALLSPHINXOPTS) $(BUILDDIR)/man - @echo - @echo "Build finished. The manual pages are in $(BUILDDIR)/man." - -texinfo: - $(SPHINXBUILD) -b texinfo $(ALLSPHINXOPTS) $(BUILDDIR)/texinfo - @echo - @echo "Build finished. The Texinfo files are in $(BUILDDIR)/texinfo." - @echo "Run \`make' in that directory to run these through makeinfo" \ - "(use \`make info' here to do that automatically)." - -info: - $(SPHINXBUILD) -b texinfo $(ALLSPHINXOPTS) $(BUILDDIR)/texinfo - @echo "Running Texinfo files through makeinfo..." - make -C $(BUILDDIR)/texinfo info - @echo "makeinfo finished; the Info files are in $(BUILDDIR)/texinfo." - -gettext: - $(SPHINXBUILD) -b gettext $(I18NSPHINXOPTS) $(BUILDDIR)/locale - @echo - @echo "Build finished. The message catalogs are in $(BUILDDIR)/locale." - -changes: - $(SPHINXBUILD) -b changes $(ALLSPHINXOPTS) $(BUILDDIR)/changes - @echo - @echo "The overview file is in $(BUILDDIR)/changes." - -linkcheck: - $(SPHINXBUILD) -b linkcheck $(ALLSPHINXOPTS) $(BUILDDIR)/linkcheck - @echo - @echo "Link check complete; look for any errors in the above output " \ - "or in $(BUILDDIR)/linkcheck/output.txt." - -doctest: - $(SPHINXBUILD) -b doctest $(ALLSPHINXOPTS) $(BUILDDIR)/doctest - @echo "Testing of doctests in the sources finished, look at the " \ - "results in $(BUILDDIR)/doctest/output.txt." - -xml: - $(SPHINXBUILD) -b xml $(ALLSPHINXOPTS) $(BUILDDIR)/xml - @echo - @echo "Build finished. The XML files are in $(BUILDDIR)/xml." - -pseudoxml: - $(SPHINXBUILD) -b pseudoxml $(ALLSPHINXOPTS) $(BUILDDIR)/pseudoxml - @echo - @echo "Build finished. The pseudo-XML files are in $(BUILDDIR)/pseudoxml." 
diff --git a/docs/api/callback.rst b/docs/api/callback.rst deleted file mode 100644 index 2bda7477094f..000000000000 --- a/docs/api/callback.rst +++ /dev/null @@ -1,92 +0,0 @@ - -Callbacks in training -===================== - - - - -.. class:: AbstractCallback - - Abstract type of callback functions used in training. - - - - -.. class:: AbstractBatchCallback - - Abstract type of callbacks to be called every mini-batch. - - - - -.. class:: AbstractEpochCallback - - Abstract type of callbacks to be called every epoch. - - - - -.. function:: every_n_batch(callback :: Function, n :: Int; call_on_0 = false) - - A convenient function to construct a callback that runs every ``n`` mini-batches. - - :param Int call_on_0: keyword argument, default false. Unless set, the callback - will **not** be run on batch 0. - - For example, the :func:`speedometer` callback is defined as - - .. code-block:: julia - - every_n_iter(frequency, call_on_0=true) do state :: OptimizationState - if state.curr_batch == 0 - # reset timer - else - # compute and print speed - end - end - - :seealso: :func:`every_n_epoch`, :func:`speedometer`. - - - - -.. function:: speedometer(; frequency=50) - - Create an :class:`AbstractBatchCallback` that measure the training speed - (number of samples processed per second) every k mini-batches. - - :param Int frequency: keyword argument, default 50. The frequency (number of - min-batches) to measure and report the speed. - - - - -.. function:: every_n_epoch(callback :: Function, n :: Int; call_on_0 = false) - - A convenient function to construct a callback that runs every ``n`` full data-passes. - - :param Int call_on_0: keyword argument, default false. Unless set, the callback - will **not** be run on epoch 0. Epoch 0 means no training has been performed - yet. This is useful if you want to inspect the randomly initialized model - that has not seen any data yet. - - :seealso: :func:`every_n_iter`. - - - - -.. 
function:: do_checkpoint(prefix; frequency=1, save_epoch_0=false) - - Create an :class:`AbstractEpochCallback` that save checkpoints of the model to disk. - The checkpoints can be loaded back later on. - - :param AbstractString prefix: the prefix of the filenames to save the model. The model - architecture will be saved to prefix-symbol.json, while the weights will be saved - to prefix-0012.params, for example, for the 12-th epoch. - :param Int frequency: keyword argument, default 1. The frequency (measured in epochs) to - save checkpoints. - :param Bool save_epoch_0: keyword argument, default false. Whether we should save a - checkpoint for epoch 0 (model initialized but not seen any data yet). - - - diff --git a/docs/api/context.rst b/docs/api/context.rst deleted file mode 100644 index 5230b892c8e5..000000000000 --- a/docs/api/context.rst +++ /dev/null @@ -1,32 +0,0 @@ - -Context -======= - - - - -.. class:: Context - - A context describes the device type and id on which computation should be carried on. - - - - -.. function:: cpu(dev_id=0) - - :param Int dev_id: the CPU id. - - Get a CPU context with a specific id. ``cpu()`` is usually the default context for many - operations when no context is specified. - - - - -.. function:: gpu(dev_id=0) - - :param Int dev_id: the GPU device id. - - Get a GPU context with a specific id. The K GPUs on a node is typically numbered as 0,...,K-1. - - - diff --git a/docs/api/executor.rst b/docs/api/executor.rst deleted file mode 100644 index 69c78137cd0e..000000000000 --- a/docs/api/executor.rst +++ /dev/null @@ -1,32 +0,0 @@ - -Executor -======== - - - - -.. class:: Executor - - An executor is a realization of a symbolic architecture defined by a :class:`SymbolicNode`. - The actual forward and backward computation specified by the network architecture can - be carried out with an executor. - - - - -.. 
function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) - - Create an :class:`Executor` by binding a :class:`SymbolicNode` to concrete :class:`NDArray`. - - :param SymbolicNode sym: the network architecture describing the computation graph. - :param Context ctx: the context on which the computation should run. - :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete - arrays for all the inputs in the network architecture. The inputs typically include - network parameters (weights, bias, filters, etc.), data and labels. See :func:`list_arguments` - and :func:`infer_shape`. - :param args_grad: TODO - :param aux_states: - :param grad_req: - - - diff --git a/docs/api/initializer.rst b/docs/api/initializer.rst deleted file mode 100644 index 6dbb81a001b3..000000000000 --- a/docs/api/initializer.rst +++ /dev/null @@ -1,81 +0,0 @@ - -Initializers -============ -Interface ---------- - - - - -.. class:: AbstractInitializer - - The abstract base class for all initializers. - -To define a new initializer, it is -enough to derive a new type, and implement one or more of the following methods: - -.. function:: _init_weight(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. function:: _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. function:: _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. function:: _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - -Or, if full behavior customization is needed, override the following function - -.. function:: init(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - - - - -Built-in initializers ---------------------- - - - - -.. class:: UniformInitializer - - Initialize weights according to a uniform distribution within the provided scale. - - - - -.. 
function UniformInitializer(scale=0.07) - - Construct a :class:`UniformInitializer` with the specified scale. - - - - -.. class:: NormalInitializer - - Initialize weights according to a univariate Gaussian distribution. - - - - -.. function:: NormalIninitializer(; mu=0, sigma=0.01) - - Construct a :class:`NormalInitializer` with mean ``mu`` and variance ``sigma``. - - - - -.. class:: XavierInitializer - - The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding - the difficulty of training deep feedforward neuralnetworks*. - - There are several different version of the XavierInitializer used in the wild. - The general idea is that the variance of the initialization distribution is controlled - by the dimensionality of the input and output. As a distribution one can either choose - a normal distribution with μ = 0 and σ² or a uniform distribution from -σ to σ. - - Several different ways of calculating the variance are given in the literature or are - used by various libraries. - - - [Bengio and Glorot 2010]: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1)`` - - [K. He, X. Zhang, S. Ren, and J. Sun 2015]: ``mx.XavierInitializer(distribution = mx.xv_gaussian, regularization = mx.xv_in, magnitude = 2)`` - - caffe_avg: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 3)`` - - - diff --git a/docs/api/io.rst b/docs/api/io.rst deleted file mode 100644 index e5cb3ffb32e5..000000000000 --- a/docs/api/io.rst +++ /dev/null @@ -1,525 +0,0 @@ - -Data Providers -============== -Interface ---------- - -Data providers are wrappers that load external data, be it images, text, or general tensors, -and split it into mini-batches so that the model can consume the data in a uniformed way. - - - - -.. class:: AbstractDataProvider - - The root type for all data provider. A data provider should implement the following interfaces: - - .. 
function:: get_batch_size(provider) -> Int - - :param AbstractDataProvider provider: the data provider. - :return: the mini-batch size of the provided data. All the provided data should have the - same mini-batch size (i.e. the last dimension). - - .. function:: provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} - - :param AbstractDataProvider provider: the data provider. - :return: a vector of (name, shape) pairs describing the names of the data it provides, and - the corresponding shapes. - - .. function:: provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} - - :param AbstractDataProvider provider: the data provider. - :return: a vector of (name, shape) pairs describing the names of the labels it provides, and - the corresponding shapes. - - The difference between *data* and *label* is that during - training stage, both *data* and *label* will be feeded into the model, while during - prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and - of any shapes. The provided data and label names here should match the input names in a target - :class:`SymbolicNode`. - - A data provider should also implement the Julia iteration interface, in order to allow iterating - through the data set. The provider will be called in the following way: - - .. code-block:: julia - - for batch in eachbatch(provider) - data = get_data(provider, batch) - end - - which will be translated by Julia compiler into - - .. code-block:: julia - - state = Base.start(eachbatch(provider)) - while !Base.done(provider, state) - (batch, state) = Base.next(provider, state) - data = get_data(provider, batch) - end - - By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface - is implemented on the provider type itself. But the extra layer of abstraction allows us to - implement a data provider easily via a Julia ``Task`` coroutine. 
See the - data provider defined in :doc:`the char-lstm example - ` for an example of using coroutine to define data - providers. - -The detailed interface functions for the iterator API is listed below: - -.. function:: Base.eltype(provider) -> AbstractDataBatch - - :param AbstractDataProvider provider: the data provider. - :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. - -.. function:: Base.start(provider) -> AbstractDataProviderState - - :param AbstractDataProvider provider: the data provider. - - This function is always called before iterating into the dataset. It should initialize - the iterator, reset the index, and do data shuffling if needed. - -.. function:: Base.done(provider, state) -> Bool - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataProviderState state: the state returned by :func:`Base.start` :func:`Base.next`. - :return: true if there is no more data to iterate in this dataset. - -.. function:: Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) - - :param AbstractDataProvider provider: the data provider. - :return: the current data batch, and the state for the next iteration. - -Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that -is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this -case, you can safely assume that - -* :func:`Base.start` will always be called, and called only once before the iteration starts. -* :func:`Base.done` will always be called at the beginning of every iteration and always be called once. -* If :func:`Base.done` return true, the iteration will stop, until the next round, again, starting with - a call to :func:`Base.start`. -* :func:`Base.next` will always be called only once in each iteration. 
It will always be called after - one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will - not be called. - -With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation -of the built-in :class:`MXDataProvider` for example. - -.. caution:: - - Please do not use the one data provider simultaneously in two different places, either in parallel, - or in a nested loop. For example, the behavior for the following code is undefined - - .. code-block:: julia - - for batch in data - # updating the parameters - - # now let's test the performance on the training set - for b2 in data - # ... - end - end - - - - -.. class:: AbstractDataProviderState - - Base type for data provider states. - - - - -.. class:: AbstractDataBatch - - Base type for a data mini-batch. It should implement the following interfaces: - - .. function:: count_samples(provider, batch) -> Int - - :param AbstractDataBatch batch: the data batch object. - :return: the number of samples in this batch. This number should be greater than 0, but - less than or equal to the batch size. This is used to indicate at the end of - the data set, there might not be enough samples for a whole mini-batch. - - .. function:: get_data(provider, batch) -> Vector{NDArray} - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :return: a vector of data in this batch, should be in the same order as declared in - :func:`provide_data() `. - - The last dimension of each :class:`NDArray` should always match the batch_size, even when - :func:`count_samples` returns a value less than the batch size. In this case, - the data provider is free to pad the remaining contents with any value. - - .. function:: get_label(provider, batch) -> Vector{NDArray} - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. 
- :return: a vector of labels in this batch. Similar to :func:`get_data`. - - - The following utility functions will be automatically defined. - - .. function:: get(provider, batch, name) -> NDArray - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :param Base.Symbol name: the name of the data to get, should be one of the names - provided in either :func:`provide_data() ` - or :func:`provide_label() `. - :return: the corresponding data array corresponding to that name. - - .. function:: load_data!(provider, batch, targets) - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :param targets: the targets to load data into. - :type targets: Vector{Vector{SlicedNDArray}} - - The targets is a list of the same length as number of data provided by this provider. - Each element in the list is a list of :class:`SlicedNDArray`. This list described a - spliting scheme of this data batch into different slices, each slice is specified by - a slice-ndarray pair, where *slice* specify the range of samples in the mini-batch - that should be loaded into the corresponding *ndarray*. - - This utility function is used in data parallelization, where a mini-batch is splited - and computed on several different devices. - - .. function:: load_label!(provider, batch, targets) - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :param targets: the targets to load label into. - :type targets: Vector{Vector{SlicedNDArray}} - - The same as :func:`load_data!`, except that this is for loading labels. - - - - -.. class:: DataBatch - - A basic subclass of :class:`AbstractDataBatch`, that implement the interface by - accessing member fields. - - - - -.. class:: SlicedNDArray - - A alias type of ``Tuple{UnitRange{Int},NDArray}``. - - - - -Built-in data providers ------------------------ - - - - -.. 
class:: ArrayDataProvider - - A convenient tool to iterate :class:`NDArray` or Julia ``Array``. - - - - -.. function:: ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) - - Construct a data provider from :class:`NDArray` or Julia Arrays. - - :param data: the data, could be - - - a :class:`NDArray`, or a Julia Array. This is equivalent to ``:data => data``. - - a name-data pair, like ``:mydata => array``, where ``:mydata`` is the name of the data - and ``array`` is an :class:`NDArray` or a Julia Array. - - a list of name-data pairs. - - :param label: the same as the ``data`` parameter. When this argument is omitted, the constructed - provider will provide no labels. - :param Int batch_size: the batch size, default is 0, which means treating the whole array as a - single mini-batch. - :param Bool shuffle: turn on if the data should be shuffled at every epoch. - :param Real data_padding: when the mini-batch goes beyond the dataset boundary, there might - be less samples to include than a mini-batch. This value specify a scalar to pad the - contents of all the missing data points. - :param Real label_padding: the same as ``data_padding``, except for the labels. - - TODO: remove ``data_padding`` and ``label_padding``, and implement rollover that copies - the last or first several training samples to feed the padding. - - - - -libmxnet data providers ------------------------ - - - - -.. class:: MXDataProvider - - A data provider that wrap built-in data iterators from libmxnet. See below for - a list of built-in data iterators. - - - - -.. function:: CSVIter(...) - - Can also be called with the alias ``CSVProvider``. - Create iterator for dataset in csv. - - :param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data. - :param Base.Symbol label_name: keyword argument, default ``:softmax_label``. The name of the label. Could be ``nothing`` if no label is presented in this dataset. 
- - :param data_csv: Dataset Param: Data csv path. - :type data_csv: string, required - - - :param data_shape: Dataset Param: Shape of the data. - :type data_shape: Shape(tuple), required - - - :param label_csv: Dataset Param: Label csv path. If is NULL, all labels will be returned as 0 - :type label_csv: string, optional, default='NULL' - - - :param label_shape: Dataset Param: Shape of the label. - :type label_shape: Shape(tuple), optional, default=(1,) - - :return: the constructed :class:`MXDataProvider`. - - - -.. function:: ImageRecordIter(...) - - Can also be called with the alias ``ImageRecordProvider``. - Create iterator for dataset packed in recordio. - - :param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data. - :param Base.Symbol label_name: keyword argument, default ``:softmax_label``. The name of the label. Could be ``nothing`` if no label is presented in this dataset. - - :param path_imglist: Dataset Param: Path to image list. - :type path_imglist: string, optional, default='' - - - :param path_imgrec: Dataset Param: Path to image record file. - :type path_imgrec: string, optional, default='./data/imgrec.rec' - - - :param label_width: Dataset Param: How many labels for an image. - :type label_width: int, optional, default='1' - - - :param data_shape: Dataset Param: Shape of each instance generated by the DataIter. - :type data_shape: Shape(tuple), required - - - :param preprocess_threads: Backend Param: Number of thread to do preprocessing. - :type preprocess_threads: int, optional, default='4' - - - :param verbose: Auxiliary Param: Whether to output parser information. - :type verbose: boolean, optional, default=True - - - :param num_parts: partition the data into multiple parts - :type num_parts: int, optional, default='1' - - - :param part_index: the index of the part will read - :type part_index: int, optional, default='0' - - - :param shuffle: Augmentation Param: Whether to shuffle data. 
- :type shuffle: boolean, optional, default=False - - - :param seed: Augmentation Param: Random Seed. - :type seed: int, optional, default='0' - - - :param batch_size: Batch Param: Batch size. - :type batch_size: int (non-negative), required - - - :param round_batch: Batch Param: Use round robin to handle overflow batch. - :type round_batch: boolean, optional, default=True - - - :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 - - - :param rand_crop: Augmentation Param: Whether to random crop on the image - :type rand_crop: boolean, optional, default=False - - - :param crop_y_start: Augmentation Param: Where to nonrandom crop on y. - :type crop_y_start: int, optional, default='-1' - - - :param crop_x_start: Augmentation Param: Where to nonrandom crop on x. - :type crop_x_start: int, optional, default='-1' - - - :param max_rotate_angle: Augmentation Param: rotated randomly in [-max_rotate_angle, max_rotate_angle]. - :type max_rotate_angle: int, optional, default='0' - - - :param max_aspect_ratio: Augmentation Param: denotes the max ratio of random aspect ratio augmentation. - :type max_aspect_ratio: float, optional, default=0 - - - :param max_shear_ratio: Augmentation Param: denotes the max random shearing ratio. - :type max_shear_ratio: float, optional, default=0 - - - :param max_crop_size: Augmentation Param: Maximum crop size. - :type max_crop_size: int, optional, default='-1' - - - :param min_crop_size: Augmentation Param: Minimum crop size. - :type min_crop_size: int, optional, default='-1' - - - :param max_random_scale: Augmentation Param: Maxmum scale ratio. - :type max_random_scale: float, optional, default=1 - - - :param min_random_scale: Augmentation Param: Minimum scale ratio. - :type min_random_scale: float, optional, default=1 - - - :param max_img_size: Augmentation Param: Maxmum image size after resizing. 
- :type max_img_size: float, optional, default=1e+10 - - - :param min_img_size: Augmentation Param: Minimum image size after resizing. - :type min_img_size: float, optional, default=0 - - - :param random_h: Augmentation Param: Maximum value of H channel in HSL color space. - :type random_h: int, optional, default='0' - - - :param random_s: Augmentation Param: Maximum value of S channel in HSL color space. - :type random_s: int, optional, default='0' - - - :param random_l: Augmentation Param: Maximum value of L channel in HSL color space. - :type random_l: int, optional, default='0' - - - :param rotate: Augmentation Param: Rotate angle. - :type rotate: int, optional, default='-1' - - - :param fill_value: Augmentation Param: Maximum value of illumination variation. - :type fill_value: int, optional, default='255' - - - :param inter_method: Augmentation Param: 0-NN 1-bilinear 2-cubic 3-area 4-lanczos4 9-auto 10-rand. - :type inter_method: int, optional, default='1' - - - :param mirror: Augmentation Param: Whether to mirror the image. - :type mirror: boolean, optional, default=False - - - :param rand_mirror: Augmentation Param: Whether to mirror the image randomly. - :type rand_mirror: boolean, optional, default=False - - - :param mean_img: Augmentation Param: Mean Image to be subtracted. - :type mean_img: string, optional, default='' - - - :param mean_r: Augmentation Param: Mean value on R channel. - :type mean_r: float, optional, default=0 - - - :param mean_g: Augmentation Param: Mean value on G channel. - :type mean_g: float, optional, default=0 - - - :param mean_b: Augmentation Param: Mean value on B channel. - :type mean_b: float, optional, default=0 - - - :param mean_a: Augmentation Param: Mean value on Alpha channel. - :type mean_a: float, optional, default=0 - - - :param scale: Augmentation Param: Scale in color space. - :type scale: float, optional, default=1 - - - :param max_random_contrast: Augmentation Param: Maximum ratio of contrast variation. 
- :type max_random_contrast: float, optional, default=0 - - - :param max_random_illumination: Augmentation Param: Maximum value of illumination variation. - :type max_random_illumination: float, optional, default=0 - - :return: the constructed :class:`MXDataProvider`. - - - -.. function:: MNISTIter(...) - - Can also be called with the alias ``MNISTProvider``. - Create iterator for MNIST hand-written digit number recognition dataset. - - :param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data. - :param Base.Symbol label_name: keyword argument, default ``:softmax_label``. The name of the label. Could be ``nothing`` if no label is presented in this dataset. - - :param image: Dataset Param: Mnist image path. - :type image: string, optional, default='./train-images-idx3-ubyte' - - - :param label: Dataset Param: Mnist label path. - :type label: string, optional, default='./train-labels-idx1-ubyte' - - - :param batch_size: Batch Param: Batch Size. - :type batch_size: int, optional, default='128' - - - :param shuffle: Augmentation Param: Whether to shuffle data. - :type shuffle: boolean, optional, default=True - - - :param flat: Augmentation Param: Whether to flat the data into 1D. - :type flat: boolean, optional, default=False - - - :param seed: Augmentation Param: Random Seed. - :type seed: int, optional, default='0' - - - :param silent: Auxiliary Param: Whether to print out data info. - :type silent: boolean, optional, default=False - - - :param num_parts: partition the data into multiple parts - :type num_parts: int, optional, default='1' - - - :param part_index: the index of the part will read - :type part_index: int, optional, default='0' - - - :param prefetch_buffer: Backend Param: Number of prefetched parameters - :type prefetch_buffer: , optional, default=4 - - :return: the constructed :class:`MXDataProvider`. 
- - - - - - diff --git a/docs/api/metric.rst b/docs/api/metric.rst deleted file mode 100644 index 0f3cc2d81358..000000000000 --- a/docs/api/metric.rst +++ /dev/null @@ -1,77 +0,0 @@ - -Evaluation Metrics -================== - -Evaluation metrics provide a way to evaluate the performance of a learned model. -This is typically used during training to monitor performance on the validation -set. - - - - -.. class:: AbstractEvalMetric - - The base class for all evaluation metrics. The sub-types should implement the following - interfaces. - - .. function:: update!(metric, labels, preds) - - Update and accumulate metrics. - - :param AbstractEvalMetric metric: the metric object. - :param labels: the labels from the data provider. - :type labels: Vector{NDArray} - :param preds: the outputs (predictions) of the network. - :type preds: Vector{NDArray} - - .. function:: reset!(metric) - - Reset the accumulation counter. - - .. function:: get(metric) - - Get the accumulated metrics. - - :return: ``Vector{Tuple{Base.Symbol, Real}}``, a list of name-value pairs. For - example, ``[(:accuracy, 0.9)]``. - - - - -.. class:: Accuracy - - Multiclass classification accuracy. - - Calculates the mean accuracy per sample for softmax in one dimension. - For a multi-dimensional softmax the mean accuracy over all dimensions is calculated. - - - - -.. class:: MSE - - Mean Squared Error. TODO: add support for multi-dimensional outputs. - - Calculates the mean squared error regression loss in one dimension. - - - - -.. class:: ACE - - Averaged cross-entropy for classification. This is also known as logloss. - - Calculates the averaged cross entropy for multi-dimensional output. - - - - -.. class:: MultiACE - - Averaged cross-entropy for classification. This is also known as logloss. - This variant keeps track of the different losses per class. - - Calculates the averaged cross entropy for multi-dimensional output.
- - - diff --git a/docs/api/model.rst b/docs/api/model.rst deleted file mode 100644 index 764d3e9329a8..000000000000 --- a/docs/api/model.rst +++ /dev/null @@ -1,133 +0,0 @@ - -Models -====== - -The model API provides convenient high-level interface to do training and predicting on -a network described using the symbolic API. - - - - -.. class:: AbstractModel - - The abstract super type of all models in MXNet.jl. - - - - -.. class:: FeedForward - - The feedforward model provides convenient interface to train and predict on - feedforward architectures like multi-layer MLP, ConvNets, etc. There is no - explicitly handling of *time index*, but it is relatively easy to implement - unrolled RNN / LSTM under this framework (**TODO**: add example). For models - that handles sequential data explicitly, please use **TODO**... - - - - -.. function:: FeedForward(arch :: SymbolicNode, ctx) - - :param arch: the architecture of the network constructed using the symbolic API. - :param ctx: the devices on which this model should do computation. It could be a single :class:`Context` - or a list of :class:`Context` objects. In the latter case, data parallelization will be used - for training. If no context is provided, the default context ``cpu()`` will be used. - - - - -.. function:: init_model(self, initializer; overwrite=false, input_shapes...) - - Initialize the weights in the model. - - This method will be called automatically when training a model. So there is usually no - need to call this method unless one needs to inspect a model with only randomly initialized - weights. - - :param FeedForward self: the model to be initialized. - :param AbstractInitializer initializer: an initializer describing how the weights should be initialized. - :param Bool overwrite: keyword argument, force initialization even when weights already exists. - :param input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. 
- For example, ``data=(28,28,1,100), label=(100,)``. - - - - -.. function:: - predict(self, data; overwrite=false, callback=nothing) - - Predict using an existing model. The model should be already initialized, or trained or loaded from - a checkpoint. There is an overloaded function that allows passing the callback as the first argument, - so it is possible to do - - .. code-block:: julia - - predict(model, data) do batch_output - # consume or write batch_output to file - end - - :param FeedForward self: the model. - :param AbstractDataProvider data: the data to perform prediction on. - :param Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory - allocation of the :class:`Executor` depends on the mini-batch size of the test - data provider. If you call predict twice with data provider of the same batch-size, - then the executor can potentially be re-used. So, if ``overwrite`` is false, - we will try to re-use, and raise an error if batch-size changed. If ``overwrite`` - is true (the default), a new :class:`Executor` will be created to replace the old one. - - .. note:: - - Prediction is computationally much less costly than training, so the bottleneck sometimes becomes the IO - for copying mini-batches of data. Since there is no concern about convergence in prediction, it is better - to set the mini-batch size as large as possible (limited by your device memory) if prediction speed is a - concern. - - For the same reason, currently prediction will only use the first device even if multiple devices are - provided to construct the model. - - .. note:: - - If you perform further training after prediction, the weights are not automatically synchronized if ``overwrite`` - is set to false and the old predictor is re-used. In this case - setting ``overwrite`` to true (the default) will re-initialize the predictor the next time you call - predict and synchronize the weights again.
- - :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` - - - - -.. function:: train(model :: FeedForward, ...) - - Alias to :func:`fit`. - - - - -.. function:: fit(model :: FeedForward, optimizer, data; kwargs...) - - Train the ``model`` on ``data`` with the ``optimizer``. - - :param FeedForward model: the model to be trained. - :param AbstractOptimizer optimizer: the optimization algorithm to use. - :param AbstractDataProvider data: the training data provider. - :param Int n_epoch: default 10, the number of full data-passes to run. - :param AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for - the validation set. - :param AbstractEvalMetric eval_metric: keyword argument, default ``Accuracy()``. The metric used - to evaluate the training performance. If ``eval_data`` is provided, the same metric is also - calculated on the validation set. - :param kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients - and parameters when multiple devices are used for training. - :type kvstore: :class:`KVStore` or ``Base.Symbol`` - :param AbstractInitializer initializer: keyword argument, default ``UniformInitializer(0.01)``. - :param Bool force_init: keyword argument, default false. By default, the random initialization using the - provided ``initializer`` will be skipped if the model weights already exists, maybe from a previous - call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When - this option is set, it will always do random initialization at the begining of training. - :param callbacks: keyword argument, default ``[]``. Callbacks to be invoked at each epoch or mini-batch, - see :class:`AbstractCallback`. 
- :type callbacks: ``Vector{AbstractCallback}`` - - - diff --git a/docs/api/ndarray.rst b/docs/api/ndarray.rst deleted file mode 100644 index b94232b25e50..000000000000 --- a/docs/api/ndarray.rst +++ /dev/null @@ -1,1027 +0,0 @@ - -NDArray API -=========== - - - - -.. class:: NDArray - - Wrapper of the ``NDArray`` type in ``libmxnet``. This is the basic building block - of tensor-based computation. - - .. _ndarray-shape-note: - - .. note:: - - C/C++ use row-major ordering for arrays while Julia follows a - column-major ordering. To keep things consistent, we keep the underlying data - in their original layout, but use *language-native* convention when we talk - about shapes. For example, a mini-batch of 100 MNIST images is a tensor of - C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory - has shape (28,28,1,100). - - - - -.. function:: context(arr :: NDArray) - - Get the context that this :class:`NDArray` lives on. - - - - -.. function:: - empty(shape :: Tuple, ctx :: Context) - empty(shape :: Tuple) - empty(dim1, dim2, ...) - - Allocate memory for an uninitialized :class:`NDArray` with specific shape. - - - - -Interface functions similar to Julia Arrays -------------------------------------------- - - - - -.. function:: - zeros(shape :: Tuple, ctx :: Context) - zeros(shape :: Tuple) - zeros(dim1, dim2, ...) - - Create a zeroed :class:`NDArray` with specific shape. - - - - -.. function:: - ones(shape :: Tuple, ctx :: Context) - ones(shape :: Tuple) - ones(dim1, dim2, ...) - - Create an :class:`NDArray` with specific shape and initialize with 1. - - - - -.. function:: - size(arr :: NDArray) - size(arr :: NDArray, dim :: Int) - - Get the shape of an :class:`NDArray`. The shape is in Julia's column-major convention. See - also the :ref:`notes on NDArray shapes <ndarray-shape-note>`. - - - - -.. function:: length(arr :: NDArray) - - Get the number of elements in an :class:`NDArray`. - - - - -..
function:: ndims(arr :: NDArray) - - Get the number of dimensions of an :class:`NDArray`. Is equivalent to ``length(size(arr))``. - - - - -.. function:: eltype(arr :: NDArray) - - Get the element type of an :class:`NDArray`. Currently the element type is always ``mx.MX_float``. - - - - -.. function:: slice(arr :: NDArray, start:stop) - - Create a view into a sub-slice of an :class:`NDArray`. Note only slicing at the slowest - changing dimension is supported. In Julia's column-major perspective, this is the last - dimension. For example, given an :class:`NDArray` of shape (2,3,4), ``slice(array, 2:3)`` will create - a :class:`NDArray` of shape (2,3,2), sharing the data with the original array. This operation is - used in data parallelization to split mini-batch into sub-batches for different devices. - - - - -.. function:: setindex!(arr :: NDArray, val, idx) - - Assign values to an :class:`NDArray`. Elementwise assignment is not implemented, only the following - scenarios are supported - - - ``arr[:] = val``: whole array assignment, ``val`` could be a scalar or an array (Julia ``Array`` - or :class:`NDArray`) of the same shape. - - ``arr[start:stop] = val``: assignment to a *slice*, ``val`` could be a scalar or an array of - the same shape to the slice. See also :func:`slice`. - - - - -.. function:: getindex(arr :: NDArray, idx) - - Shortcut for :func:`slice`. A typical use is to write - - .. code-block:: julia - - arr[:] += 5 - - which translates into - - .. code-block:: julia - - arr[:] = arr[:] + 5 - - which furthur translates into - - .. code-block:: julia - - setindex!(getindex(arr, Colon()), 5, Colon()) - - .. note:: - - The behavior is quite different from indexing into Julia's ``Array``. For example, ``arr[2:5]`` - create a **copy** of the sub-array for Julia ``Array``, while for :class:`NDArray`, this is - a *slice* that shares the memory. - - - - -Copying functions ------------------ - - - - -.. 
function:: - copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) - - Copy contents of ``src`` into ``dst``. - - - - -.. function:: - copy(arr :: NDArray) - copy(arr :: NDArray, ctx :: Context) - copy(arr :: Array, ctx :: Context) - - Create a copy of an array. When no :class:`Context` is given, create a Julia ``Array``. - Otherwise, create an :class:`NDArray` on the specified context. - - - - -.. function:: convert(::Type{Array{T}}, arr :: NDArray) - - Convert an :class:`NDArray` into a Julia ``Array`` of specific type. Data will be copied. - - - - -Basic arithmetics ------------------ - - - - -.. function:: @inplace - - Julia does not support re-definiton of ``+=`` operator (like ``__iadd__`` in python), - When one write ``a += b``, it gets translated to ``a = a+b``. ``a+b`` will allocate new - memory for the results, and the newly allocated :class:`NDArray` object is then assigned - back to a, while the original contents in a is discarded. This is very inefficient - when we want to do inplace update. - - This macro is a simple utility to implement this behavior. Write - - .. code-block:: julia - - @mx.inplace a += b - - will translate into - - .. code-block:: julia - - mx.add_to!(a, b) - - which will do inplace adding of the contents of ``b`` into ``a``. - - - - -.. function:: add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) - - Add a bunch of arguments into ``dst``. Inplace updating. - - - - -.. function:: - +(args...) - .+(args...) - - Summation. Multiple arguments of either scalar or :class:`NDArray` could be - added together. Note at least the first or second argument needs to be an :class:`NDArray` to - avoid ambiguity of built-in summation. - - - - -.. function:: sub_from!(dst :: NDArray, args :: Union{Real, NDArray}...) - - Subtract a bunch of arguments from ``dst``. Inplace updating. - - - - -.. function:: - -(arg0, arg1) - -(arg0) - .-(arg0, arg1) - - Subtraction ``arg0 - arg1``, of scalar types or :class:`NDArray`. 
Or create - the negative of ``arg0``. - - - - -.. function:: mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) - - Elementwise multiplication into ``dst`` of either a scalar or an :class:`NDArray` of the same shape. - Inplace updating. - - - - -.. function:: - .*(arg0, arg1) - - Elementwise multiplication of ``arg0`` and ``arg1``, could be either scalar or :class:`NDArray`. - - - - -.. function:: - *(arg0, arg1) - - Currently only multiplication of a scalar with an :class:`NDArray` is implemented. Matrix multiplication - is to be added soon. - - - - -.. function:: div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) - - Elementwise divide a scalar or an :class:`NDArray` of the same shape from ``dst``. Inplace updating. - - - - -.. function:: ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) - - Elementwise dividing an :class:`NDArray` by a scalar or another :class:`NDArray` of the same shape. - - - - -.. function:: /(arg0 :: NDArray, arg :: Real) - - Divide an :class:`NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. - - - - -Manipulating as Julia Arrays ----------------------------- - -.. function:: @nd_as_jl(captures..., statement) - - A convenient macro that allows operating on :class:`NDArray` as Julia Arrays. For example, - - .. code-block:: julia - - x = mx.zeros(3,4) - y = mx.ones(3,4) - z = mx.zeros((3,4), mx.gpu()) - - @mx.nd_as_jl ro=(x,y) rw=z begin - # now x, y, z are just ordinary Julia Arrays - z[:,1] = y[:,2] - z[:,2] = 5 - end - - Under the hood, the macro converts all the declared captures from :class:`NDArray` into Julia - Arrays, by using :func:`try_get_shared`, and automatically commits the modifications back into - the :class:`NDArray` that is declared as ``rw``. This is useful for fast prototyping and when - implementing non-critical computations, such as :class:`AbstractEvalMetric`. - - .. note:: - - - Multiple ``rw`` and / or ``ro`` capture declarations could be made.
- - The macro does **not** check to make sure that ``ro`` captures are not modified. If the - original :class:`NDArray` lives in CPU memory, then it is very likely the corresponding - Julia Array shares data with the :class:`NDArray`, so modifying the Julia Array will also - modify the underlying :class:`NDArray`. - - More importantly, since the :class:`NDArray` is - asynchronized, we will wait for *writing* for ``rw`` variables but wait only for *reading* - in ``ro`` variables. If we write into those ``ro`` variables, **and** if the memory is - shared, racing condition might happen, and the behavior is undefined. - - When an :class:`NDArray` is declared to be captured as ``rw``, its contents is always sync - back in the end. - - The execution results of the expanded macro is always ``nothing``. - - The statements are wrapped in a ``let``, thus locally introduced new variables will not be - available after the statements. So you will need to declare the variables before calling the - macro if needed. - - - - -.. function:: try_get_shared(arr) - - Try to create a Julia array by sharing the data with the underlying :class:`NDArray`. - - :param NDArray arr: the array to be shared. - - .. warning:: - - The returned array does not guarantee to share data with the underlying :class:`NDArray`. - In particular, data sharing is possible only when the :class:`NDArray` lives on CPU. - - - - -.. function:: is_shared(j_arr, arr) - - Test whether ``j_arr`` is sharing data with ``arr``. - - :param Array j_arr: the Julia Array. - :param NDArray arr: the :class:`NDArray`. - - - - -IO --- - - - - -.. function:: load(filename, ::Type{NDArray}) - - Load NDArrays from binary file. - - :param AbstractString filename: the path of the file to load. It could be S3 or HDFS address. - :return: Either ``Dict{Base.Symbol, NDArray}`` or ``Vector{NDArray}``. - - If the ``libmxnet`` is built with the corresponding component enabled. 
Examples - - * ``s3://my-bucket/path/my-s3-ndarray`` - * ``hdfs://my-bucket/path/my-hdfs-ndarray`` - * ``/path-to/my-local-ndarray`` - - - - -.. function:: save(filename :: AbstractString, data) - - Save NDArrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built - with corresponding support. - - :param AbstractString filename: path to the binary file to write to. - :param data: data to save to file. - :type data: :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. - - - - -libmxnet APIs -------------- - - - - -The libmxnet APIs are automatically imported from ``libmxnet.so``. The functions listed -here operate on :class:`NDArray` objects. The arguments to the functions are typically ordered -as - -.. code-block:: julia - - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) - -unless ``NDARRAY_ARG_BEFORE_SCALAR`` is not set. In this case, the scalars are put before the input arguments: - -.. code-block:: julia - - func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) - - -If ``ACCEPT_EMPTY_MUTATE_TARGET`` is set, an overloaded function without the output arguments will also be defined: - -.. code-block:: julia - - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) - -Upon calling, the output arguments will be automatically initialized with empty NDArrays. - -Those functions always return the output arguments. If there is only one output (the typical situation), that -object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. - -Public APIs -^^^^^^^^^^^ -.. function:: abs(...) - - Take absolute value of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: argmax_channel(...) - - Take argmax indices of each channel of the src. The result will be ndarray of shape (num_channel,) on the same device.
- - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: ceil(...) - - Take ceil value of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: choose_element_0index(...) - - Choose one element from each line(row for python, column for R/Julia) in lhs according to index indicated by rhs. This function assume rhs uses 0-based index. - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: NDArray - - - - - -.. function:: clip(...) - - Clip ndarray elements to range (a_min, a_max) - - :param src: Source input - :type src: NDArray - - - :param a_min: Minimum value - :type a_min: real_t - - - :param a_max: Maximum value - :type a_max: real_t - - - - - -.. function:: cos(...) - - Take cos of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: dot(...) - - Calculate 2D matrix multiplication - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: NDArray - - - - - -.. function:: exp(...) - - Take exp of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: fill_element_0index(...) - - Fill one element of each line(row for python, column for R/Julia) in lhs according to index indicated by rhs and values indicated by mhs. This function assume rhs uses 0-based index. - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param mhs: Middle operand to the function. - :type mhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: NDArray - - - - - -.. function:: floor(...) - - Take floor value of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: log(...) - - Take log of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: max(...) 
- - Take max of the src.The result will be ndarray of shape (1,) on the same device. - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: min(...) - - Take min of the src.The result will be ndarray of shape (1,) on the same device. - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: norm(...) - - Take L2 norm of the src.The result will be ndarray of shape (1,) on the same device. - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: round(...) - - Take round value of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: rsqrt(...) - - Take rsqrt of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: sign(...) - - Take sign value of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: sin(...) - - Take sin of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: sqrt(...) - - Take sqrt of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: square(...) - - Take square of the src - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: sum(...) - - Take sum of the src.The result will be ndarray of shape (1,) on the same device. - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: sum_mid_internal(...) - - Take sum on medium dimension of the 3D src. - - :param src: Source input to the function - :type src: NDArray - - - - - -.. function:: transpose(...) - - Transpose the input matrix and return a new one - - :param src: Source input to the function - :type src: NDArray - - - - -Internal APIs -^^^^^^^^^^^^^ - -.. note:: - - Document and signatures for internal API functions might be incomplete. - -.. function:: _broadcast(...) 
- - Broadcast array in the given axis to the given size - - :param src: source ndarray - :type src: NDArray - - - :param axis: axis to broadcast - :type axis: int - - - :param size: size of broadcast - :type size: int - - - - - -.. function:: _copyto(...) - - - - :param src: Source input to the function. - :type src: NDArray - - - - - -.. function:: _div(...) - - Divide lhs by rhs - - :param lhs: Left operand to the function - :type lhs: NDArray - - - :param rhs: Right operand to the function - :type rhs: NDArray - - - - - -.. function:: _div_scalar(...) - - - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: real_t - - - - - -.. function:: _imdecode(...) - - Decode an image, clip to (x0, y0, x1, y1), subtract mean, and write to buffer - - :param mean: image mean - :type mean: NDArray - - - :param index: buffer position for output - :type index: int - - - :param x0: x0 - :type x0: int - - - :param y0: y0 - :type y0: int - - - :param x1: x1 - :type x1: int - - - :param y1: y1 - :type y1: int - - - :param c: channel - :type c: int - - - :param size: length of str_img - :type size: int - - - - - -.. function:: _maximum(...) - - Elementwise max of lhs by rhs - - :param lhs: Left operand to the function - :type lhs: NDArray - - - :param rhs: Right operand to the function - :type rhs: NDArray - - - - - -.. function:: _minimum(...) - - Elementwise min of lhs by rhs - - :param lhs: Left operand to the function - :type lhs: NDArray - - - :param rhs: Right operand to the function - :type rhs: NDArray - - - - - -.. function:: _minus(...) - - Minus lhs and rhs - - :param lhs: Left operand to the function - :type lhs: NDArray - - - :param rhs: Right operand to the function - :type rhs: NDArray - - - - - -.. function:: _minus_scalar(...) - - - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: real_t - - - - - -..
function:: _mul(...) - - Multiply lhs and rhs - - :param lhs: Left operand to the function - :type lhs: NDArray - - - :param rhs: Right operand to the function - :type rhs: NDArray - - - - - -.. function:: _mul_scalar(...) - - - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: real_t - - - - - -.. function:: _onehot_encode(...) - - - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: NDArray - - - - - -.. function:: _plus(...) - - Add lhs and rhs - - :param lhs: Left operand to the function - :type lhs: NDArray - - - :param rhs: Right operand to the function - :type rhs: NDArray - - - - - -.. function:: _plus_scalar(...) - - - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: real_t - - - - - -.. function:: _power(...) - - Elementwise power(lhs, rhs) - - :param lhs: Left operand to the function - :type lhs: NDArray - - - :param rhs: Right operand to the function - :type rhs: NDArray - - - - - -.. function:: _random_gaussian(...) - - - - - - - -.. function:: _random_uniform(...) - - - - - - - -.. function:: _rdiv_scalar(...) - - - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: real_t - - - - - -.. function:: _rminus_scalar(...) - - - - :param lhs: Left operand to the function. - :type lhs: NDArray - - - :param rhs: Right operand to the function. - :type rhs: real_t - - - - - -.. function:: _set_value(...) - - - - :param src: Source input to the function. 
- :type src: real_t - - - - - - - - diff --git a/docs/api/nn-factory.rst b/docs/api/nn-factory.rst deleted file mode 100644 index 44569c640da9..000000000000 --- a/docs/api/nn-factory.rst +++ /dev/null @@ -1,33 +0,0 @@ - -Neural Networks Factory -======================= - -Neural network factory provide convenient helper functions to define -common neural networks. - - - - -.. function:: MLP(input, spec) - - Construct a multi-layer perceptron. A MLP is a multi-layer neural network with - fully connected layers. - - :param SymbolicNode input: the input to the mlp. - :param spec: the mlp specification, a list of hidden dimensions. For example, - ``[128, (512, :sigmoid), 10]``. The number in the list indicate the - number of hidden units in each layer. A tuple could be used to specify - the activation of each layer. Otherwise, the default activation will - be used (except for the last layer). - :param Base.Symbol hidden_activation: keyword argument, default ``:relu``, indicating - the default activation for hidden layers. The specification here could be overwritten - by layer-wise specification in the ``spec`` argument. Also activation is not - applied to the last, i.e. the prediction layer. See :func:`Activation` for a - list of supported activation types. - :param prefix: keyword argument, default ``gensym()``, used as the prefix to - name the constructed layers. - - :return: the constructed MLP. - - - diff --git a/docs/api/optimizer.rst b/docs/api/optimizer.rst deleted file mode 100644 index 03c9c11fed4a..000000000000 --- a/docs/api/optimizer.rst +++ /dev/null @@ -1,194 +0,0 @@ - -Optimizers -========== - -Common interfaces ------------------ - - - - -.. class:: AbstractOptimizer - - Base type for all optimizers. - - - - -.. class:: AbstractLearningRateScheduler - - Base type for all learning rate scheduler. - - - - -.. class:: AbstractMomentumScheduler - - Base type for all momentum scheduler. - - - - -.. class:: OptimizationState - - .. 
attribute:: batch_size - - The size of the mini-batch used in stochastic training. - - .. attribute:: curr_epoch - - The current epoch count. Epoch 0 means no training yet, during the first - pass through the data, the epoch will be 1; during the second pass, the - epoch count will be 2, and so on. - - .. attribute:: curr_batch - - The current mini-batch count. The batch count is reset during every epoch. - The batch count 0 means the beginning of each epoch, with no mini-batch - seen yet. During the first mini-batch, the mini-batch count will be 1. - - .. attribute:: curr_iter - - The current iteration count. One iteration corresponds to one mini-batch, - but unlike the mini-batch count, the iteration count does **not** reset - in each epoch. So it tracks the *total* number of mini-batches seen so far. - - - - -.. function:: get_learning_rate(scheduler, state) - - :param AbstractLearningRateScheduler scheduler: a learning rate scheduler. - :param OptimizationState state: the current state about epoch, mini-batch and iteration count. - :return: the current learning rate. - - - - -.. class:: LearningRate.Fixed - - Fixed learning rate scheduler always returns the same learning rate. - - - - -.. class:: LearningRate.Exp - - :math:`\eta_t = \eta_0\gamma^t`. Here :math:`t` is the epoch count, or the iteration - count if ``decay_on_iteration`` is set to true. - - - - -.. class:: LearningRate.Inv - - :math:`\eta_t = \eta_0 * (1 + \gamma * t)^{-power}`. - Here :math:`t` is the epoch count, or the iteration count if ``decay_on_iteration`` - is set to true. - - - - -.. function:: get_momentum(scheduler, state) - - :param AbstractMomentumScheduler scheduler: the momentum scheduler. - :param OptimizationState state: the state about current epoch, mini-batch and iteration count. - :return: the current momentum. - - - - -.. class:: Momentum.Null - - The null momentum scheduler always returns 0 for momentum. It is also used to - explicitly indicate momentum should not be used.
- - - - -.. class:: Momentum.Fixed - - Fixed momentum scheduler always returns the same value. - - - - -.. function:: get_updater(optimizer) - - :param AbstractOptimizer optimizer: the underlying optimizer. - - A utility function to create an updater function, that uses its closure to - store all the states needed for each weight. - - - - -Built-in optimizers -------------------- - - - - -.. class:: AbstractOptimizerOptions - - Base class for all optimizer options. - - - - -.. function:: normalized_gradient(opts, state, weight, grad) - - :param AbstractOptimizerOptions opts: options for the optimizer, should contain the fields - ``grad_scale``, ``grad_clip`` and ``weight_decay``. - :param OptimizationState state: the current optimization state. - :param NDArray weight: the trainable weights. - :param NDArray grad: the original gradient of the weights. - - Get the properly normalized gradient (re-scaled and clipped if necessary). - - - - -.. class:: SGD - - Stochastic gradient descent optimizer. - - .. function:: SGD(; kwargs...) - - :param Real lr: default `0.01`, learning rate. - :param AbstractLearningRateScheduler lr_scheduler: default `nothing`, a - dynamic learning rate scheduler. If set, will overwrite the `lr` - parameter. - :param Real momentum: default `0.0`, the momentum. - :param AbstractMomentumScheduler momentum_scheduler: default `nothing`, - a dynamic momentum scheduler. If set, will overwrite the `momentum` - parameter. - :param Real grad_clip: default `0`, if positive, will clip the gradient - into the bounded range `[-grad_clip, grad_clip]`. - :param Real weight_decay: default `0.0001`, weight decay is equivalent to - adding a global l2 regularizer to the parameters. - - - - -.. class:: ADAM - - The solver described in Diederik Kingma, Jimmy Ba: *Adam: A Method for - Stochastic Optimization*. arXiv:1412.6980 [cs.LG]. - - .. function:: ADAM(; kwargs...) - - :param Real lr: default `0.001`, learning rate.
- :param AbstractLearningRateScheduler lr_scheduler: default `nothing`, a - dynamic learning rate scheduler. If set, will overwrite the `lr` - parameter. - :param Real beta1: default `0.9`. - :param Real beta2: default `0.999`. - :param Real epsilon: default `1e-8`. - :param Real grad_clip: default `0`, if positive, will clip the gradient - into the range `[-grad_clip, grad_clip]`. - :param Real weight_decay: default `0.00001`, weight decay is equivalent - to adding a global l2 regularizer for all the parameters. - - - diff --git a/docs/api/symbolic-node.rst b/docs/api/symbolic-node.rst deleted file mode 100644 index 125b391046cb..000000000000 --- a/docs/api/symbolic-node.rst +++ /dev/null @@ -1,1591 +0,0 @@ - -Symbolic API -============ - - - - -.. class:: SymbolicNode - - SymbolicNode is the basic building block of the symbolic graph in MXNet.jl. - - - - -.. function:: deepcopy(self :: SymbolicNode) - - Make a deep copy of a SymbolicNode. - - - - -.. function:: copy(self :: SymbolicNode) - - Make a copy of a SymbolicNode. The same as making a deep copy. - - - - -.. function:: - call(self :: SymbolicNode, args :: SymbolicNode...) - call(self :: SymbolicNode; kwargs...) - - Make a new node by composing ``self`` with ``args``. Or the arguments - can be specified using keyword arguments. - - - - -.. function:: list_arguments(self :: SymbolicNode) - - List all the arguments of this node. The argument for a node contains both - the inputs and parameters. For example, a :class:`FullyConnected` node will - have both data and weights in its arguments. A composed node (e.g. a MLP) will - list all the arguments for intermediate nodes. - - :return: A list of symbols indicating the names of the arguments. - - - - -.. function:: list_outputs(self :: SymbolicNode) - - List all the outputs of this node. - - :return: A list of symbols indicating the names of the outputs. - - - - -.. 
function:: list_auxiliary_states(self :: SymbolicNode) - - - List all auxiliary states in the symbol. - - Auxiliary states are special states of symbols that do not correspond to an argument, - and do not have gradients, but are still useful for specific operations. - A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. - Most operators do not have Auxiliary states. - - :return: A list of symbols indicating the names of the auxiliary states. - - - - -.. function:: get_internals(self :: SymbolicNode) - - Get a new grouped :class:`SymbolicNode` whose output contains all the internal outputs of - this :class:`SymbolicNode`. - - - - -.. function:: get_attr(self :: SymbolicNode, key :: Symbol) - - Get attribute attached to this :class:`SymbolicNode` belonging to key. - :return: The value belonging to key as a :class:`Nullable`. - - - - -.. function:: set_attr(self:: SymbolicNode, key :: Symbol, value :: AbstractString) - - Set the attribute key to value for this :class:`SymbolicNode`. - - .. warning:: - - It is encouraged not to call this function directly, unless you know exactly what you are doing. The - recommended way of setting attributes is when creating the :class:`SymbolicNode`. Changing - the attributes of a :class:`SymbolicNode` that has already been used somewhere else might - cause unexpected behavior and inconsistency. - - - - -.. function:: Variable(name :: Union{Symbol, AbstractString}) - - Create a symbolic variable with the given name. This is typically used as a placeholder. - For example, the data node, acting as the starting point of a network architecture. - - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`Variable`. - - - - -.. function:: Group(nodes :: SymbolicNode...) - - Create a :class:`SymbolicNode` by grouping nodes together. - - - - -.. function:: - infer_shape(self :: SymbolicNode, args...) - infer_shape(self :: SymbolicNode; kwargs...)
- - Do shape inference according to the input shapes. The input shapes could be provided - as a list of shapes, which should specify the shapes of inputs in the same order as - the arguments returned by :func:`list_arguments`. Alternatively, the shape information - could be specified via keyword arguments. - - :return: A 3-tuple containing shapes of all the arguments, shapes of all the outputs and - shapes of all the auxiliary variables. If shape inference failed due to incomplete - or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. - - - - -.. function:: - getindex(self :: SymbolicNode, idx :: Union{Int, Base.Symbol, AbstractString}) - - Get a node representing the specified output of this node. The index could be - a symbol or string indicating the name of the output, or a 1-based integer - indicating the index, as in the list of :func:`list_outputs`. - - - - -.. function:: to_json(self :: SymbolicNode) - - Convert a :class:`SymbolicNode` into a JSON string. - - - - -.. function:: from_json(repr :: AbstractString, ::Type{SymbolicNode}) - - Load a :class:`SymbolicNode` from a JSON string representation. - - - - -.. function:: load(filename :: AbstractString, ::Type{SymbolicNode}) - - Load a :class:`SymbolicNode` from a JSON file. - - - - -.. function:: save(filename :: AbstractString, node :: SymbolicNode) - - Save a :class:`SymbolicNode` to a JSON file. - - - - -libmxnet APIs -------------- - -Public APIs -^^^^^^^^^^^ -.. function:: Activation(...) - - Apply activation function to input.Softmax Activation is only available with CUDNN on GPUand will be computed at each location across channel if input is 4D. - - :param data: Input data to activation function. - :type data: SymbolicNode - - - :param act_type: Activation function to be applied. - :type act_type: {'relu', 'sigmoid', 'softrelu', 'tanh'}, required - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. 
- :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: BatchNorm(...) - - Apply batch normalization to input. - - :param data: Input data to batch normalization - :type data: SymbolicNode - - - :param eps: Epsilon to prevent div 0 - :type eps: float, optional, default=0.001 - - - :param momentum: Momentum for moving average - :type momentum: float, optional, default=0.9 - - - :param fix_gamma: Fix gamma while training - :type fix_gamma: boolean, optional, default=True - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: BlockGrad(...) - - Get output from a symbol and pass 0 gradient back - - :param data: Input data. - :type data: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Cast(...) - - Cast array to a different data type. - - :param data: Input data to cast function. - :type data: SymbolicNode - - - :param dtype: Target data type. - :type dtype: {'float16', 'float32', 'float64', 'int32', 'uint8'}, required - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Concat(...) - - Perform an feature concat on channel dim (dim 1) over all the inputs. - - This function support variable length positional :class:`SymbolicNode` inputs. - - :param data: List of tensors to concatenate - :type data: SymbolicNode[] - - - :param num_args: Number of inputs to be concated. 
- :type num_args: int, required - - - :param dim: the dimension to be concated. - :type dim: int, optional, default='1' - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Convolution(...) - - Apply convolution to input then add a bias. - - :param data: Input data to the ConvolutionOp. - :type data: SymbolicNode - - - :param weight: Weight matrix. - :type weight: SymbolicNode - - - :param bias: Bias parameter. - :type bias: SymbolicNode - - - :param kernel: convolution kernel size: (y, x) - :type kernel: Shape(tuple), required - - - :param stride: convolution stride: (y, x) - :type stride: Shape(tuple), optional, default=(1,1) - - - :param dilate: convolution dilate: (y, x) - :type dilate: Shape(tuple), optional, default=(1,1) - - - :param pad: pad for convolution: (y, x) - :type pad: Shape(tuple), optional, default=(0,0) - - - :param num_filter: convolution filter(channel) number - :type num_filter: int (non-negative), required - - - :param num_group: Number of groups partition. This option is not supported by CuDNN, you can use SliceChannel to num_group,apply convolution and concat instead to achieve the same need. - :type num_group: int (non-negative), optional, default=1 - - - :param workspace: Tmp workspace for convolution (MB). - :type workspace: long (non-negative), optional, default=512 - - - :param no_bias: Whether to disable bias parameter. - :type no_bias: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Crop(...) 
- - Crop the 2nd and 3rd dim of input data, with the corresponding size of h_w or with width and height of the second input symbol, i.e., with one input, we need h_w to specify the crop height and width, otherwise the second input symbol's size will be used - - This function supports variable length positional :class:`SymbolicNode` inputs. - - :param data: Tensor or List of Tensors, the second input will be used as crop_like shape reference - :type data: SymbolicNode or SymbolicNode[] - - - :param num_args: Number of inputs for crop, if equals one, then we will use the h_w for crop height and width, else if equals two, then we will use the height and width of the second input symbol, we name crop_like here - :type num_args: int, required - - - :param offset: crop offset coordinate: (y, x) - :type offset: Shape(tuple), optional, default=(0,0) - - - :param h_w: crop height and width: (h, w) - :type h_w: Shape(tuple), optional, default=(0,0) - - - :param center_crop: If set to true, then it will use the center_crop, or it will crop using the shape of crop_like - :type center_crop: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: CuDNNBatchNorm(...) - - Apply batch normalization to input. - - :param data: Input data to batch normalization - :type data: SymbolicNode - - - :param eps: Epsilon to prevent div 0 - :type eps: float, optional, default=0.001 - - - :param momentum: Momentum for moving average - :type momentum: float, optional, default=0.9 - - - :param fix_gamma: Fix gamma while training - :type fix_gamma: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`.
- - :return: SymbolicNode. - - - - - -.. function:: Deconvolution(...) - - Apply deconvolution to input then add a bias. - - :param data: Input data to the DeconvolutionOp. - :type data: SymbolicNode - - - :param weight: Weight matrix. - :type weight: SymbolicNode - - - :param bias: Bias parameter. - :type bias: SymbolicNode - - - :param kernel: deconvolution kernel size: (y, x) - :type kernel: Shape(tuple), required - - - :param stride: deconvolution stride: (y, x) - :type stride: Shape(tuple), optional, default=(1,1) - - - :param pad: pad for deconvolution: (y, x) - :type pad: Shape(tuple), optional, default=(0,0) - - - :param num_filter: deconvolution filter(channel) number - :type num_filter: int (non-negative), required - - - :param num_group: number of groups partition - :type num_group: int (non-negative), optional, default=1 - - - :param workspace: Tmp workspace for deconvolution (MB) - :type workspace: long (non-negative), optional, default=512 - - - :param no_bias: Whether to disable bias parameter. - :type no_bias: boolean, optional, default=True - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Dropout(...) - - Apply dropout to input - - :param data: Input data to dropout. - :type data: SymbolicNode - - - :param p: Fraction of the input that gets dropped out at training time - :type p: float, optional, default=0.5 - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: ElementWiseSum(...) - - Perform an elementwise sum over all the inputs. - - This function support variable length positional :class:`SymbolicNode` inputs. 
- - :param num_args: Number of inputs to be summed. - :type num_args: int, required - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Embedding(...) - - Get embedding for one-hot input. An n-dimensional input tensor will be transformed into a (n+1)-dimensional tensor, where a new dimension is added for the embedding results. - - :param data: Input data to the EmbeddingOp. - :type data: SymbolicNode - - - :param weight: Embedding weight matrix. - :type weight: SymbolicNode - - - :param input_dim: input dim of one-hot encoding - :type input_dim: int, required - - - :param output_dim: output dim of embedding - :type output_dim: int, required - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Flatten(...) - - Flatten input - - :param data: Input data to flatten. - :type data: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: FullyConnected(...) - - Apply matrix multiplication to input then add a bias. - - :param data: Input data to the FullyConnectedOp. - :type data: SymbolicNode - - - :param weight: Weight matrix. - :type weight: SymbolicNode - - - :param bias: Bias parameter. - :type bias: SymbolicNode - - - :param num_hidden: Number of hidden nodes of the output. - :type num_hidden: int, required - - - :param no_bias: Whether to disable bias parameter. - :type no_bias: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`.
(e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: IdentityAttachKLSparseReg(...) - - Apply a sparse regularization to the output of a sigmoid activation function. - - :param data: Input data. - :type data: SymbolicNode - - - :param sparseness_target: The sparseness target - :type sparseness_target: float, optional, default=0.1 - - - :param penalty: The tradeoff parameter for the sparseness penalty - :type penalty: float, optional, default=0.001 - - - :param momentum: The momentum for running average - :type momentum: float, optional, default=0.9 - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: LRN(...) - - Apply local response normalization to input. - - :param data: Input data to the LRN operator. - :type data: SymbolicNode - - - :param alpha: value of the alpha variance scaling parameter in the normalization formula - :type alpha: float, optional, default=0.0001 - - - :param beta: value of the beta power parameter in the normalization formula - :type beta: float, optional, default=0.75 - - - :param knorm: value of the k parameter in normalization formula - :type knorm: float, optional, default=2 - - - :param nsize: normalization window width in elements. - :type nsize: int (non-negative), required - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: LeakyReLU(...) - - Apply activation function to input. - - :param data: Input data to activation function. - :type data: SymbolicNode - - - :param act_type: Activation function to be applied.
- :type act_type: {'elu', 'leaky', 'prelu', 'rrelu'},optional, default='leaky' - - - :param slope: Init slope for the activation. (For leaky and elu only) - :type slope: float, optional, default=0.25 - - - :param lower_bound: Lower bound of random slope. (For rrelu only) - :type lower_bound: float, optional, default=0.125 - - - :param upper_bound: Upper bound of random slope. (For rrelu only) - :type upper_bound: float, optional, default=0.334 - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: LinearRegressionOutput(...) - - Use linear regression for final output, this is used on final output of a net. - - :param data: Input data to function. - :type data: SymbolicNode - - - :param label: Input label to function. - :type label: SymbolicNode - - - :param grad_scale: Scale the gradient by a float factor - :type grad_scale: float, optional, default=1 - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: LogisticRegressionOutput(...) - - Use Logistic regression for final output, this is used on final output of a net. - Logistic regression is suitable for binary classification or probability prediction tasks. - - :param data: Input data to function. - :type data: SymbolicNode - - - :param label: Input label to function. - :type label: SymbolicNode - - - :param grad_scale: Scale the gradient by a float factor - :type grad_scale: float, optional, default=1 - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. 
- - - - - -.. function:: MAERegressionOutput(...) - - Use mean absolute error regression for final output, this is used on final output of a net. - - :param data: Input data to function. - :type data: SymbolicNode - - - :param label: Input label to function. - :type label: SymbolicNode - - - :param grad_scale: Scale the gradient by a float factor - :type grad_scale: float, optional, default=1 - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Pooling(...) - - Perform spatial pooling on inputs. - - :param data: Input data to the pooling operator. - :type data: SymbolicNode - - - :param kernel: pooling kernel size: (y, x) - :type kernel: Shape(tuple), required - - - :param pool_type: Pooling type to be applied. - :type pool_type: {'avg', 'max', 'sum'}, required - - - :param stride: stride: for pooling (y, x) - :type stride: Shape(tuple), optional, default=(1,1) - - - :param pad: pad for pooling: (y, x) - :type pad: Shape(tuple), optional, default=(0,0) - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: Reshape(...) - - Reshape input to target shape - - :param data: Input data to reshape. - :type data: SymbolicNode - - - :param target_shape: Target new shape. One and only one dim can be 0, in which case it will be inferred from the rest of dims - :type target_shape: Shape(tuple), required - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: SliceChannel(...) 
- - Slice input equally along specified axis - - :param num_outputs: Number of outputs to be sliced. - :type num_outputs: int, required - - - :param axis: Dimension along which to slice. - :type axis: int, optional, default='1' - - - :param squeeze_axis: If true AND the sliced dimension becomes 1, squeeze that dimension. - :type squeeze_axis: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode[]. - - - - - -.. function:: Softmax(...) - - DEPRECATED: Perform a softmax transformation on input. Please use SoftmaxOutput - - :param data: Input data to softmax. - :type data: SymbolicNode - - - :param grad_scale: Scale the gradient by a float factor - :type grad_scale: float, optional, default=1 - - - :param ignore_label: the ignore_label will not work in backward, and this only be used when multi_output=true - :type ignore_label: float, optional, default=-1 - - - :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensional input tensor, softmax will generate n*x_1*...*x_n output, each has k classes - :type multi_output: boolean, optional, default=False - - - :param use_ignore: If set to true, the ignore_label value will not contribute to the backward gradient - :type use_ignore: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: SoftmaxActivation(...) - - Apply softmax activation to input. This is intended for internal layers. For output (loss layer) please use SoftmaxOutput. If type=instance, this operator will compute a softmax for each instance in the batch; this is the default mode. 
If type=channel, this operator will compute a num_channel-class softmax at each position of each instance; this can be used for fully convolutional network, image segmentation, etc. - - :param data: Input data to activation function. - :type data: SymbolicNode - - - :param type: Softmax Mode. If set to instance, this operator will compute a softmax for each instance in the batch; this is the default mode. If set to channel, this operator will compute a num_channel-class softmax at each position of each instance; this can be used for fully convolutional network, image segmentation, etc. - :type type: {'channel', 'instance'},optional, default='instance' - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: SoftmaxOutput(...) - - Perform a softmax transformation on input, backprop with logloss. - - :param data: Input data to softmax. - :type data: SymbolicNode - - - :param label: Label data. - :type label: SymbolicNode - - - :param grad_scale: Scale the gradient by a float factor - :type grad_scale: float, optional, default=1 - - - :param ignore_label: the ignore_label will not work in backward, and this only be used when multi_output=true - :type ignore_label: float, optional, default=-1 - - - :param multi_output: If set to true, for a (n,k,x_1,..,x_n) dimensional input tensor, softmax will generate n*x_1*...*x_n output, each has k classes - :type multi_output: boolean, optional, default=False - - - :param use_ignore: If set to true, the ignore_label value will not contribute to the backward gradient - :type use_ignore: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. 
- - - - - -.. function:: SwapAxis(...) - - Apply swapaxis to input. - - :param data: Input data to the SwapAxisOp. - :type data: SymbolicNode - - - :param dim1: the first axis to be swapped. - :type dim1: int (non-negative), optional, default=0 - - - :param dim2: the second axis to be swapped. - :type dim2: int (non-negative), optional, default=0 - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: UpSampling(...) - - Perform nearest neighboor/bilinear up sampling to inputs - - This function support variable length positional :class:`SymbolicNode` inputs. - - :param data: Array of tensors to upsample - :type data: SymbolicNode[] - - - :param scale: Up sampling scale - :type scale: int (non-negative), required - - - :param num_filter: Input filter. Only used by nearest sample_type. - :type num_filter: int (non-negative), optional, default=0 - - - :param sample_type: upsampling method - :type sample_type: {'bilinear', 'nearest'}, required - - - :param multi_input_mode: How to handle multiple input. concat means concatenate upsampled images along the channel dimension. sum means add all images together, only available for nearest neighbor upsampling. - :type multi_input_mode: {'concat', 'sum'},optional, default='concat' - - - :param num_args: Number of inputs to be upsampled. For nearest neighbor upsampling, this can be 1-N; the size of output will be(scale*h_0,scale*w_0) and all other inputs will be upsampled to thesame size. For bilinear upsampling this must be 2; 1 input and 1 weight. - :type num_args: int, required - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: abs(...) 
- - Take absolute value of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: ceil(...) - - Take ceil value of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: cos(...) - - Take cos of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: exp(...) - - Take exp of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: floor(...) - - Take floor value of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. 
`:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: log(...) - - Take log of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: round(...) - - Take round value of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: rsqrt(...) - - Take rsqrt of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: sign(...) - - Take sign value of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: sin(...) 
- - Take sin of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: sqrt(...) - - Take sqrt of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: square(...) - - Take square of the src - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: transpose(...) - - Transpose the input matrix and return a new one - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - -Internal APIs -^^^^^^^^^^^^^ - -.. note:: - - Document and signatures for internal API functions might be incomplete. - -.. function:: _CrossDeviceCopy(...) - - Special op to copy data cross device - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. 
`:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _Div(...) - - Multiply lhs by rhs - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: _DivScalar(...) - - Perform an elementwise div. - - :param array: Input array operand to the operation. - :type array: SymbolicNode - - - :param scalar: scalar value. - :type scalar: float, required - - - :param scalar_on_left: scalar operand is on the left. - :type scalar_on_left: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _Maximum(...) - - Elementwise max of lhs by rhs - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: _MaximumScalar(...) - - Perform an elementwise maximum. - - :param array: Input array operand to the operation. - :type array: SymbolicNode - - - :param scalar: scalar value. - :type scalar: float, required - - - :param scalar_on_left: scalar operand is on the left. 
- :type scalar_on_left: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _Minimum(...) - - Elementwise min of lhs by rhs - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: _MinimumScalar(...) - - Perform an elementwise minimum. - - :param array: Input array operand to the operation. - :type array: SymbolicNode - - - :param scalar: scalar value. - :type scalar: float, required - - - :param scalar_on_left: scalar operand is on the left. - :type scalar_on_left: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _Minus(...) - - Minus lhs and rhs - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: _MinusScalar(...) - - Perform an elementwise minus. - - :param array: Input array operand to the operation. - :type array: SymbolicNode - - - :param scalar: scalar value. 
- :type scalar: float, required - - - :param scalar_on_left: scalar operand is on the left. - :type scalar_on_left: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _Mul(...) - - Multiply lhs and rhs - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: _MulScalar(...) - - Perform an elementwise mul. - - :param array: Input array operand to the operation. - :type array: SymbolicNode - - - :param scalar: scalar value. - :type scalar: float, required - - - :param scalar_on_left: scalar operand is on the left. - :type scalar_on_left: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _NDArray(...) - - Stub for implementing an operator implemented in native frontend language with ndarray. - - :param info: - :type info: , required - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _Native(...) - - Stub for implementing an operator implemented in native frontend language. 
- - :param info: - :type info: , required - - - :param need_top_grad: Whether this layer needs out grad for backward. Should be false for loss layers. - :type need_top_grad: boolean, optional, default=True - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _Plus(...) - - Add lhs and rhs - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: _PlusScalar(...) - - Perform an elementwise plus. - - :param array: Input array operand to the operation. - :type array: SymbolicNode - - - :param scalar: scalar value. - :type scalar: float, required - - - :param scalar_on_left: scalar operand is on the left. - :type scalar_on_left: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - -.. function:: _Power(...) - - Elementwise power(lhs, rhs) - - :param lhs: Left symbolic input to the function - :type lhs: SymbolicNode - - - :param rhs: Left symbolic input to the function - :type rhs: SymbolicNode - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: . - - - - - -.. function:: _PowerScalar(...) - - Perform an elementwise power. - - :param array: Input array operand to the operation. 
- :type array: SymbolicNode - - - :param scalar: scalar value. - :type scalar: float, required - - - :param scalar_on_left: scalar operand is on the left. - :type scalar_on_left: boolean, optional, default=False - - :param Symbol name: The name of the :class:`SymbolicNode`. (e.g. `:my_symbol`), optional. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`. - - :return: SymbolicNode. - - - - - - - - diff --git a/docs/api/visualize.rst b/docs/api/visualize.rst deleted file mode 100644 index 42857c5f4ff0..000000000000 --- a/docs/api/visualize.rst +++ /dev/null @@ -1,19 +0,0 @@ - -Network Visualization -===================== - - - - -.. function:: to_graphviz(network) - - :param SymbolicNode network: the network to visualize. - :param AbstractString title: keyword argument, default "Network Visualization", - the title of the GraphViz graph. - :param input_shapes: keyword argument, default ``nothing``. If provided, - will run shape inference and plot with the shape information. Should - be either a dictionary of name-shape mapping or an array of shapes. - :return: the graph description in GraphViz ``dot`` language. - - - diff --git a/docs/build-api.jl b/docs/build-api.jl deleted file mode 100644 index c8e54677096f..000000000000 --- a/docs/build-api.jl +++ /dev/null @@ -1,98 +0,0 @@ -# extract API docs -using MXNet - -const SRC_DIR = joinpath(Pkg.dir("MXNet"), "src") -const API_DIR = joinpath(Pkg.dir("MXNet"), "docs", "api") - -################################################################################# -# Document Builders -################################################################################# -function extract_doc(output_filename::AbstractString, input_filenames::AbstractString...) 
- mkpath(API_DIR) - open(joinpath(API_DIR, output_filename), "w") do io - for in_fn in input_filenames - for doc in eachmatch(r"^#=doc\s*$(.*?)^=#\s*$"ms, readall(joinpath(SRC_DIR, in_fn))) - println(io, doc.captures[1], "\n\n") - end - end - end -end - -function sort_api_names(names) - names = collect(names) - names_pub = filter(x -> !startswith(string(x), '_'), names) - names_pri = filter(x -> startswith(string(x), '_'), names) - return (sort(names_pub), sort(names_pri)) -end - -function embed_mxnet_api(output_filename::AbstractString, key::AbstractString, generator::Function) - output_filename = joinpath(API_DIR, output_filename) - contents = readall(output_filename) - open(output_filename, "w") do io - docs = generator(gen_docs=true) - function gen_doc(fname) - doc = replace(docs[fname], r"^"m, " ") - """ - .. function:: $fname(...) - - $doc - - """ - end - - names_pub, names_pri = sort_api_names(keys(docs)) - docs_pub = join(map(gen_doc, names_pub), "\n\n") - docs_pri = join(map(gen_doc, names_pri), "\n\n") - if isempty(names_pri) - docstrings = "" - else - docstrings = """ - Public APIs - ^^^^^^^^^^^ - """ - end - docstrings *= docs_pub - - if !isempty(names_pri) - docstrings *= """ - - Internal APIs - ^^^^^^^^^^^^^ - - .. note:: - - Document and signatures for internal API functions might be incomplete. 
- - """ * docs_pri - end - - key = mx.format(mx.DOC_EMBED_ANCHOR, key) - println(io, replace(contents, key, docstrings)) - end -end - -################################################################################# -# Build Documents -################################################################################# -extract_doc("context.rst", "context.jl") - -extract_doc("ndarray.rst", "ndarray.jl") -embed_mxnet_api("ndarray.rst", "ndarray", mx._import_ndarray_functions) - -extract_doc("symbolic-node.rst", "symbolic-node.jl") -embed_mxnet_api("symbolic-node.rst", "symbolic-node", mx._import_atomic_symbol_creators) - -extract_doc("executor.rst", "executor.jl") - -extract_doc("initializer.rst", "initializer.jl") -extract_doc("callback.rst", "callback.jl") -extract_doc("model.rst", "model.jl") - -extract_doc("optimizer.rst", "optimizer.jl", "optimizers/sgd.jl", "optimizers/adam.jl") -extract_doc("metric.rst", "metric.jl") - -extract_doc("io.rst", "io.jl") -embed_mxnet_api("io.rst", "io", mx._import_io_iterators) - -extract_doc("visualize.rst", "visualize.jl") -extract_doc("nn-factory.rst", "nn-factory.jl") diff --git a/docs/conf.py b/docs/conf.py deleted file mode 100644 index 7454faa99eee..000000000000 --- a/docs/conf.py +++ /dev/null @@ -1,277 +0,0 @@ -# -*- coding: utf-8 -*- -# -# MXNet documentation build configuration file, created by -# sphinx-quickstart on Thu Nov 13 00:43:40 2014. -# -# This file is execfile()d with the current directory set to its -# containing dir. -# -# Note that not all possible configuration values are present in this -# autogenerated file. -# -# All configuration values have a default; values that are commented out -# serve to show the default. - -import sys -import os - -# If extensions (or modules to document with autodoc) are in another directory, -# add these directories to sys.path here. If the directory is relative to the -# documentation root, use os.path.abspath to make it absolute, like shown here. 
-#sys.path.insert(0, os.path.abspath('.')) -sys.path.insert(0, os.path.abspath("sphinx")) -import julia - -# -- General configuration ------------------------------------------------ - -# If your documentation needs a minimal Sphinx version, state it here. -#needs_sphinx = '1.0' - -# Add any Sphinx extension module names here, as strings. They can be -# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom -# ones. -extensions = [ - 'sphinx.ext.mathjax', - 'julia' -] - -# Add any paths that contain templates here, relative to this directory. -templates_path = ['_templates'] - -# The suffix of source filenames. -source_suffix = '.rst' - -# The encoding of source files. -#source_encoding = 'utf-8-sig' - -# The master toctree document. -master_doc = 'index' - -# General information about the project. -project = u'MXNet' -copyright = u'2015, pluskid' - -# The version info for the project you're documenting, acts as replacement for -# |version| and |release|, also used in various other places throughout the -# built documents. -# -# The short X.Y version. -version = '0.0.8' -# The full version, including alpha/beta/rc tags. -release = '0.0.8' - -# The language for content autogenerated by Sphinx. Refer to documentation -# for a list of supported languages. -#language = None - -# There are two options for replacing |today|: either, you set today to some -# non-false value, then it is used: -#today = '' -# Else, today_fmt is used as the format for a strftime call. -#today_fmt = '%B %d, %Y' - -# List of patterns, relative to source directory, that match files and -# directories to ignore when looking for source files. -exclude_patterns = ['_build'] - -# The reST default role (used for this markup: `text`) to use for all -# documents. -#default_role = None - -# If true, '()' will be appended to :func: etc. cross-reference text. 
-#add_function_parentheses = True - -# If true, the current module name will be prepended to all description -# unit titles (such as .. function::). -#add_module_names = True - -# If true, sectionauthor and moduleauthor directives will be shown in the -# output. They are ignored by default. -#show_authors = False - -# The name of the Pygments (syntax highlighting) style to use. -pygments_style = 'sphinx' - -# A list of ignored prefixes for module index sorting. -#modindex_common_prefix = [] - -primary_domain = 'jl' -highlight_language = 'julia' - -# If true, keep warnings as "system message" paragraphs in the built documents. -#keep_warnings = False - - -# -- Options for HTML output ---------------------------------------------- - -# The theme to use for HTML and HTML Help pages. See the documentation for -# a list of builtin theme -html_theme = 'default' - -import os -on_rtd = os.environ.get('READTHEDOCS', None) == 'True' - -if not on_rtd: # only import and set the theme if we're building docs locally - try: - import sphinx_rtd_theme - html_theme = "sphinx_rtd_theme" - html_theme_path = [sphinx_rtd_theme.get_html_theme_path()] - except: - pass - -# Theme options are theme-specific and customize the look and feel of a theme -# further. For a list of options available for each theme, see the -# documentation. -#html_theme_options = {} - -# Add any paths that contain custom themes here, relative to this directory. -#html_theme_path = [] - -# The name for this set of Sphinx documents. If None, it defaults to -# " v documentation". -#html_title = None - -# A shorter title for the navigation bar. Default is the same as html_title. -#html_short_title = None - -# The name of an image file (relative to this directory) to place at the top -# of the sidebar. -#html_logo = None - -# The name of an image file (within the static path) to use as favicon of the -# docs. This file should be a Windows icon file (.ico) being 16x16 or 32x32 -# pixels large. 
-#html_favicon = None - -# Add any paths that contain custom static files (such as style sheets) here, -# relative to this directory. They are copied after the builtin static files, -# so a file named "default.css" will overwrite the builtin "default.css". -html_static_path = ['_static'] - -# Add any extra paths that contain custom files (such as robots.txt or -# .htaccess) here, relative to this directory. These files are copied -# directly to the root of the documentation. -#html_extra_path = [] - -# If not '', a 'Last updated on:' timestamp is inserted at every page bottom, -# using the given strftime format. -#html_last_updated_fmt = '%b %d, %Y' - -# If true, SmartyPants will be used to convert quotes and dashes to -# typographically correct entities. -#html_use_smartypants = True - -# Custom sidebar templates, maps document names to template names. -#html_sidebars = {} - -# Additional templates that should be rendered to pages, maps page names to -# template names. -#html_additional_pages = {} - -# If false, no module index is generated. -#html_domain_indices = True - -# If false, no index is generated. -#html_use_index = True - -# If true, the index is split into individual pages for each letter. -#html_split_index = False - -# If true, links to the reST sources are added to the pages. -#html_show_sourcelink = True - -# If true, "Created using Sphinx" is shown in the HTML footer. Default is True. -#html_show_sphinx = True - -# If true, "(C) Copyright ..." is shown in the HTML footer. Default is True. -#html_show_copyright = True - -# If true, an OpenSearch description file will be output, and all pages will -# contain a tag referring to it. The value of this option must be the -# base URL from which the finished HTML is served. -#html_use_opensearch = '' - -# This is the file name suffix for HTML files (e.g. ".xhtml"). -#html_file_suffix = None - -# Output file base name for HTML help builder. 
-htmlhelp_basename = 'MXNetdoc' - - -# -- Options for LaTeX output --------------------------------------------- - -latex_elements = { -# The paper size ('letterpaper' or 'a4paper'). -#'papersize': 'letterpaper', - -# The font size ('10pt', '11pt' or '12pt'). -#'pointsize': '10pt', - -# Additional stuff for the LaTeX preamble. -#'preamble': '', -} - -# Grouping the document tree into LaTeX files. List of tuples -# (source start file, target name, title, -# author, documentclass [howto, manual, or own class]). -latex_documents = [ - ('index', 'MXNet.tex', u'MXNet Documentation', - u'pluskid', 'manual'), -] - -# The name of an image file (relative to this directory) to place at the top of -# the title page. -#latex_logo = None - -# For "manual" documents, if this is true, then toplevel headings are parts, -# not chapters. -#latex_use_parts = False - -# If true, show page references after internal links. -#latex_show_pagerefs = False - -# If true, show URL addresses after external links. -#latex_show_urls = False - -# Documents to append as an appendix to all manuals. -#latex_appendices = [] - -# If false, no module index is generated. -#latex_domain_indices = True - - -# -- Options for manual page output --------------------------------------- - -# One entry per manual page. List of tuples -# (source start file, name, description, authors, manual section). -man_pages = [ - ('index', 'mxnet', u'MXNet Documentation', - [u'pluskid'], 1) -] - -# If true, show URL addresses after external links. -#man_show_urls = False - - -# -- Options for Texinfo output ------------------------------------------- - -# Grouping the document tree into Texinfo files. List of tuples -# (source start file, target name, title, author, -# dir menu entry, description, category) -texinfo_documents = [ - ('index', 'MXNet', u'MXNet Documentation', - u'pluskid', 'MXNet', 'One line description of project.', - 'Miscellaneous'), -] - -# Documents to append as an appendix to all manuals. 
-#texinfo_appendices = [] - -# If false, no module index is generated. -#texinfo_domain_indices = True - -# How to display URL addresses: 'footnote', 'no', or 'inline'. -#texinfo_show_urls = 'footnote' - -# If true, do not generate a @detailmenu in the "Top" node's menu. -#texinfo_no_detailmenu = False diff --git a/docs/index.rst b/docs/index.rst deleted file mode 100644 index 7e95b6a7c10e..000000000000 --- a/docs/index.rst +++ /dev/null @@ -1,55 +0,0 @@ -%%%%%%%%%%%%%%%%%%% -MXNet Documentation -%%%%%%%%%%%%%%%%%%% - -`MXNet.jl `_ is `Julia -`_ package of `dmlc/mxnet -`_. MXNet.jl brings flexible and efficient GPU -computing and state-of-art deep learning to Julia. Some highlight of features -include: - -- Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. -- Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. - -For more details, see documentation below. Please also checkout the `examples -`_ directory. - -.. toctree:: - :maxdepth: 2 - :caption: Tutorials - - tutorial/mnist - tutorial/char-lstm - -.. toctree:: - :maxdepth: 2 - :caption: User's Guide - - user-guide/install - user-guide/overview - user-guide/faq - -.. toctree:: - :maxdepth: 1 - :caption: API Documentation - - api/context - api/model - api/initializer - api/optimizer - api/callback - api/metric - api/io - api/ndarray - api/symbolic-node - api/nn-factory - api/executor - api/visualize - -Indices and tables -================== - -* :ref:`genindex` -* :ref:`modindex` -* :ref:`search` - diff --git a/docs/sphinx/julia.py b/docs/sphinx/julia.py deleted file mode 100644 index 49d6af95b545..000000000000 --- a/docs/sphinx/julia.py +++ /dev/null @@ -1,23 +0,0 @@ -# Julia domain for Sphinx (stolen from StrPack.jl) -# http://sphinx.pocoo.org/domains.html - -import re -import sphinx.domains.python - -sphinx.domains.python.py_sig_re = re.compile( - r'''^ ([\w.]*\.)? 
# class name(s) - ([^\s(]+) \s* # thing name - (?: \((.*)\) # optional: arguments - (?:\s* -> \s* (.*))? # return annotation - )? $ # and nothing more - ''', re.VERBOSE | re.UNICODE) - -class JuliaDomain(sphinx.domains.python.PythonDomain): - """Julia language domain.""" - name = 'jl' - label = 'Julia' - -JuliaDomain.directives['type'] = JuliaDomain.directives['class'] - -def setup(app): - app.add_domain(JuliaDomain) diff --git a/docs/src/index.md b/docs/src/index.md index e69de29bb2d1..7e95b6a7c10e 100644 --- a/docs/src/index.md +++ b/docs/src/index.md @@ -0,0 +1,55 @@ +%%%%%%%%%%%%%%%%%%% +MXNet Documentation +%%%%%%%%%%%%%%%%%%% + +`MXNet.jl `_ is `Julia +`_ package of `dmlc/mxnet +`_. MXNet.jl brings flexible and efficient GPU +computing and state-of-art deep learning to Julia. Some highlight of features +include: + +- Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. +- Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. + +For more details, see documentation below. Please also checkout the `examples +`_ directory. + +.. toctree:: + :maxdepth: 2 + :caption: Tutorials + + tutorial/mnist + tutorial/char-lstm + +.. toctree:: + :maxdepth: 2 + :caption: User's Guide + + user-guide/install + user-guide/overview + user-guide/faq + +.. 
toctree:: + :maxdepth: 1 + :caption: API Documentation + + api/context + api/model + api/initializer + api/optimizer + api/callback + api/metric + api/io + api/ndarray + api/symbolic-node + api/nn-factory + api/executor + api/visualize + +Indices and tables +================== + +* :ref:`genindex` +* :ref:`modindex` +* :ref:`search` + diff --git a/docs/tutorial/char-lstm.rst b/docs/src/tutorial/char-lstm.rst similarity index 100% rename from docs/tutorial/char-lstm.rst rename to docs/src/tutorial/char-lstm.rst diff --git a/docs/tutorial/images/LSTM3-chain.png b/docs/src/tutorial/images/LSTM3-chain.png similarity index 100% rename from docs/tutorial/images/LSTM3-chain.png rename to docs/src/tutorial/images/LSTM3-chain.png diff --git a/docs/tutorial/images/char-lstm-vis.svg b/docs/src/tutorial/images/char-lstm-vis.svg similarity index 100% rename from docs/tutorial/images/char-lstm-vis.svg rename to docs/src/tutorial/images/char-lstm-vis.svg diff --git a/docs/tutorial/mnist.rst b/docs/src/tutorial/mnist.rst similarity index 100% rename from docs/tutorial/mnist.rst rename to docs/src/tutorial/mnist.rst diff --git a/docs/user-guide/faq.rst b/docs/src/user-guide/faq.rst similarity index 100% rename from docs/user-guide/faq.rst rename to docs/src/user-guide/faq.rst diff --git a/docs/user-guide/install.rst b/docs/src/user-guide/install.rst similarity index 100% rename from docs/user-guide/install.rst rename to docs/src/user-guide/install.rst diff --git a/docs/user-guide/overview.rst b/docs/src/user-guide/overview.rst similarity index 100% rename from docs/user-guide/overview.rst rename to docs/src/user-guide/overview.rst From 504aec63352f484fe915c902f2d9f92e6cc86ede Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 6 Jul 2016 04:19:29 +0900 Subject: [PATCH 347/630] do some housekeeping and start moving things to markdown --- docs/make.jl | 4 +- docs/src/api.md | 5 ++ docs/src/index.md | 61 ++++--------------- docs/src/tutorial.md | 0 .../tutorial/{char-lstm.rst 
=> char-lstm.md} | 0 docs/src/tutorial/{mnist.rst => mnist.md} | 0 docs/src/user-guide.md | 0 7 files changed, 20 insertions(+), 50 deletions(-) create mode 100644 docs/src/api.md create mode 100644 docs/src/tutorial.md rename docs/src/tutorial/{char-lstm.rst => char-lstm.md} (100%) rename docs/src/tutorial/{mnist.rst => mnist.md} (100%) create mode 100644 docs/src/user-guide.md diff --git a/docs/make.jl b/docs/make.jl index 1a20e2b93826..f5569035bc69 100644 --- a/docs/make.jl +++ b/docs/make.jl @@ -1,3 +1,5 @@ using Documenter, MXNet -makedocs() +makedocs( + modules = [MXNet] +) diff --git a/docs/src/api.md b/docs/src/api.md new file mode 100644 index 000000000000..2316d3eda140 --- /dev/null +++ b/docs/src/api.md @@ -0,0 +1,5 @@ +# API + +```@contents +Pages = ["api/context.md"] +``` diff --git a/docs/src/index.md b/docs/src/index.md index 7e95b6a7c10e..0ad69711e41c 100644 --- a/docs/src/index.md +++ b/docs/src/index.md @@ -1,55 +1,18 @@ -%%%%%%%%%%%%%%%%%%% -MXNet Documentation -%%%%%%%%%%%%%%%%%%% +# MXNet Documentation -`MXNet.jl `_ is `Julia -`_ package of `dmlc/mxnet -`_. MXNet.jl brings flexible and efficient GPU +[`MXNet.jl`](https://github.com/dmlc/MXNet.jl>) is the +[`Julia`](http://julialang.org/) package of +[`dmlc/mxnet`](https://github.com/dmlc/mxnet). `MXNet.jl` brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of features include: -- Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. -- Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. +* Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. +* Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. -For more details, see documentation below. Please also checkout the `examples -`_ directory. - -.. 
toctree:: - :maxdepth: 2 - :caption: Tutorials - - tutorial/mnist - tutorial/char-lstm - -.. toctree:: - :maxdepth: 2 - :caption: User's Guide - - user-guide/install - user-guide/overview - user-guide/faq - -.. toctree:: - :maxdepth: 1 - :caption: API Documentation - - api/context - api/model - api/initializer - api/optimizer - api/callback - api/metric - api/io - api/ndarray - api/symbolic-node - api/nn-factory - api/executor - api/visualize - -Indices and tables -================== - -* :ref:`genindex` -* :ref:`modindex` -* :ref:`search` +For more details, see documentation below. Please also checkout the +[examples](https://github.com/dmlc/MXNet.jl/tree/master/examples) directory. +```@contents +Pages = ["tutorial.md", "user-guide.md", "api.md"] +Depth = 2 +``` diff --git a/docs/src/tutorial.md b/docs/src/tutorial.md new file mode 100644 index 000000000000..e69de29bb2d1 diff --git a/docs/src/tutorial/char-lstm.rst b/docs/src/tutorial/char-lstm.md similarity index 100% rename from docs/src/tutorial/char-lstm.rst rename to docs/src/tutorial/char-lstm.md diff --git a/docs/src/tutorial/mnist.rst b/docs/src/tutorial/mnist.md similarity index 100% rename from docs/src/tutorial/mnist.rst rename to docs/src/tutorial/mnist.md diff --git a/docs/src/user-guide.md b/docs/src/user-guide.md new file mode 100644 index 000000000000..e69de29bb2d1 From 733d46d1d6f85923d423fe3b05631b0c219edced Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 12 Jul 2016 07:14:35 +0900 Subject: [PATCH 348/630] setup api docs with autodoc --- docs/src/api.md | 4 ++-- docs/src/api/callback.md | 6 ++++++ docs/src/api/context.md | 7 +++---- docs/src/api/executor.md | 6 ++++++ docs/src/api/initializer.md | 6 ++++++ docs/src/api/io.md | 6 ++++++ docs/src/api/kvstore.md | 6 ++++++ docs/src/api/metric.md | 6 ++++++ docs/src/api/model.md | 6 ++++++ docs/src/api/ndarry.md | 6 ++++++ docs/src/api/nn-factory.md | 6 ++++++ docs/src/api/optimizer.md | 10 ++++++++++ docs/src/api/optimizers/adam.md | 6 
++++++ docs/src/api/optimizers/sgd.md | 6 ++++++ docs/src/api/random.md | 6 ++++++ docs/src/api/symbolic-node.md | 6 ++++++ docs/src/api/visualize.md | 6 ++++++ 17 files changed, 99 insertions(+), 6 deletions(-) create mode 100644 docs/src/api/callback.md create mode 100644 docs/src/api/executor.md create mode 100644 docs/src/api/initializer.md create mode 100644 docs/src/api/io.md create mode 100644 docs/src/api/kvstore.md create mode 100644 docs/src/api/metric.md create mode 100644 docs/src/api/model.md create mode 100644 docs/src/api/ndarry.md create mode 100644 docs/src/api/nn-factory.md create mode 100644 docs/src/api/optimizer.md create mode 100644 docs/src/api/optimizers/adam.md create mode 100644 docs/src/api/optimizers/sgd.md create mode 100644 docs/src/api/random.md create mode 100644 docs/src/api/symbolic-node.md create mode 100644 docs/src/api/visualize.md diff --git a/docs/src/api.md b/docs/src/api.md index 2316d3eda140..fa48c540721a 100644 --- a/docs/src/api.md +++ b/docs/src/api.md @@ -1,5 +1,5 @@ -# API +# API Documentation ```@contents -Pages = ["api/context.md"] +Pages = ["api/context.md", "api/model.md", "api/initializers.md", "api/optimizers.md", "api/callbacks.md", "api/metric.md", "api/io.md", "api/ndarray.md", "api/symbolic-node.md", "api/nn-factory.md", "api/executor.md", "api/visualize.md"] ``` diff --git a/docs/src/api/callback.md b/docs/src/api/callback.md new file mode 100644 index 000000000000..f67811cc41fe --- /dev/null +++ b/docs/src/api/callback.md @@ -0,0 +1,6 @@ +# Callback in training + +```@autodocs +Modules = [MXNet.mx] +Pages = ["callback.jl"] +``` diff --git a/docs/src/api/context.md b/docs/src/api/context.md index 2c2ac8f7d7ac..93ccf83e51ba 100644 --- a/docs/src/api/context.md +++ b/docs/src/api/context.md @@ -1,7 +1,6 @@ # Context -```@docs -mx.Context -mx.cpu -mx.gpu +```@autodocs +Modules = [MXNet.mx] +Pages = ["context.jl"] ``` diff --git a/docs/src/api/executor.md b/docs/src/api/executor.md new file mode 100644 index 
000000000000..b560c7a0864d --- /dev/null +++ b/docs/src/api/executor.md @@ -0,0 +1,6 @@ +# Executor + +```@autodocs +Modules = [MXNet.mx] +Pages = ["executor.jl"] +``` diff --git a/docs/src/api/initializer.md b/docs/src/api/initializer.md new file mode 100644 index 000000000000..d0aad2def4cd --- /dev/null +++ b/docs/src/api/initializer.md @@ -0,0 +1,6 @@ +# Initializer + +```@autodocs +Modules = [MXNet.mx] +Pages = ["initializer.jl"] +``` diff --git a/docs/src/api/io.md b/docs/src/api/io.md new file mode 100644 index 000000000000..43439a930378 --- /dev/null +++ b/docs/src/api/io.md @@ -0,0 +1,6 @@ +# Data Providers + +```@autodocs +Modules = [MXNet.mx] +Pages = ["io.jl"] +``` diff --git a/docs/src/api/kvstore.md b/docs/src/api/kvstore.md new file mode 100644 index 000000000000..34a5027f85fb --- /dev/null +++ b/docs/src/api/kvstore.md @@ -0,0 +1,6 @@ +# Key-Value Store + +```@autodocs +Modules = [MXNet.mx] +Pages = ["kvstore.jl"] +``` diff --git a/docs/src/api/metric.md b/docs/src/api/metric.md new file mode 100644 index 000000000000..3c800b3a8152 --- /dev/null +++ b/docs/src/api/metric.md @@ -0,0 +1,6 @@ +# Evaluation Metrics + +```@autodocs +Modules = [MXNet.mx] +Pages = ["metric.jl"] +``` diff --git a/docs/src/api/model.md b/docs/src/api/model.md new file mode 100644 index 000000000000..739c3ea7bf9a --- /dev/null +++ b/docs/src/api/model.md @@ -0,0 +1,6 @@ +# Model + +```@autodocs +Modules = [MXNet.mx] +Pages = ["model.jl"] +``` diff --git a/docs/src/api/ndarry.md b/docs/src/api/ndarry.md new file mode 100644 index 000000000000..4c6832c58969 --- /dev/null +++ b/docs/src/api/ndarry.md @@ -0,0 +1,6 @@ +# NDArray API + +```@autodocs +Modules = [MXNet.mx] +Pages = ["ndarray.jl"] +``` diff --git a/docs/src/api/nn-factory.md b/docs/src/api/nn-factory.md new file mode 100644 index 000000000000..6aa6c4e5bb8e --- /dev/null +++ b/docs/src/api/nn-factory.md @@ -0,0 +1,6 @@ +# Neural Network Factory + +```@autodocs +Modules = [MXNet.mx] +Pages = ["nn-factory.jl"] +``` diff 
--git a/docs/src/api/optimizer.md b/docs/src/api/optimizer.md new file mode 100644 index 000000000000..b67a369587e4 --- /dev/null +++ b/docs/src/api/optimizer.md @@ -0,0 +1,10 @@ +# Optimizers + +```@contents +Pages = ["optimizers/adam.md", "optimizers/sgd.md"] +``` + +```@autodocs +Modules = [MXNet.mx] +Pages = ["optimizer.jl"] +``` diff --git a/docs/src/api/optimizers/adam.md b/docs/src/api/optimizers/adam.md new file mode 100644 index 000000000000..269d82a9c80e --- /dev/null +++ b/docs/src/api/optimizers/adam.md @@ -0,0 +1,6 @@ +# ADAM + +```@autodocs +Modules = [MXNet.mx] +Pages = ["adam.jl"] +``` diff --git a/docs/src/api/optimizers/sgd.md b/docs/src/api/optimizers/sgd.md new file mode 100644 index 000000000000..506c7b5c266d --- /dev/null +++ b/docs/src/api/optimizers/sgd.md @@ -0,0 +1,6 @@ +# Stochastic Gradient Descent + +```@autodocs +Modules = [MXNet.mx] +Pages = ["sgd.jl"] +``` diff --git a/docs/src/api/random.md b/docs/src/api/random.md new file mode 100644 index 000000000000..91372836c467 --- /dev/null +++ b/docs/src/api/random.md @@ -0,0 +1,6 @@ +# Random + +```@autodocs +Modules = [MXNet.mx] +Pages = ["random.jl"] +``` diff --git a/docs/src/api/symbolic-node.md b/docs/src/api/symbolic-node.md new file mode 100644 index 000000000000..ef731d9f7d00 --- /dev/null +++ b/docs/src/api/symbolic-node.md @@ -0,0 +1,6 @@ +# Symbolic API + +```@autodocs +Modules = [MXNet.mx] +Pages = ["symbolic-node.jl"] +``` diff --git a/docs/src/api/visualize.md b/docs/src/api/visualize.md new file mode 100644 index 000000000000..429a927012e4 --- /dev/null +++ b/docs/src/api/visualize.md @@ -0,0 +1,6 @@ +# Network Visualization + +```@autodocs +Modules = [MXNet.mx] +Pages = ["visualize.jl"] +``` From 9113b21721b8f39daf5a7238f755c9826e7dcc14 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 13 Jul 2016 02:44:50 +0900 Subject: [PATCH 349/630] rough first pass .rst -> .md --- docs/src/api/io.md | 3 + docs/src/api/metric.md | 4 + docs/src/api/model.md | 3 + 
docs/src/api/nn-factory.md | 5 +- docs/src/api/optimizer.md | 10 +- docs/src/api/random.md | 6 - src/callback.jl | 80 +++++---- src/executor.jl | 40 ++--- src/initializer.jl | 89 +++++----- src/io.jl | 105 +++++------ src/metric.jl | 63 +++---- src/model.jl | 109 ++++++------ src/ndarray.jl | 347 +++++++++++++++++-------------------- src/nn-factory.jl | 26 +-- src/optimizer.jl | 126 ++++++-------- src/symbolic-node.jl | 257 +++++++++++++-------------- src/visualize.jl | 17 +- 17 files changed, 583 insertions(+), 707 deletions(-) delete mode 100644 docs/src/api/random.md diff --git a/docs/src/api/io.md b/docs/src/api/io.md index 43439a930378..32a7d14f9144 100644 --- a/docs/src/api/io.md +++ b/docs/src/api/io.md @@ -1,5 +1,8 @@ # Data Providers +Data providers are wrappers that load external data, be it images, text, or general tensors, +and split it into mini-batches so that the model can consume the data in a uniformed way. + ```@autodocs Modules = [MXNet.mx] Pages = ["io.jl"] diff --git a/docs/src/api/metric.md b/docs/src/api/metric.md index 3c800b3a8152..63cca0cc41ba 100644 --- a/docs/src/api/metric.md +++ b/docs/src/api/metric.md @@ -1,5 +1,9 @@ # Evaluation Metrics +Evaluation metrics provide a way to evaluate the performance of a learned model. +This is typically used during training to monitor performance on the validation +set. + ```@autodocs Modules = [MXNet.mx] Pages = ["metric.jl"] diff --git a/docs/src/api/model.md b/docs/src/api/model.md index 739c3ea7bf9a..f793c7c406c7 100644 --- a/docs/src/api/model.md +++ b/docs/src/api/model.md @@ -1,5 +1,8 @@ # Model +The model API provides convenient high-level interface to do training and predicting on +a network described using the symbolic API. 
+ ```@autodocs Modules = [MXNet.mx] Pages = ["model.jl"] diff --git a/docs/src/api/nn-factory.md b/docs/src/api/nn-factory.md index 6aa6c4e5bb8e..41474383aa76 100644 --- a/docs/src/api/nn-factory.md +++ b/docs/src/api/nn-factory.md @@ -1,4 +1,7 @@ -# Neural Network Factory +# Neural Network Factora + +Neural network factory provide convenient helper functions to define +common neural networks. ```@autodocs Modules = [MXNet.mx] diff --git a/docs/src/api/optimizer.md b/docs/src/api/optimizer.md index b67a369587e4..043529a670c1 100644 --- a/docs/src/api/optimizer.md +++ b/docs/src/api/optimizer.md @@ -1,10 +1,12 @@ # Optimizers -```@contents -Pages = ["optimizers/adam.md", "optimizers/sgd.md"] -``` - ```@autodocs Modules = [MXNet.mx] Pages = ["optimizer.jl"] ``` + +## Built-in optimizers + +```@contents +Pages = ["optimizers/adam.md", "optimizers/sgd.md"] +``` diff --git a/docs/src/api/random.md b/docs/src/api/random.md deleted file mode 100644 index 91372836c467..000000000000 --- a/docs/src/api/random.md +++ /dev/null @@ -1,6 +0,0 @@ -# Random - -```@autodocs -Modules = [MXNet.mx] -Pages = ["random.jl"] -``` diff --git a/src/callback.jl b/src/callback.jl index e18184b1131a..3aca66a7bbf0 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -1,27 +1,22 @@ -#=doc -Callbacks in training -===================== -=# +""" + AbstractCallback -#=doc -.. class:: AbstractCallback - - Abstract type of callback functions used in training. -=# +Abstract type of callback functions used in training. +""" abstract AbstractCallback -#=doc -.. class:: AbstractBatchCallback +""" + AbstractBatchCallback - Abstract type of callbacks to be called every mini-batch. -=# +Abstract type of callbacks to be called every mini-batch. +""" abstract AbstractBatchCallback <: AbstractCallback -#=doc -.. class:: AbstractEpochCallback +""" + AbstractEpochCallback - Abstract type of callbacks to be called every epoch. -=# +Abstract type of callbacks to be called every epoch. 
+""" abstract AbstractEpochCallback <: AbstractCallback type BatchCallback <: AbstractBatchCallback @@ -30,15 +25,16 @@ type BatchCallback <: AbstractBatchCallback callback :: Function end -#=doc -.. function:: every_n_batch(callback :: Function, n :: Int; call_on_0 = false) +""" + every_n_batch(callback :: Function, n :: Int; call_on_0 = false) - A convenient function to construct a callback that runs every ``n`` mini-batches. +A convenient function to construct a callback that runs every ``n`` mini-batches. - :param Int call_on_0: keyword argument, default false. Unless set, the callback +# Arguments +* `call_on_0::Bool`: keyword argument, default false. Unless set, the callback will **not** be run on batch 0. - For example, the :func:`speedometer` callback is defined as +For example, the :func:`speedometer` callback is defined as .. code-block:: julia @@ -51,7 +47,7 @@ end end :seealso: :func:`every_n_epoch`, :func:`speedometer`. -=# +""" function every_n_batch(callback :: Function, n :: Int; call_on_0 :: Bool = false) BatchCallback(n, call_on_0, callback) end @@ -65,15 +61,16 @@ function Base.call(cb :: BatchCallback, state :: OptimizationState) end end -#=doc -.. function:: speedometer(; frequency=50) +""" + speedometer(; frequency=50) - Create an :class:`AbstractBatchCallback` that measure the training speed +Create an :class:`AbstractBatchCallback` that measure the training speed (number of samples processed per second) every k mini-batches. - :param Int frequency: keyword argument, default 50. The frequency (number of +# Arguments +* Int frequency: keyword argument, default 50. The frequency (number of min-batches) to measure and report the speed. -=# +""" function speedometer(;frequency::Int=50) cl_tic = 0 every_n_batch(frequency, call_on_0=true) do state :: OptimizationState @@ -95,18 +92,18 @@ type EpochCallback <: AbstractEpochCallback callback :: Function end -#=doc -.. 
function:: every_n_epoch(callback :: Function, n :: Int; call_on_0 = false) +""" + every_n_epoch(callback :: Function, n :: Int; call_on_0 = false) - A convenient function to construct a callback that runs every ``n`` full data-passes. +A convenient function to construct a callback that runs every ``n`` full data-passes. - :param Int call_on_0: keyword argument, default false. Unless set, the callback +* Int call_on_0: keyword argument, default false. Unless set, the callback will **not** be run on epoch 0. Epoch 0 means no training has been performed yet. This is useful if you want to inspect the randomly initialized model that has not seen any data yet. :seealso: :func:`every_n_iter`. -=# +""" function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end @@ -120,20 +117,21 @@ function Base.call{T<:Real}(cb :: EpochCallback, model :: Any, state :: Optimiza end end -#=doc -.. function:: do_checkpoint(prefix; frequency=1, save_epoch_0=false) +""" + do_checkpoint(prefix; frequency=1, save_epoch_0=false) - Create an :class:`AbstractEpochCallback` that save checkpoints of the model to disk. - The checkpoints can be loaded back later on. +Create an :class:`AbstractEpochCallback` that save checkpoints of the model to disk. +The checkpoints can be loaded back later on. - :param AbstractString prefix: the prefix of the filenames to save the model. The model +# Arguments +* `prefix::AbstractString`: the prefix of the filenames to save the model. The model architecture will be saved to prefix-symbol.json, while the weights will be saved to prefix-0012.params, for example, for the 12-th epoch. - :param Int frequency: keyword argument, default 1. The frequency (measured in epochs) to +* Int frequency: keyword argument, default 1. The frequency (measured in epochs) to save checkpoints. - :param Bool save_epoch_0: keyword argument, default false. 
Whether we should save a +* Bool save_epoch_0: keyword argument, default false. Whether we should save a checkpoint for epoch 0 (model initialized but not seen any data yet). -=# +""" function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) mkpath(dirname(prefix)) every_n_epoch(frequency, call_on_0=save_epoch_0) do model, state, metric diff --git a/src/executor.jl b/src/executor.jl index 86f3f65921f4..edebc79907c7 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -1,15 +1,10 @@ -#=doc -Executor -======== -=# - -#=doc -.. class:: Executor - - An executor is a realization of a symbolic architecture defined by a :class:`SymbolicNode`. - The actual forward and backward computation specified by the network architecture can - be carried out with an executor. -=# +""" + Executor + +An executor is a realization of a symbolic architecture defined by a :class:`SymbolicNode`. +The actual forward and backward computation specified by the network architecture can +be carried out with an executor. +""" type Executor handle :: MX_ExecutorHandle symbol :: SymbolicNode @@ -70,21 +65,22 @@ function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDA return (args_hdr, args_vec) end -#=doc -.. function:: bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) +""" + bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) - Create an :class:`Executor` by binding a :class:`SymbolicNode` to concrete :class:`NDArray`. +Create an :class:`Executor` by binding a :class:`SymbolicNode` to concrete :class:`NDArray`. - :param SymbolicNode sym: the network architecture describing the computation graph. - :param Context ctx: the context on which the computation should run. - :param args: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete +# Arguments +* `sym::SymbolicNode`: the network architecture describing the computation graph. 
+* `ctx::Context`: the context on which the computation should run. +* `args`: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete arrays for all the inputs in the network architecture. The inputs typically include network parameters (weights, bias, filters, etc.), data and labels. See :func:`list_arguments` and :func:`infer_shape`. - :param args_grad: TODO - :param aux_states: - :param grad_req: -=# +* `args_grad`: +* `aux_states`: +* `grad_req`: +""" @enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 function bind(self :: SymbolicNode, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), diff --git a/src/initializer.jl b/src/initializer.jl index 8be33bdf66d2..7ee9920a9d12 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -1,27 +1,20 @@ -#=doc -Initializers -============ -Interface ---------- -=# +""" + AbstractInitializer -#=doc -.. class:: AbstractInitializer - - The abstract base class for all initializers. +The abstract base class for all initializers. To define a new initializer, it is enough to derive a new type, and implement one or more of the following methods: -.. function:: _init_weight(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. function:: _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. function:: _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -.. 
function:: _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + _init_weight(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + _init_gamma(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + _init_beta(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) Or, if full behavior customization is needed, override the following function -.. function:: init(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) -=# + init(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) +""" abstract AbstractInitializer function init{T<:AbstractInitializer}(self :: T, name :: Base.Symbol, array :: NDArray) @@ -60,67 +53,63 @@ function _init_default(self :: AbstractInitializer, name :: Base.Symbol, array : error("Do not know how to init $name") end -#=doc -Built-in initializers ---------------------- -=# -#=doc -.. class:: UniformInitializer +""" + UniformInitializer - Initialize weights according to a uniform distribution within the provided scale. -=# +Initialize weights according to a uniform distribution within the provided scale. +""" immutable UniformInitializer <: AbstractInitializer scale :: AbstractFloat end -#=doc -.. function UniformInitializer(scale=0.07) +""" + UniformInitializer(scale=0.07) - Construct a :class:`UniformInitializer` with the specified scale. -=# +Construct a :class:`UniformInitializer` with the specified scale. +""" UniformInitializer() = UniformInitializer(0.07) function _init_weight(self :: UniformInitializer, name :: Base.Symbol, array :: NDArray) rand!(-self.scale, self.scale, array) end -#=doc -.. class:: NormalInitializer +""" + NormalInitializer - Initialize weights according to a univariate Gaussian distribution. -=# +Initialize weights according to a univariate Gaussian distribution. 
+""" immutable NormalInitializer <: AbstractInitializer μ :: AbstractFloat σ :: AbstractFloat end -#=doc -.. function:: NormalIninitializer(; mu=0, sigma=0.01) +""" + NormalIninitializer(; mu=0, sigma=0.01) - Construct a :class:`NormalInitializer` with mean ``mu`` and variance ``sigma``. -=# +Construct a :class:`NormalInitializer` with mean ``mu`` and variance ``sigma``. +""" NormalInitializer(; mu=0, sigma=0.01) = NormalInitializer(mu, sigma) function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) randn!(self.μ, self.σ, array) end -#=doc -.. class:: XavierInitializer +""" + XavierInitializer - The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding - the difficulty of training deep feedforward neuralnetworks*. +The initializer documented in the paper [Bengio and Glorot 2010]: *Understanding +the difficulty of training deep feedforward neuralnetworks*. - There are several different version of the XavierInitializer used in the wild. - The general idea is that the variance of the initialization distribution is controlled - by the dimensionality of the input and output. As a distribution one can either choose - a normal distribution with μ = 0 and σ² or a uniform distribution from -σ to σ. +There are several different version of the XavierInitializer used in the wild. +The general idea is that the variance of the initialization distribution is controlled +by the dimensionality of the input and output. As a distribution one can either choose +a normal distribution with μ = 0 and σ² or a uniform distribution from -σ to σ. - Several different ways of calculating the variance are given in the literature or are - used by various libraries. +Several different ways of calculating the variance are given in the literature or are +used by various libraries. - - [Bengio and Glorot 2010]: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1)`` - - [K. He, X. Zhang, S. Ren, and J. 
Sun 2015]: ``mx.XavierInitializer(distribution = mx.xv_gaussian, regularization = mx.xv_in, magnitude = 2)`` - - caffe_avg: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 3)`` -=# +* [Bengio and Glorot 2010]: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1)`` +* [K. He, X. Zhang, S. Ren, and J. Sun 2015]: ``mx.XavierInitializer(distribution = mx.xv_gaussian, regularization = mx.xv_in, magnitude = 2)`` +* caffe_avg: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 3)`` +""" @enum XavierDistribution xv_uniform xv_normal @enum XavierRegularization xv_avg xv_in xv_out diff --git a/src/io.jl b/src/io.jl index 46fbcfe86a2d..0e7d5c22490c 100644 --- a/src/io.jl +++ b/src/io.jl @@ -1,31 +1,21 @@ -#=doc -Data Providers -============== -Interface ---------- +""" + AbstractDataProvider -Data providers are wrappers that load external data, be it images, text, or general tensors, -and split it into mini-batches so that the model can consume the data in a uniformed way. -=# +The root type for all data provider. A data provider should implement the following interfaces: -#=doc -.. class:: AbstractDataProvider - - The root type for all data provider. A data provider should implement the following interfaces: - - .. function:: get_batch_size(provider) -> Int + get_batch_size(provider) -> Int :param AbstractDataProvider provider: the data provider. :return: the mini-batch size of the provided data. All the provided data should have the same mini-batch size (i.e. the last dimension). - .. function:: provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} + provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} :param AbstractDataProvider provider: the data provider. :return: a vector of (name, shape) pairs describing the names of the data it provides, and the corresponding shapes. - .. 
function:: provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} + provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} :param AbstractDataProvider provider: the data provider. :return: a vector of (name, shape) pairs describing the names of the labels it provides, and @@ -65,25 +55,25 @@ and split it into mini-batches so that the model can consume the data in a unifo The detailed interface functions for the iterator API is listed below: -.. function:: Base.eltype(provider) -> AbstractDataBatch + Base.eltype(provider) -> AbstractDataBatch :param AbstractDataProvider provider: the data provider. :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. -.. function:: Base.start(provider) -> AbstractDataProviderState + Base.start(provider) -> AbstractDataProviderState :param AbstractDataProvider provider: the data provider. This function is always called before iterating into the dataset. It should initialize the iterator, reset the index, and do data shuffling if needed. -.. function:: Base.done(provider, state) -> Bool + Base.done(provider, state) -> Bool :param AbstractDataProvider provider: the data provider. :param AbstractDataProviderState state: the state returned by :func:`Base.start` :func:`Base.next`. :return: true if there is no more data to iterate in this dataset. -.. function:: Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) + Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) :param AbstractDataProvider provider: the data provider. :return: the current data batch, and the state for the next iteration. @@ -118,29 +108,29 @@ of the built-in :class:`MXDataProvider` for example. # ... end end -=# +""" abstract AbstractDataProvider -#=doc -.. class:: AbstractDataProviderState +""" + AbstractDataProviderState Base type for data provider states. -=# +""" abstract AbstractDataProviderState -#=doc -.. 
class:: AbstractDataBatch +""" + AbstractDataBatch Base type for a data mini-batch. It should implement the following interfaces: - .. function:: count_samples(provider, batch) -> Int + count_samples(provider, batch) -> Int :param AbstractDataBatch batch: the data batch object. :return: the number of samples in this batch. This number should be greater than 0, but less than or equal to the batch size. This is used to indicate at the end of the data set, there might not be enough samples for a whole mini-batch. - .. function:: get_data(provider, batch) -> Vector{NDArray} + get_data(provider, batch) -> Vector{NDArray} :param AbstractDataProvider provider: the data provider. :param AbstractDataBatch batch: the data batch object. @@ -151,7 +141,7 @@ abstract AbstractDataProviderState :func:`count_samples` returns a value less than the batch size. In this case, the data provider is free to pad the remaining contents with any value. - .. function:: get_label(provider, batch) -> Vector{NDArray} + get_label(provider, batch) -> Vector{NDArray} :param AbstractDataProvider provider: the data provider. :param AbstractDataBatch batch: the data batch object. @@ -160,7 +150,7 @@ abstract AbstractDataProviderState The following utility functions will be automatically defined. - .. function:: get(provider, batch, name) -> NDArray + get(provider, batch, name) -> NDArray :param AbstractDataProvider provider: the data provider. :param AbstractDataBatch batch: the data batch object. @@ -169,7 +159,7 @@ abstract AbstractDataProviderState or :func:`provide_label() `. :return: the corresponding data array corresponding to that name. - .. function:: load_data!(provider, batch, targets) + load_data!(provider, batch, targets) :param AbstractDataProvider provider: the data provider. :param AbstractDataBatch batch: the data batch object. 
@@ -185,7 +175,7 @@ abstract AbstractDataProviderState This utility function is used in data parallelization, where a mini-batch is splited and computed on several different devices. - .. function:: load_label!(provider, batch, targets) + load_label!(provider, batch, targets) :param AbstractDataProvider provider: the data provider. :param AbstractDataBatch batch: the data batch object. @@ -193,15 +183,15 @@ abstract AbstractDataProviderState :type targets: Vector{Vector{SlicedNDArray}} The same as :func:`load_data!`, except that this is for loading labels. -=# +""" abstract AbstractDataBatch -#=doc -.. class:: DataBatch +""" + DataBatch A basic subclass of :class:`AbstractDataBatch`, that implement the interface by accessing member fields. -=# +""" type DataBatch <: AbstractDataBatch data :: Vector{NDArray} label :: Vector{NDArray} @@ -211,11 +201,11 @@ count_samples(batch :: DataBatch) = batch.count get_data{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batch.data get_label{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batch.label -#=doc -.. class:: SlicedNDArray +""" + SlicedNDArray A alias type of ``Tuple{UnitRange{Int},NDArray}``. -=# +""" typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} function _load_general!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, @@ -264,17 +254,11 @@ end eachbatch(provider :: AbstractDataProvider) = provider -#=doc -Built-in data providers ------------------------ -=# - -################################################################################ -#=doc -.. class:: ArrayDataProvider +""" + ArrayDataProvider A convenient tool to iterate :class:`NDArray` or Julia ``Array``. -=# +""" type ArrayDataProvider <: AbstractDataProvider data_arrays :: Vector{Array{MX_float}} data_names :: Vector{Base.Symbol} @@ -290,8 +274,8 @@ type ArrayDataProvider <: AbstractDataProvider label_batch :: Vector{NDArray} end -#=doc -.. 
function:: ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) +""" + ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) Construct a data provider from :class:`NDArray` or Julia Arrays. @@ -314,7 +298,7 @@ end TODO: remove ``data_padding`` and ``label_padding``, and implement rollover that copies the last or first several training samples to feed the padding. -=# +""" # Julia's type system is sometimes very frustrating. You cannot specify a function # with argument Vector{Pair} to expect to be matched when calling with the parameter # [:foo => zeros(2,3), :bar => zeros(3)] because the type inference gives very specific @@ -463,18 +447,12 @@ function get_label(provider :: ArrayDataProvider, batch :: ArrayDataBatch) end -#=doc -libmxnet data providers ------------------------ -=# - -################################################################################ -#=doc -.. class:: MXDataProvider +""" + MXDataProvider - A data provider that wrap built-in data iterators from libmxnet. See below for - a list of built-in data iterators. -=# +A data provider that wrap built-in data iterators from libmxnet. See below for +a list of built-in data iterators. +""" type MXDataProvider <: AbstractDataProvider handle :: MX_DataIterHandle data_shape :: Vector{Tuple{Base.Symbol, Tuple}} @@ -569,9 +547,6 @@ function count_samples(provider :: MXDataProvider, batch :: MXDataBatch) return provider.batch_size - Int(ref_pad[]) end -#=doc -**autogen:EMBED:io:EMBED:autogen** -=# function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) ref_name = Ref{char_p}(0) ref_desc = Ref{char_p}(0) diff --git a/src/metric.jl b/src/metric.jl index 1f601980ad13..21d5e4e34b14 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -1,17 +1,8 @@ -#=doc -Evaluation Metrics -================== +""" + AbstractEvalMetric -Evaluation metrics provide a way to evaluate the performance of a learned model. 
-This is typically used during training to monitor performance on the validation -set. -=# - -#=doc -.. class:: AbstractEvalMetric - - The base class for all evaluation metrics. The sub-types should implement the following - interfaces. +The base class for all evaluation metrics. The sub-types should implement the following +interfaces. .. function:: update!(metric, labels, preds) @@ -33,7 +24,7 @@ set. :return: ``Vector{Tuple{Base.Symbol, Real}}``, a list of name-value pairs. For example, ``[(:accuracy, 0.9)]``. -=# +""" abstract AbstractEvalMetric # Generic update! version @@ -49,14 +40,14 @@ function update!{T <: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray} end -#=doc -.. class:: Accuracy +""" + Accuracy - Multiclass classification accuracy. +Multiclass classification accuracy. - Calculates the mean accuracy per sample for softmax in one dimension. - For a multi-dimensional softmax the mean accuracy over all dimensions is calculated. -=# +Calculates the mean accuracy per sample for softmax in one dimension. +For a multi-dimensional softmax the mean accuracy over all dimensions is calculated. +""" type Accuracy <: AbstractEvalMetric acc_sum :: Float64 n_sample :: Int @@ -108,13 +99,13 @@ function reset!(metric :: Accuracy) metric.n_sample = 0 end -#=doc -.. class:: MSE +""" + MSE - Mean Squared Error. TODO: add support for multi-dimensional outputs. +Mean Squared Error. TODO: add support for multi-dimensional outputs. - Calculates the mean squared error regression loss in one dimension. -=# +Calculates the mean squared error regression loss in one dimension. +""" type MSE <: AbstractEvalMetric mse_sum :: Float64 @@ -144,13 +135,13 @@ function reset!(metric :: MSE) metric.n_sample = 0 end -#=doc -.. class:: ACE +""" + ACE - Averaged cross-entropy for classification. This also know als logloss. +Averaged cross-entropy for classification. This also know als logloss. - Calculated the averaged cross entropy for multi-dimentions output. 
-=# +Calculated the averaged cross entropy for multi-dimentions output. +""" type ACE <: AbstractEvalMetric ace_sum :: Float64 n_sample :: Int @@ -192,14 +183,14 @@ function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) end end -#=doc -.. class:: MultiACE +""" + MultiACE - Averaged cross-entropy for classification. This also know als logloss. - This variant keeps track of the different losses per class. +Averaged cross-entropy for classification. This also know als logloss. +This variant keeps track of the different losses per class. - Calculated the averaged cross entropy for multi-dimentions output. -=# +Calculated the averaged cross entropy for multi-dimentions output. +""" type MultiACE <: AbstractEvalMetric aces :: Vector{Float64} counts :: Vector{Int} diff --git a/src/model.jl b/src/model.jl index d9b81d02f3d9..ac96d047b668 100644 --- a/src/model.jl +++ b/src/model.jl @@ -1,27 +1,19 @@ -#=doc -Models -====== - -The model API provides convenient high-level interface to do training and predicting on -a network described using the symbolic API. -=# - -#=doc -.. class:: AbstractModel +""" + AbstractModel - The abstract super type of all models in MXNet.jl. -=# +The abstract super type of all models in MXNet.jl. +""" abstract AbstractModel -#=doc -.. class:: FeedForward +""" + FeedForward - The feedforward model provides convenient interface to train and predict on - feedforward architectures like multi-layer MLP, ConvNets, etc. There is no - explicitly handling of *time index*, but it is relatively easy to implement - unrolled RNN / LSTM under this framework (**TODO**: add example). For models - that handles sequential data explicitly, please use **TODO**... -=# +The feedforward model provides convenient interface to train and predict on +feedforward architectures like multi-layer MLP, ConvNets, etc. 
There is no +explicitly handling of *time index*, but it is relatively easy to implement +unrolled RNN / LSTM under this framework (**TODO**: add example). For models +that handles sequential data explicitly, please use **TODO**... +""" type FeedForward <: AbstractModel arch :: SymbolicNode ctx :: Vector{Context} @@ -35,9 +27,10 @@ type FeedForward <: AbstractModel FeedForward(arch :: SymbolicNode, ctx :: Vector{Context}) = new(arch, ctx) end -"""Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector - of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that - piece. +""" +Get a split of `batch_size` into `n_split` pieces for data parallelization. Returns a vector +of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that +piece. """ function _split_inputs(batch_size :: Int, n_split :: Int) @assert(batch_size >= n_split) @@ -51,14 +44,14 @@ function _split_inputs(batch_size :: Int, n_split :: Int) return idx end -#=doc -.. function:: FeedForward(arch :: SymbolicNode, ctx) +""" + FeedForward(arch :: SymbolicNode, ctx) - :param arch: the architecture of the network constructed using the symbolic API. - :param ctx: the devices on which this model should do computation. It could be a single :class:`Context` +* arch: the architecture of the network constructed using the symbolic API. +* ctx: the devices on which this model should do computation. It could be a single :class:`Context` or a list of :class:`Context` objects. In the latter case, data parallelization will be used for training. If no context is provided, the default context ``cpu()`` will be used. -=# +""" function FeedForward(arch :: SymbolicNode; context :: Union{Context, Vector{Context}, Void} = nothing) if isa(context, Void) context = [Context(CPU)] @@ -68,8 +61,8 @@ function FeedForward(arch :: SymbolicNode; context :: Union{Context, Vector{Cont FeedForward(arch, context) end -#=doc -.. 
function:: init_model(self, initializer; overwrite=false, input_shapes...) +""" + init_model(self, initializer; overwrite=false, input_shapes...) Initialize the weights in the model. @@ -77,12 +70,12 @@ end need to call this method unless one needs to inspect a model with only randomly initialized weights. - :param FeedForward self: the model to be initialized. - :param AbstractInitializer initializer: an initializer describing how the weights should be initialized. - :param Bool overwrite: keyword argument, force initialization even when weights already exists. - :param input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. +* FeedForward self: the model to be initialized. +* AbstractInitializer initializer: an initializer describing how the weights should be initialized. +* Bool overwrite: keyword argument, force initialization even when weights already exists. +* input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. For example, ``data=(28,28,1,100), label=(100,)``. -=# +""" function init_model(self :: FeedForward, initializer :: AbstractInitializer; overwrite::Bool=false, input_shapes...) # all arg names, including data, label, and parameters arg_names = list_arguments(self.arch) @@ -168,7 +161,7 @@ function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_sha end end -#=doc +""" .. function:: predict(self, data; overwrite=false, callback=nothing) @@ -182,9 +175,9 @@ end # consume or write batch_output to file end - :param FeedForward self: the model. - :param AbstractDataProvider data: the data to perform prediction on. - :param Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory +* FeedForward self: the model. +* AbstractDataProvider data: the data to perform prediction on. +* Bool overwrite: an :class:`Executor` is initialized the first time predict is called. 
The memory allocation of the :class:`Executor` depends on the mini-batch size of the test data provider. If you call predict twice with data provider of the same batch-size, then the executor can be potentially be re-used. So, if ``overwrite`` is false, @@ -209,7 +202,7 @@ end predict and synchronize the weights again. :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` -=# +""" function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = true) predict(self, data; overwrite = overwrite, callback=callback) end @@ -314,41 +307,41 @@ function _invoke_callbacks{T<:Real}(self::FeedForward, callbacks::Vector{Abstrac end end -#=doc -.. function:: train(model :: FeedForward, ...) +""" + train(model :: FeedForward, ...) - Alias to :func:`fit`. -=# +Alias to :func:`fit`. +""" function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) fit(self, optimizer, data; kwargs...) end -#=doc -.. function:: fit(model :: FeedForward, optimizer, data; kwargs...) +""" + fit(model :: FeedForward, optimizer, data; kwargs...) - Train the ``model`` on ``data`` with the ``optimizer``. +Train the ``model`` on ``data`` with the ``optimizer``. - :param FeedForward model: the model to be trained. - :param AbstractOptimizer optimizer: the optimization algorithm to use. - :param AbstractDataProvider data: the training data provider. - :param Int n_epoch: default 10, the number of full data-passes to run. - :param AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for +* FeedForward model: the model to be trained. +* AbstractOptimizer optimizer: the optimization algorithm to use. +* AbstractDataProvider data: the training data provider. +* Int n_epoch: default 10, the number of full data-passes to run. +* AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for the validation set. 
- :param AbstractEvalMetric eval_metric: keyword argument, default ``Accuracy()``. The metric used +* AbstractEvalMetric eval_metric: keyword argument, default ``Accuracy()``. The metric used to evaluate the training performance. If ``eval_data`` is provided, the same metric is also calculated on the validation set. - :param kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients +* kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients and parameters when multiple devices are used for training. :type kvstore: :class:`KVStore` or ``Base.Symbol`` - :param AbstractInitializer initializer: keyword argument, default ``UniformInitializer(0.01)``. - :param Bool force_init: keyword argument, default false. By default, the random initialization using the +* AbstractInitializer initializer: keyword argument, default ``UniformInitializer(0.01)``. +* Bool force_init: keyword argument, default false. By default, the random initialization using the provided ``initializer`` will be skipped if the model weights already exists, maybe from a previous call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When this option is set, it will always do random initialization at the begining of training. - :param callbacks: keyword argument, default ``[]``. Callbacks to be invoked at each epoch or mini-batch, +* callbacks: keyword argument, default ``[]``. Callbacks to be invoked at each epoch or mini-batch, see :class:`AbstractCallback`. :type callbacks: ``Vector{AbstractCallback}`` -=# +""" function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) opts = TrainingOptions(; kwargs...) diff --git a/src/ndarray.jl b/src/ndarray.jl index d78d647fe185..dacee56d7281 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,8 +1,3 @@ -#=doc -NDArray API -=========== -=# - # All the types supported by mshadow. 
typealias DType Union{Float32, Float64, Float16, UInt8, Int32} @enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 @@ -72,8 +67,8 @@ end ################################################################################ # NDArray Type ################################################################################ -#=doc -.. class:: NDArray +""" + NDArray Wrapper of the ``NDArray`` type in ``libmxnet``. This is the basic building block of tensor-based computation. @@ -88,7 +83,7 @@ end about shapes. For example, a mini-batch of 100 MNIST images is a tensor of C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory have shape (28,28,1,100). -=# +""" type NDArray handle :: MX_NDArrayHandle writable :: Bool @@ -115,11 +110,11 @@ Base.cconvert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) ################################################################################ # NDArray functions exported to the users ################################################################################ -#=doc -.. function:: context(arr :: NDArray) +""" + context(arr :: NDArray) Get the context that this :class:`NDArray` lives on. -=# +""" function context(arr :: NDArray) ref_typeid = Ref{Cint}(0) ref_devid = Ref{Cint}(0) @@ -129,14 +124,14 @@ function context(arr :: NDArray) end -#=doc +""" .. function:: empty(DType, shape :: Tuple, ctx :: Context) empty(DType, shape :: Tuple) empty(DType, dim1, dim2, ...) Allocate memory for an uninitialized :class:`NDArray` with a specified type. -=# +""" function empty{N,T<:DType}(::Type{T}, shape :: NTuple{N, Int}) empty(T, shape, cpu()) end @@ -147,14 +142,14 @@ function empty{T<:DType}(:: Type{T}, shape :: Int...) empty(T, shape) end -#=doc +""" .. function:: empty(shape :: Tuple, ctx :: Context) empty(shape :: Tuple) empty(dim1, dim2, ...) Allocate memory for an uninitialized :class:`NDArray` with specific shape of type Float32. 
-=# +""" function empty{N}(shape :: NTuple{N, Int}) empty(shape, cpu()) end @@ -165,19 +160,13 @@ function empty(shape :: Int...) empty(shape) end -#=doc -Interface functions similar to Julia Arrays -------------------------------------------- -=# - -#=doc -.. function:: - zeros(DType, shape :: Tuple, ctx :: Context) - zeros(DType, shape :: Tuple) - zeros(DType, dim1, dim2, ...) +""" + zeros(DType, shape :: Tuple, ctx :: Context) + zeros(DType, shape :: Tuple) + zeros(DType, dim1, dim2, ...) - Create zero-ed :class:`NDArray` with specific shape and type -=# +Create zero-ed :class:`NDArray` with specific shape and type +""" function zeros{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}) zeros(T, shape, cpu()) end @@ -190,14 +179,13 @@ function zeros{T<:DType}(:: Type{T}, shape :: Int...) zeros(T, shape) end -#=doc -.. function:: - zeros(shape :: Tuple, ctx :: Context) - zeros(shape :: Tuple) - zeros(dim1, dim2, ...) +""" + zeros(shape :: Tuple, ctx :: Context) + zeros(shape :: Tuple) + zeros(dim1, dim2, ...) - Create zero-ed :class:`NDArray` with specific shape. -=# +Create zero-ed :class:`NDArray` with specific shape. +""" function zeros{N}(shape :: NTuple{N, Int}) zeros(shape, cpu()) end @@ -210,14 +198,13 @@ function zeros(shape :: Int...) zeros(shape) end -#=doc -.. function:: - ones(DType, shape :: Tuple, ctx :: Context) - ones(DType, shape :: Tuple) - ones(DType, dim1, dim2, ...) +""" + ones(DType, shape :: Tuple, ctx :: Context) + ones(DType, shape :: Tuple) + ones(DType, dim1, dim2, ...) - Create an :class:`NDArray` with specific shape & type, and initialize with 1. -=# +Create an :class:`NDArray` with specific shape & type, and initialize with 1. +""" function ones{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}) ones(T, shape, cpu()) end @@ -230,14 +217,13 @@ function ones{T<:DType}(:: Type{T}, shape :: Int...) ones(T, shape) end -#=doc -.. function:: - ones(shape :: Tuple, ctx :: Context) - ones(shape :: Tuple) - ones(dim1, dim2, ...) 
+""" + ones(shape :: Tuple, ctx :: Context) + ones(shape :: Tuple) + ones(dim1, dim2, ...) - Create an :class:`NDArray` with specific shape and initialize with 1. -=# +Create an :class:`NDArray` with specific shape and initialize with 1. +""" function ones{N}(shape :: NTuple{N, Int}) ones(shape, cpu()) end @@ -252,14 +238,14 @@ end import Base: size, length, ndims, eltype -#=doc +""" .. function:: size(arr :: NDArray) size(arr :: NDArray, dim :: Int) Get the shape of an :class:`NDArray`. The shape is in Julia's column-major convention. See also the :ref:`notes on NDArray shapes `. -=# +""" function size(arr :: NDArray) ref_ndim = Ref{MX_uint}(0) ref_shape = Ref{Ptr{MX_uint}}(0) @@ -271,29 +257,29 @@ function size(arr :: NDArray, dim :: Int) size(arr)[dim] end -#=doc -.. function:: length(arr :: NDArray) +""" + length(arr :: NDArray) Get the number of elements in an :class:`NDArray`. -=# +""" function length(arr :: NDArray) prod(size(arr)) end -#=doc -.. function:: ndims(arr :: NDArray) +""" + ndims(arr :: NDArray) Get the number of dimensions of an :class:`NDArray`. Is equivalent to ``length(size(arr))``. -=# +""" function ndims(arr :: NDArray) length(size(arr)) end -#=doc -.. function:: eltype(arr :: NDArray) +""" + eltype(arr :: NDArray) Get the element type of an :class:`NDArray`. -=# +""" function eltype{T <: Union{NDArray, MX_NDArrayHandle}}(arr :: T) dtype_ref = Ref{Cint}(0) @mxcall(:MXNDArrayGetDType, (MX_handle, Ptr{Cint}), arr, dtype_ref) @@ -310,15 +296,15 @@ end import Base: slice -#=doc -.. function:: slice(arr :: NDArray, start:stop) +""" + slice(arr :: NDArray, start:stop) Create a view into a sub-slice of an :class:`NDArray`. Note only slicing at the slowest changing dimension is supported. In Julia's column-major perspective, this is the last dimension. For example, given an :class:`NDArray` of shape (2,3,4), ``slice(array, 2:3)`` will create a :class:`NDArray` of shape (2,3,2), sharing the data with the original array. 
This operation is used in data parallelization to split mini-batch into sub-batches for different devices. -=# +""" function slice(arr :: NDArray, ::Colon) arr end @@ -340,8 +326,8 @@ end import Base: setindex! -#=doc -.. function:: setindex!(arr :: NDArray, val, idx) +""" + setindex!(arr :: NDArray, val, idx) Assign values to an :class:`NDArray`. Elementwise assignment is not implemented, only the following scenarios are supported @@ -350,7 +336,7 @@ import Base: setindex! or :class:`NDArray`) of the same shape. - ``arr[start:stop] = val``: assignment to a *slice*, ``val`` could be a scalar or an array of the same shape to the slice. See also :func:`slice`. -=# +""" function setindex!(arr :: NDArray, val :: Real, ::Colon) @assert(arr.writable) _set_value(convert(eltype(arr), val), arr) @@ -366,10 +352,11 @@ function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, id setindex!(slice(arr, idx), val, Colon()) end -#=doc -.. function:: getindex(arr :: NDArray, idx) +import Base: getindex +""" + getindex(arr :: NDArray, idx) - Shortcut for :func:`slice`. A typical use is to write +Shortcut for :func:`slice`. A typical use is to write .. code-block:: julia @@ -392,29 +379,26 @@ end The behavior is quite different from indexing into Julia's ``Array``. For example, ``arr[2:5]`` create a **copy** of the sub-array for Julia ``Array``, while for :class:`NDArray`, this is a *slice* that shares the memory. -=# -import Base: getindex -"""Shortcut for `slice`. **NOTE** the behavior for Julia's built-in index slicing is to create a -copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. """ function getindex(arr :: NDArray, ::Colon) return arr end + +""" +Shortcut for `slice`. **NOTE** the behavior for Julia's built-in index slicing is to create a +copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. 
+""" function getindex(arr :: NDArray, idx::UnitRange{Int}) slice(arr, idx) end -#=doc -Copying functions ------------------ -=# import Base: copy!, copy, convert -#=doc +""" .. function:: copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) Copy contents of ``src`` into ``dst``. -=# +""" function copy!(dst :: NDArray, src :: NDArray) @assert(dst.writable) if dst.handle == src.handle @@ -456,7 +440,7 @@ function copy_ignore_shape!{T<:Real}(dst :: NDArray, src :: Array{T}) end -#=doc +""" .. function:: copy(arr :: NDArray) copy(arr :: NDArray, ctx :: Context) @@ -464,7 +448,7 @@ end Create a copy of an array. When no :class:`Context` is given, create a Julia ``Array``. Otherwise, create an :class:`NDArray` on the specified context. -=# +""" # Create copy: NDArray -> Julia Array function copy(arr :: NDArray) j_arr = Array{eltype(arr)}(size(arr)) @@ -483,31 +467,26 @@ function copy{T<:DType}(arr :: Array{T}, ctx :: Context) copy!(dst, arr) end -#=doc -.. function:: convert(::Type{Array{T}}, arr :: NDArray) +""" + convert(::Type{Array{T}}, arr :: NDArray) Convert an :class:`NDArray` into a Julia ``Array`` of specific type. Data will be copied. -=# +""" # Convert copy: NDArray -> Julia Array function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) convert(t, copy(arr)) end -#=doc -Basic arithmetics ------------------ -=# - -#=doc -.. function:: @inplace +""" + @inplace - Julia does not support re-definiton of ``+=`` operator (like ``__iadd__`` in python), - When one write ``a += b``, it gets translated to ``a = a+b``. ``a+b`` will allocate new - memory for the results, and the newly allocated :class:`NDArray` object is then assigned - back to a, while the original contents in a is discarded. This is very inefficient - when we want to do inplace update. +Julia does not support re-definiton of ``+=`` operator (like ``__iadd__`` in python), +When one write ``a += b``, it gets translated to ``a = a+b``. 
``a+b`` will allocate new +memory for the results, and the newly allocated :class:`NDArray` object is then assigned +back to a, while the original contents in a is discarded. This is very inefficient +when we want to do inplace update. - This macro is a simple utility to implement this behavior. Write +This macro is a simple utility to implement this behavior. Write .. code-block:: julia @@ -520,7 +499,7 @@ Basic arithmetics mx.add_to!(a, b) which will do inplace adding of the contents of ``b`` into ``a``. -=# +""" macro inplace(stmt) if stmt.head == :+= || stmt.head == :.+= Expr(:call, :add_to!, esc(stmt.args[1]), esc(stmt.args[2])) @@ -535,11 +514,11 @@ macro inplace(stmt) end end -#=doc -.. function:: add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) +""" + add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) - Add a bunch of arguments into ``dst``. Inplace updating. -=# +Add a bunch of arguments into ``dst``. Inplace updating. +""" function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) @assert dst.writable for arg in args @@ -552,16 +531,16 @@ function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) return dst end -#=doc -.. function:: - +(args...) - .+(args...) - - Summation. Multiple arguments of either scalar or :class:`NDArray` could be - added together. Note at least the first or second argument needs to be an :class:`NDArray` to - avoid ambiguity of built-in summation. -=# import Base: +, .+ + +""" + +(args...) + .+(args...) + +Summation. Multiple arguments of either scalar or :class:`NDArray` could be +added together. Note at least the first or second argument needs to be an :class:`NDArray` to +avoid ambiguity of built-in summation. +""" function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) ret = copy(arg0, context(arg0)) add_to!(ret, args...) @@ -576,11 +555,11 @@ function .+(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...) .+(arg1, arg0, args...) end -#=doc -.. 
function:: sub_from!(dst :: NDArray, args :: Union{Real, NDArray}...) +""" + sub_from!(dst :: NDArray, args :: Union{Real, NDArray}...) Subtract a bunch of arguments from ``dst``. Inplace updating. -=# +""" function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) @@ -590,16 +569,16 @@ function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) end end -#=doc -.. function:: - -(arg0, arg1) - -(arg0) - .-(arg0, arg1) - - Subtraction ``arg0 - arg1``, of scalar types or :class:`NDArray`. Or create - the negative of ``arg0``. -=# import Base: -, .- + +""" + -(arg0, arg1) + -(arg0) + .-(arg0, arg1) + +Subtraction ``arg0 - arg1``, of scalar types or :class:`NDArray`. Or create +the negative of ``arg0``. +""" function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) sub_from!(ret, arg1) @@ -620,12 +599,12 @@ function -(arg0 :: NDArray) _mul_scalar(arg0, -one(eltype(arg0))) end -#=doc -.. function:: mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) +""" + mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) Elementwise multiplication into ``dst`` of either a scalar or an :class:`NDArray` of the same shape. Inplace updating. -=# +""" function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) @@ -636,13 +615,13 @@ function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) return dst end -#=doc -.. function:: - .*(arg0, arg1) - - Elementwise multiplication of ``arg0`` and ``arg``, could be either scalar or :class:`NDArray`. -=# import Base: .*, * + +""" + .*(arg0, arg1) + +Elementwise multiplication of ``arg0`` and ``arg``, could be either scalar or :class:`NDArray`. +""" function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) mul_to!(ret, arg) @@ -651,13 +630,12 @@ function .*(arg0 :: Real, arg :: NDArray) .*(arg, arg0) end -#=doc -.. 
function:: - *(arg0, arg1) +""" + *(arg0, arg1) - Currently only multiplication a scalar with an :class:`NDArray` is implemented. Matrix multiplication - is to be added soon. -=# +Currently only multiplication a scalar with an :class:`NDArray` is implemented. Matrix multiplication +is to be added soon. +""" function *(arg0 :: NDArray, arg :: Real) ret = copy(arg0, context(arg0)) mul_to!(ret, arg) @@ -666,11 +644,11 @@ function *(arg0 :: Real, arg :: NDArray) *(arg, arg0) end -#=doc -.. function:: div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) +""" + div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) - Elementwise divide a scalar or an :class:`NDArray` of the same shape from ``dst``. Inplace updating. -=# +Elementwise divide a scalar or an :class:`NDArray` of the same shape from ``dst``. Inplace updating. +""" function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) @@ -681,31 +659,31 @@ function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) end import Base: ./, / -#=doc -.. function:: ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) +""" + ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) - Elementwise dividing an :class:`NDArray` by a scalar or another :class:`NDArray` of the same shape. -=# +Elementwise dividing an :class:`NDArray` by a scalar or another :class:`NDArray` of the same shape. +""" function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) div_from!(ret, arg) end -#=doc -.. function:: /(arg0 :: NDArray, arg :: Real) +""" + /(arg0 :: NDArray, arg :: Real) - Divide an :class:`NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. -=# +Divide an :class:`NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. +""" function /(arg0 :: NDArray, arg :: Real) ./(arg0, arg) end -#=doc +""" Manipulating as Julia Arrays ---------------------------- -.. 
function:: @nd_as_jl(captures..., statement) + @nd_as_jl(captures..., statement) A convenient macro that allows to operate :class:`NDArray` as Julia Arrays. For example, @@ -743,7 +721,7 @@ Manipulating as Julia Arrays - The statements are wrapped in a ``let``, thus locally introduced new variables will not be available after the statements. So you will need to declare the variables before calling the macro if needed. -=# +""" macro nd_as_jl(m_args...) @assert(length(m_args) > 0) stmts = m_args[end] @@ -831,18 +809,18 @@ function _wait_to_write(arr :: NDArray) @mxcall(:MXNDArrayWaitToWrite, (MX_handle,), arr) end -#=doc -.. function:: try_get_shared(arr) +""" + try_get_shared(arr) Try to create a Julia array by sharing the data with the underlying :class:`NDArray`. - :param NDArray arr: the array to be shared. +* NDArray arr: the array to be shared. .. warning:: The returned array does not guarantee to share data with the underlying :class:`NDArray`. In particular, data sharing is possible only when the :class:`NDArray` lives on CPU. -=# +""" function try_get_shared(arr :: NDArray) if context(arr).device_type == CPU # try to do data sharing @@ -854,14 +832,14 @@ function try_get_shared(arr :: NDArray) end end -#=doc -.. function:: is_shared(j_arr, arr) +""" + is_shared(j_arr, arr) Test whether ``j_arr`` is sharing data with ``arr``. - :param Array j_arr: the Julia Array. - :param NDArray arr: the :class:`NDArray`. -=# +* Array j_arr: the Julia Array. +* NDArray arr: the :class:`NDArray`. +""" function is_shared(j_arr :: Array, arr :: NDArray) false end @@ -875,24 +853,19 @@ function is_shared{T<:DType}(j_arr :: Array{T}, arr :: NDArray) return pointer(j_arr) == pointer(arr) end -#=doc -IO --- -=# -#=doc -.. function:: load(filename, ::Type{NDArray}) +""" + load(filename, ::Type{NDArray}) - Load NDArrays from binary file. +Load NDArrays from binary file. - :param AbstractString filename: the path of the file to load. It could be S3 or HDFS address. 
+* AbstractString filename: the path of the file to load. It could be S3 or HDFS address. :return: Either ``Dict{Base.Symbol, NDArray}`` or ``Vector{NDArray}``. - If the ``libmxnet`` is built with the corresponding component enabled. Examples - - * ``s3://my-bucket/path/my-s3-ndarray`` - * ``hdfs://my-bucket/path/my-hdfs-ndarray`` - * ``/path-to/my-local-ndarray`` -=# +If the ``libmxnet`` is built with the corresponding component enabled. Examples +* ``s3://my-bucket/path/my-s3-ndarray`` +* ``hdfs://my-bucket/path/my-hdfs-ndarray`` +* ``/path-to/my-local-ndarray`` +""" function load(filename::AbstractString, ::Type{NDArray}) out_size = Ref{MX_uint}(0) out_hdrs = Ref{Ptr{MX_handle}}(0) @@ -911,16 +884,16 @@ function load(filename::AbstractString, ::Type{NDArray}) end end -#=doc -.. function:: save(filename :: AbstractString, data) +""" + save(filename :: AbstractString, data) - Save NDarrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built - with corresponding support. +Save NDarrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built +with corresponding support. - :param AbstractString filename: path to the binary file to write to. - :param data: data to save to file. +* AbstractString filename: path to the binary file to write to. +* data: data to save to file. :type data: :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. 
-=# +""" function save(filename::AbstractString, data::NDArray) save(filename, [data]) end @@ -937,10 +910,6 @@ function save(filename::AbstractString, data::Dict{Base.Symbol,NDArray}) filename, length(names), arrays, names) end -#=doc -libmxnet APIs -------------- -=# ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -959,7 +928,7 @@ end # functions can overload them import Base: sqrt -#=doc +""" The libxmnet APIs are automatically imported from ``libmxnet.so``. The functions listed here operate on :class:`NDArray` objects. The arguments to the functions are typically ordered as @@ -985,9 +954,7 @@ Upon calling, the output arguments will be automatically initialized with empty Those functions always return the output arguments. If there is only one output (the typical situation), that object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. - -**autogen:EMBED:ndarray:EMBED:autogen** -=# +""" function _get_ndarray_functions() n = Ref{MX_uint}(0) diff --git a/src/nn-factory.jl b/src/nn-factory.jl index 3725587f37a1..b170214a1af9 100644 --- a/src/nn-factory.jl +++ b/src/nn-factory.jl @@ -1,33 +1,25 @@ -#=doc -Neural Networks Factory -======================= +""" + MLP(input, spec) -Neural network factory provide convenient helper functions to define -common neural networks. -=# +Construct a multi-layer perceptron. A MLP is a multi-layer neural network with +fully connected layers. -#=doc -.. function:: MLP(input, spec) - - Construct a multi-layer perceptron. A MLP is a multi-layer neural network with - fully connected layers. - - :param SymbolicNode input: the input to the mlp. - :param spec: the mlp specification, a list of hidden dimensions. For example, +* SymbolicNode input: the input to the mlp. 
+* spec: the mlp specification, a list of hidden dimensions. For example, ``[128, (512, :sigmoid), 10]``. The number in the list indicate the number of hidden units in each layer. A tuple could be used to specify the activation of each layer. Otherwise, the default activation will be used (except for the last layer). - :param Base.Symbol hidden_activation: keyword argument, default ``:relu``, indicating +* Base.Symbol hidden_activation: keyword argument, default ``:relu``, indicating the default activation for hidden layers. The specification here could be overwritten by layer-wise specification in the ``spec`` argument. Also activation is not applied to the last, i.e. the prediction layer. See :func:`Activation` for a list of supported activation types. - :param prefix: keyword argument, default ``gensym()``, used as the prefix to +* prefix: keyword argument, default ``gensym()``, used as the prefix to name the constructed layers. :return: the constructed MLP. -=# +""" function MLP(input, spec; hidden_activation::Base.Symbol=:relu, prefix=gensym()) spec = convert(Vector{Union{Int,Tuple}}, spec) diff --git a/src/optimizer.jl b/src/optimizer.jl index 887fd9ab59e0..e2fc44338a2f 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -1,37 +1,28 @@ -#=doc -Optimizers -========== +""" + AbstractOptimizer -Common interfaces ------------------ -=# - - -#=doc -.. class:: AbstractOptimizer - - Base type for all optimizers. -=# +Base type for all optimizers. +""" abstract AbstractOptimizer -#=doc -.. class:: AbstractLearningRateScheduler +""" + AbstractLearningRateScheduler - Base type for all learning rate scheduler. -=# +Base type for all learning rate scheduler. +""" abstract AbstractLearningRateScheduler -#=doc -.. class:: AbstractMomentumScheduler +""" + AbstractMomentumScheduler - Base type for all momentum scheduler. -=# +Base type for all momentum scheduler. +""" abstract AbstractMomentumScheduler -#=doc -.. class:: OptimizationState +""" + OptimizationState .. 
attribute:: batch_size @@ -54,7 +45,7 @@ abstract AbstractMomentumScheduler The current iteration count. One iteration corresponds to one mini-batch, but unlike the mini-batch count, the iteration count does **not** reset in each epoch. So it track the *total* number of mini-batches seen so far. -=# +""" type OptimizationState batch_size :: Int curr_epoch :: Int @@ -64,13 +55,14 @@ end OptimizationState(batch_size::Int) = OptimizationState(batch_size, 0, 0, 0) -#=doc -.. function:: get_learning_rate(scheduler, state) +""" + get_learning_rate(scheduler, state) - :param AbstractLearningRateScheduler scheduler: a learning rate scheduler. - :param OptimizationState state: the current state about epoch, mini-batch and iteration count. +# Arguments +* AbstractLearningRateScheduler scheduler: a learning rate scheduler. +* OptimizationState state: the current state about epoch, mini-batch and iteration count. :return: the current learning rate. -=# +""" function get_learning_rate end @@ -79,22 +71,22 @@ end module LearningRate import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate -#=doc -.. class:: LearningRate.Fixed +""" + LearningRate.Fixed Fixed learning rate scheduler always return the same learning rate. -=# +""" type Fixed <: AbstractLearningRateScheduler learning_rate :: Float64 end get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rate -#=doc -.. class:: LearningRate.Exp +""" + LearningRate.Exp :math:`\eta_t = \eta_0\gamma^t`. Here :math:`t` is the epoch count, or the iteration count if ``decay_on_iteration`` is set to true. -=# +""" type Exp <: AbstractLearningRateScheduler learning_rate :: Float64 gamma :: Float64 @@ -106,13 +98,13 @@ function Exp(base_lr::Real; gamma::Real=0.9, decay_on_iteration::Bool=false) end get_learning_rate(self :: Exp, state :: OptimizationState) = self.learning_rate * self.gamma ^ (self.on_iteration ? state.curr_iter : state.curr_epoch) -#=doc -.. 
class:: LearningRate.Inv +""" + LearningRate.Inv :math:`\eta_t = \eta_0 * (1 + \gamma * t)^(-power)`. Here :math:`t` is the epoch count, or the iteration count if ``decay_on_iteration`` is set to true. -=# +""" type Inv <: AbstractLearningRateScheduler learning_rate :: Float64 gamma :: Float64 @@ -137,13 +129,13 @@ function get_lr_scheduler(scheduler :: Any, lr :: Real) end -#=doc -.. function:: get_momentum(scheduler, state) +""" + get_momentum(scheduler, state) - :param AbstractMomentumScheduler scheduler: the momentum scheduler. - :param OptimizationState state: the state about current epoch, mini-batch and iteration count. +* AbstractMomentumScheduler scheduler: the momentum scheduler. +* OptimizationState state: the state about current epoch, mini-batch and iteration count. :return: the current momentum. -=# +""" function get_momentum end @@ -153,21 +145,21 @@ end module Momentum import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum -#=doc -.. class:: Momentum.Null +""" + Momentum.Null The null momentum scheduler always returns 0 for momentum. It is also used to explicitly indicate momentum should not be used. -=# +""" type Null <: AbstractMomentumScheduler end get_momentum(self :: Null, state :: OptimizationState) = 0.0 -#=doc -.. class:: Momentum.Fixed +""" + Momentum.Fixed Fixed momentum scheduler always returns the same value. -=# +""" type Fixed <: AbstractMomentumScheduler momentum :: Float64 end @@ -185,14 +177,14 @@ function get_momentum_scheduler(scheduler :: Any, momentum :: Real) end -#=doc -.. function:: get_updater(optimizer) +""" + get_updater(optimizer) - :param AbstractOptimizer optimizer: the underlying optimizer. +* AbstractOptimizer optimizer: the underlying optimizer. A utility function to create an updater function, that uses its closure to store all the states needed for each weights. 
-=# +""" function get_updater(optimizer :: AbstractOptimizer) states = Dict{Int,Any}() function updater(index :: Int, grad :: NDArray, weight :: NDArray) @@ -204,30 +196,24 @@ function get_updater(optimizer :: AbstractOptimizer) return updater end -################################################################################ -#=doc -Built-in optimizers -------------------- -=# - -#=doc -.. class:: AbstractOptimizerOptions +""" + AbstractOptimizerOptions - Base class for all optimizer options. -=# +Base class for all optimizer options. +""" abstract AbstractOptimizerOptions -#=doc -.. function:: normalized_gradient(opts, state, grad) +""" + normalized_gradient(opts, state, grad) - :param AbstractOptimizerOptions opts: options for the optimizer, should contain the field +* AbstractOptimizerOptions opts: options for the optimizer, should contain the field ``grad_scale``, ``grad_clip`` and ``weight_decay``. - :param OptimizationState state: the current optimization state. - :param NDArray weight: the trainable weights. - :param NDArray grad: the original gradient of the weights. +* OptimizationState state: the current optimization state. +* NDArray weight: the trainable weights. +* NDArray grad: the original gradient of the weights. Get the properly normalized gradient (re-scaled and clipped if necessary). -=# +""" function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState, weight::NDArray, grad::NDArray) grad_scale = 1.0 / state.batch_size diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 5bd1a6120f0e..850379899642 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -1,13 +1,8 @@ -#=doc -Symbolic API -============ -=# +""" + SymbolicNode -#=doc -.. class:: SymbolicNode - - SymbolicNode is the basic building block of the symbolic graph in MXNet.jl. -=# +SymbolicNode is the basic building block of the symbolic graph in MXNet.jl. 
+""" type SymbolicNode handle :: MX_SymbolHandle end @@ -17,34 +12,33 @@ end Base.convert(t::Type{MX_handle}, obj::SymbolicNode) = Base.unsafe_convert(t, obj) Base.cconvert(t::Type{MX_handle}, obj::SymbolicNode) = Base.unsafe_convert(t, obj) -#=doc -.. function:: deepcopy(self :: SymbolicNode) +""" + deepcopy(self :: SymbolicNode) - Make a deep copy of a SymbolicNode. -=# +Make a deep copy of a SymbolicNode. +""" function Base.deepcopy(self :: SymbolicNode) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCopy, (MX_handle, Ref{MX_handle}), self, ref_hdr) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -#=doc -.. function:: copy(self :: SymbolicNode) +""" + copy(self :: SymbolicNode) - Make a copy of a SymbolicNode. The same as making a deep copy. -=# +Make a copy of a SymbolicNode. The same as making a deep copy. +""" function Base.copy(self :: SymbolicNode) Base.deepcopy(self) end -#=doc -.. function:: - call(self :: SymbolicNode, args :: SymbolicNode...) - call(self :: SymbolicNode; kwargs...) +""" + call(self :: SymbolicNode, args :: SymbolicNode...) + call(self :: SymbolicNode; kwargs...) - Make a new node by composing ``self`` with ``args``. Or the arguments - can be specified using keyword arguments. -=# +Make a new node by composing ``self`` with ``args``. Or the arguments +can be specified using keyword arguments. +""" function Base.call(self :: SymbolicNode, args :: SymbolicNode...) s = deepcopy(self) _compose!(s, args...) @@ -67,67 +61,67 @@ macro _list_symbol_info(self, func_name) end end -#=doc -.. function:: list_arguments(self :: SymbolicNode) +""" + list_arguments(self :: SymbolicNode) - List all the arguments of this node. The argument for a node contains both - the inputs and parameters. For example, a :class:`FullyConnected` node will - have both data and weights in its arguments. A composed node (e.g. a MLP) will - list all the arguments for intermediate nodes. +List all the arguments of this node. 
The argument for a node contains both +the inputs and parameters. For example, a :class:`FullyConnected` node will +have both data and weights in its arguments. A composed node (e.g. a MLP) will +list all the arguments for intermediate nodes. :return: A list of symbols indicating the names of the arguments. -=# +""" function list_arguments(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListArguments) end -#=doc -.. function:: list_outputs(self :: SymbolicNode) +""" + list_outputs(self :: SymbolicNode) - List all the outputs of this node. +List all the outputs of this node. :return: A list of symbols indicating the names of the outputs. -=# +""" function list_outputs(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListOutputs) end -#=doc -.. function:: list_auxiliary_states(self :: SymbolicNode) +""" + list_auxiliary_states(self :: SymbolicNode) - List all auxiliary states in the symbool. +List all auxiliary states in the symbool. - Auxiliary states are special states of symbols that do not corresponds to an argument, - and do not have gradient. But still be useful for the specific operations. - A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. - Most operators do not have Auxiliary states. +Auxiliary states are special states of symbols that do not corresponds to an argument, +and do not have gradient. But still be useful for the specific operations. +A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. +Most operators do not have Auxiliary states. :return: A list of symbols indicating the names of the auxiliary states. -=# +""" function list_auxiliary_states(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListAuxiliaryStates) end -#=doc -.. function:: get_internals(self :: SymbolicNode) +""" + get_internals(self :: SymbolicNode) - Get a new grouped :class:`SymbolicNode` whose output contains all the internal outputs of - this :class:`SymbolicNode`. 
-=# +Get a new grouped :class:`SymbolicNode` whose output contains all the internal outputs of +this :class:`SymbolicNode`. +""" function get_internals(self :: SymbolicNode) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolGetInternals, (MX_handle, Ref{MX_handle}), self, ref_hdr) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -#=doc -.. function:: get_attr(self :: SymbolicNode, key :: Symbol) +""" + get_attr(self :: SymbolicNode, key :: Symbol) - Get attribute attached to this :class:`SymbolicNode` belonging to key. - :return: The value belonging to key as a :class:`Nullable`. -=# +Get attribute attached to this :class:`SymbolicNode` belonging to key. +:return: The value belonging to key as a :class:`Nullable`. +""" function get_attr(self :: SymbolicNode, key :: Symbol) key_s = @compat String(string(key)) ref_out = Ref{Cstring}() @@ -141,12 +135,12 @@ function get_attr(self :: SymbolicNode, key :: Symbol) end end -#=doc -.. function: list_attr(self :: SymbolicNode) +""" + list_attr(self :: SymbolicNode) - Get all attributes from a symbol. - :return: Dictionary of attributes. -=# +Get all attributes from a symbol. +:return: Dictionary of attributes. +""" function list_attr(self :: SymbolicNode) ref_sz = Ref{MX_uint}(0) ref_strings = Ref{char_pp}(0) @@ -163,12 +157,12 @@ function list_attr(self :: SymbolicNode) return out end -#=doc -.. function: list_all_attr(self :: SymbolicNode) +""" + list_all_attr(self :: SymbolicNode) - Get all attributes from the symbol graph. - :return: Dictionary of attributes. -=# +Get all attributes from the symbol graph. +:return: Dictionary of attributes. +""" function list_all_attr(self :: SymbolicNode) ref_sz = Ref{MX_uint}(0) ref_strings = Ref{char_pp}(0) @@ -185,18 +179,17 @@ function list_all_attr(self :: SymbolicNode) return out end -#=doc -.. function:: set_attr(self:: SymbolicNode, key :: Symbol, value :: AbstractString) - - Set the attribute key to value for this :class:`SymbolicNode`. 
+""" + set_attr(self:: SymbolicNode, key :: Symbol, value :: AbstractString) - .. warning:: +Set the attribute key to value for this :class:`SymbolicNode`. - It is encouraged not to call this function directly, unless you know exactly what you are doing. The - recommended way of setting attributes is when creating the :class:`SymbolicNode`. Changing - the attributes of a :class:`SymbolicNode` that is already been used somewhere else might - cause unexpected behavior and inconsistency. -=# +# Warning +It is encouraged not to call this function directly, unless you know exactly what you are doing. The +recommended way of setting attributes is when creating the :class:`SymbolicNode`. Changing +the attributes of a :class:`SymbolicNode` that is already been used somewhere else might +cause unexpected behavior and inconsistency. +""" function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) key_s = @compat String(string(key)) value_s = @compat String(value) @@ -204,14 +197,15 @@ function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) @mxcall(:MXSymbolSetAttr, (MX_handle, Cstring, Cstring), self, key_s, value_s) end -#=doc -.. function:: Variable(name :: Union{Symbol, AbstractString}) +""" + Variable(name :: Union{Symbol, AbstractString}) - Create a symbolic variable with the given name. This is typically used as a placeholder. - For example, the data node, acting as the starting point of a network architecture. +Create a symbolic variable with the given name. This is typically used as a placeholder. +For example, the data node, acting as the starting point of a network architecture. - :param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`Variable`. -=# +# Arguments +* Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`Variable`. 
+""" function Variable(name :: Union{Symbol, AbstractString}; attrs = Dict()) attrs = convert(Dict{Symbol, AbstractString}, attrs) hdr_ref = Ref{MX_handle}(0) @@ -223,11 +217,11 @@ function Variable(name :: Union{Symbol, AbstractString}; attrs = Dict()) node end -#=doc -.. function:: Group(nodes :: SymbolicNode...) +""" + Group(nodes :: SymbolicNode...) - Create a :class:`SymbolicNode` by grouping nodes together. -=# +Create a :class:`SymbolicNode` by grouping nodes together. +""" function Group(nodes :: SymbolicNode...) handles = MX_handle[nodes...] ref_hdr = Ref{MX_handle}(0) @@ -279,20 +273,19 @@ function _infer_shape(self, keys, indptr, sdata) end end -#=doc -.. function:: - infer_shape(self :: SymbolicNode, args...) - infer_shape(self :: SymbolicNode; kwargs...) +""" + infer_shape(self :: SymbolicNode, args...) + infer_shape(self :: SymbolicNode; kwargs...) - Do shape inference according to the input shapes. The input shapes could be provided - as a list of shapes, which should specify the shapes of inputs in the same order as - the arguments returned by :func:`list_arguments`. Alternatively, the shape information - could be specified via keyword arguments. +Do shape inference according to the input shapes. The input shapes could be provided +as a list of shapes, which should specify the shapes of inputs in the same order as +the arguments returned by :func:`list_arguments`. Alternatively, the shape information +could be specified via keyword arguments. - :return: A 3-tuple containing shapes of all the arguments, shapes of all the outputs and - shapes of all the auxiliary variables. If shape inference failed due to incomplete - or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. -=# +:return: A 3-tuple containing shapes of all the arguments, shapes of all the outputs and + shapes of all the auxiliary variables. 
If shape inference failed due to incomplete + or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. +""" function infer_shape(self :: SymbolicNode; kwargs...) sdata = MX_uint[] indptr = MX_uint[0] @@ -348,20 +341,19 @@ function _infer_type(self, keys, arg_type_data) end end -#=doc -.. function:: - infer_type(self :: SymbolicNode; kwargs...) - infer_type(self :: SymbolicNode, args...) +""" + infer_type(self :: SymbolicNode; kwargs...) + infer_type(self :: SymbolicNode, args...) - Do type inference according to the input types. The input types could be provided - as a list of types, which should specify the types of inputs in the same order as - the arguments returned by :func:`list_arguments`. Alternatively, the type information - could be specified via keyword arguments. +Do type inference according to the input types. The input types could be provided +as a list of types, which should specify the types of inputs in the same order as +the arguments returned by :func:`list_arguments`. Alternatively, the type information +could be specified via keyword arguments. - :return: A 3-tuple containing types of all the arguments, types of all the outputs and - types of all the auxiliary variables. If type inference failed due to incomplete - or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. -=# +:return: A 3-tuple containing types of all the arguments, types of all the outputs and + types of all the auxiliary variables. If type inference failed due to incomplete + or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. +""" function infer_type(self :: SymbolicNode; kwargs...) types = Cint[toTypeFlag(x[2]) for x in kwargs] keys = AbstractString[string(x[1]) for x in kwargs] @@ -379,14 +371,13 @@ function infer_type(self :: SymbolicNode, args :: Union{Tuple, Void}...) _infer_type(self, keys, types) end -#=doc -.. 
function:: - getindex(self :: SymbolicNode, idx :: Union{Int, Base.Symbol, AbstractString}) +""" + getindex(self :: SymbolicNode, idx :: Union{Int, Base.Symbol, AbstractString}) - Get a node representing the specified output of this node. The index could be - a symbol or string indicating the name of the output, or a 1-based integer - indicating the index, as in the list of :func:`list_outputs`. -=# +Get a node representing the specified output of this node. The index could be +a symbol or string indicating the name of the output, or a 1-based integer +indicating the index, as in the list of :func:`list_outputs`. +""" function Base.getindex(self :: SymbolicNode, idx :: Union{Base.Symbol, AbstractString}) idx = Symbol(idx) i_idx = find(idx .== list_outputs(self)) @@ -529,54 +520,48 @@ function _compose!(node :: SymbolicNode, name :: Union{Base.Symbol, char_p}, arg return node end -#=doc -.. function:: to_json(self :: SymbolicNode) +""" + to_json(self :: SymbolicNode) - Convert a :class:`SymbolicNode` into a JSON string. -=# +Convert a :class:`SymbolicNode` into a JSON string. +""" function to_json(self :: SymbolicNode) ref_json = Ref{char_p}(0) @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json) return @compat String(ref_json[]) end -#=doc -.. function:: from_json(repr :: AbstractString, ::Type{SymbolicNode}) +""" + from_json(repr :: AbstractString, ::Type{SymbolicNode}) - Load a :class:`SymbolicNode` from a JSON string representation. -=# +Load a :class:`SymbolicNode` from a JSON string representation. +""" function from_json(repr :: AbstractString, ::Type{SymbolicNode}) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateFromJSON, (char_p, Ref{MX_handle}), repr, ref_hdr) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -#=doc -.. function:: load(filename :: AbstractString, ::Type{SymbolicNode}) +""" + load(filename :: AbstractString, ::Type{SymbolicNode}) - Load a :class:`SymbolicNode` from a JSON file. 
-=# +Load a :class:`SymbolicNode` from a JSON file. +""" function load(filename :: AbstractString, ::Type{SymbolicNode}) ref_hdr = Ref{MX_handle}(0) @mxcall(:MXSymbolCreateFromFile, (char_p, Ref{MX_handle}), filename, ref_hdr) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -#=doc -.. function:: save(filename :: AbstractString, node :: SymbolicNode) +""" + save(filename :: AbstractString, node :: SymbolicNode) - Save a :class:`SymbolicNode` to a JSON file. -=# +Save a :class:`SymbolicNode` to a JSON file. +""" function save(filename :: AbstractString, node :: SymbolicNode) @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), node, filename) end -#=doc -libmxnet APIs -------------- - -**autogen:EMBED:symbolic-node:EMBED:autogen** -=# ################################################################################ # Atomic SymbolicNode functions dynamically imported from libmxnet ################################################################################ diff --git a/src/visualize.jl b/src/visualize.jl index 3d46b9c38cb3..15f23c6bfffc 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -1,21 +1,16 @@ import JSON -#=doc -Network Visualization -===================== -=# +""" + to_graphviz(network) -#=doc -.. function:: to_graphviz(network) - - :param SymbolicNode network: the network to visualize. - :param AbstractString title: keyword argument, default "Network Visualization", +* SymbolicNode network: the network to visualize. +* AbstractString title: keyword argument, default "Network Visualization", the title of the GraphViz graph. - :param input_shapes: keyword argument, default ``nothing``. If provided, +* input_shapes: keyword argument, default ``nothing``. If provided, will run shape inference and plot with the shape information. Should be either a dictionary of name-shape mapping or an array of shapes. :return: the graph description in GraphViz ``dot`` language. 
-=# +""" function to_graphviz(network :: SymbolicNode; title="Network Visualization", input_shapes=nothing) if !isa(input_shapes, Void) internals = get_internals(network) From d8de74250c059aa2916d596c60b08720063da046 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 13 Jul 2016 02:58:29 +0900 Subject: [PATCH 350/630] improve autogenerated documentation --- src/util.jl | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/util.jl b/src/util.jl index 73c3316fa9f7..13ce10f58a77 100644 --- a/src/util.jl +++ b/src/util.jl @@ -67,12 +67,12 @@ function _format_typestring(typestr :: AbstractString) replace(typestr, r"\bSymbol\b", "SymbolicNode") end function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{char_pp}, arg_descs::Ref{char_pp}, remove_dup::Bool=true) - param_keys = Set{AbstractString}() + param_keys = Set{String}() arg_names = pointer_to_array(arg_names[], narg) arg_types = pointer_to_array(arg_types[], narg) arg_descs = pointer_to_array(arg_descs[], narg) - docstrings = AbstractString[] + docstrings = String[] for i = 1:narg arg_name = @compat String(arg_names[i]) @@ -83,7 +83,7 @@ function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{ch arg_type = _format_typestring(@compat String(arg_types[i])) arg_desc = @compat String(arg_descs[i]) - push!(docstrings, ":param $arg_name: $arg_desc\n:type $arg_name: $arg_type\n\n") + push!(docstrings, "* `$arg_name::$arg_type`: $arg_desc\n") end return join(docstrings, "\n") end From 597c7366b4c023acb67155e03a3c7faab454bf75 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 13 Jul 2016 04:00:20 +0900 Subject: [PATCH 351/630] convert rst to md with pandoc --- docs/src/tutorial/char-lstm.md | 574 ++++++++++++++----------------- docs/src/tutorial/mnist.md | 455 ++++++++++++------------ docs/src/user-guide/faq.md | 8 + docs/src/user-guide/faq.rst | 7 - docs/src/user-guide/install.md | 67 ++++ docs/src/user-guide/install.rst | 56 --- 
docs/src/user-guide/overview.md | 412 ++++++++++++++++++++++ docs/src/user-guide/overview.rst | 376 -------------------- 8 files changed, 980 insertions(+), 975 deletions(-) create mode 100644 docs/src/user-guide/faq.md delete mode 100644 docs/src/user-guide/faq.rst create mode 100644 docs/src/user-guide/install.md delete mode 100644 docs/src/user-guide/install.rst create mode 100644 docs/src/user-guide/overview.md delete mode 100644 docs/src/user-guide/overview.rst diff --git a/docs/src/tutorial/char-lstm.md b/docs/src/tutorial/char-lstm.md index 5b1c348e5568..5c20c8f05830 100644 --- a/docs/src/tutorial/char-lstm.md +++ b/docs/src/tutorial/char-lstm.md @@ -1,368 +1,308 @@ Generating Random Sentence with LSTM RNN ======================================== -This tutorial shows how to train a LSTM (Long short-term memory) RNN (recurrent -neural network) to perform character-level sequence training and prediction. The -original model, usually called ``char-rnn`` is described in `Andrej Karpathy's -blog `_, with -a reference implementation in Torch available `here -`_. - -Because MXNet.jl does not have a specialized model for recurrent neural networks -yet, the example shown here is an implementation of LSTM by using the default -:class:`FeedForward` model via explicitly unfolding over time. We will be using -fixed-length input sequence for training. The code is adapted from the `char-rnn -example for MXNet's Python binding -`_, which -demonstrates how to use low-level :doc:`symbolic APIs ` to -build customized neural network models directly. - -The most important code snippets of this example is shown and explained here. -To see and run the complete code, please refer to the `examples/char-lstm -`_ directory. -You will need to install `Iterators.jl -`_ and `StatsBase.jl -`_ to run this example. +This tutorial shows how to train a LSTM (Long short-term memory) RNN +(recurrent neural network) to perform character-level sequence training +and prediction. 
The original model, usually called `char-rnn` is +described in [Andrej Karpathy's +blog](http://karpathy.github.io/2015/05/21/rnn-effectiveness/), with a +reference implementation in Torch available +[here](https://github.com/karpathy/char-rnn). + +Because MXNet.jl does not have a specialized model for recurrent neural +networks yet, the example shown here is an implementation of LSTM by +using the default FeedForward model via explicitly unfolding over time. +We will be using fixed-length input sequence for training. The code is +adapted from the [char-rnn example for MXNet's Python +binding](https://github.com/dmlc/mxnet/blob/master/example/rnn/char_lstm.ipynb), +which demonstrates how to use low-level +symbolic APIs </api/symbolic-node> to build customized neural +network models directly. + +The most important code snippets of this example is shown and explained +here. To see and run the complete code, please refer to the +[examples/char-lstm](https://github.com/dmlc/MXNet.jl/tree/master/examples/char-lstm) +directory. You will need to install +[Iterators.jl](https://github.com/JuliaLang/Iterators.jl) and +[StatsBase.jl](https://github.com/JuliaStats/StatsBase.jl) to run this +example. LSTM Cells ---------- -Christopher Olah has a `great blog post about LSTM -`_ with beautiful and -clear illustrations. So we will not repeat the definition and explanation of -what an LSTM cell is here. Basically, an LSTM cell takes input ``x``, as well as -previous states (including ``c`` and ``h``), and produce the next states. -We define a helper type to bundle the two state variables together: +Christopher Olah has a [great blog post about +LSTM](http://colah.github.io/posts/2015-08-Understanding-LSTMs/) with +beautiful and clear illustrations. So we will not repeat the definition +and explanation of what an LSTM cell is here. Basically, an LSTM cell +takes input `x`, as well as previous states (including `c` and `h`), and +produce the next states. 
We define a helper type to bundle the two state +variables together: -.. literalinclude:: ../../examples/char-lstm/lstm.jl - :language: julia - :start-after: #--LSTMState - :end-before: #--/LSTMState +Because LSTM weights are shared at every time step when we do explicit +unfolding, we also define a helper type to hold all the weights (and +bias) for an LSTM cell for convenience. -Because LSTM weights are shared at every time when we do explicit unfolding, so -we also define a helper type to hold all the weights (and bias) for an LSTM cell -for convenience. +Note all the variables are of type SymbolicNode. We will construct the +LSTM network as a symbolic computation graph, which is then instantiated +with NDArray for actual computation. -.. literalinclude:: ../../examples/char-lstm/lstm.jl - :language: julia - :start-after: #--LSTMParam - :end-before: #--/LSTMParam +The following figure is stolen (permission requested) from [Christopher +Olah's blog](http://colah.github.io/posts/2015-08-Understanding-LSTMs/), +which illustrates exactly what the code snippet above is doing. -Note all the variables are of type :class:`SymbolicNode`. We will construct the -LSTM network as a symbolic computation graph, which is then instantiated with -:class:`NDArray` for actual computation. +![image](images/LSTM3-chain.png) -.. literalinclude:: ../../examples/char-lstm/lstm.jl - :language: julia - :start-after: #--lstm_cell - :end-before: #--/lstm_cell - -The following figure is stolen (permission requested) from -`Christopher Olah's blog -`_, which illustrate -exactly what the code snippet above is doing. - -.. image:: images/LSTM3-chain.png - -In particular, instead of defining the four gates independently, we do the -computation together and then use :class:`SliceChannel` to split them into four -outputs. The computation of gates are all done with the symbolic API. The return -value is a LSTM state containing the output of a LSTM cell.
+In particular, instead of defining the four gates independently, we do +the computation together and then use SliceChannel to split them into +four outputs. The computation of gates are all done with the symbolic +API. The return value is a LSTM state containing the output of a LSTM +cell. Unfolding LSTM -------------- -Using the LSTM cell defined above, we are now ready to define a function to -unfold a LSTM network with L layers and T time steps. The first part of the -function is just defining all the symbolic variables for the shared weights and -states. - -The ``embed_W`` is the weights used for character embedding --- i.e. mapping the -one-hot encoded characters into real vectors. The ``pred_W`` and ``pred_b`` are -weights and bias for the final prediction at each time step. - -Then we define the weights for each LSTM cell. Note there is one cell for each -layer, and it will be replicated (unrolled) over time. The states are, however, -*not* shared over time. Instead, here we define the initial states here at the -beginning of a sequence, and we will update them with the output states at each -time step as we explicitly unroll the LSTM. - -.. literalinclude:: ../../examples/char-lstm/lstm.jl - :language: julia - :start-after: #--LSTM-part1 - :end-before: #--/LSTM-part1 - -Unrolling over time is a straightforward procedure of stacking the embedding -layer, and then LSTM cells, on top of which the prediction layer. During -unrolling, we update the states and collect all the outputs. Note each time step -takes data and label as inputs. If the LSTM is named as ``:ptb``, the data and -label at step ``t`` will be named ``:ptb_data_$t`` and ``:ptb_label_$t``. Late -on when we prepare the data, we will define the data provider to match those -names. - -.. 
literalinclude:: ../../examples/char-lstm/lstm.jl - :language: julia - :start-after: #--LSTM-part2 - :end-before: #--/LSTM-part2 - -Note at each time step, the prediction is connected to a :class:`SoftmaxOutput` -operator, which could back propagate when corresponding labels are provided. The -states are then connected to the next time step, which allows back propagate -through time. However, at the end of the sequence, the final states are not -connected to anything. This dangling outputs is problematic, so we explicitly -connect each of them to a :class:`BlockGrad` operator, which simply back -propagates 0-gradient and closes the computation graph. - -In the end, we just group all the prediction outputs at each time step as -a single :class:`SymbolicNode` and return. Optionally we will also group the -final states, this is used when we use the trained LSTM to sample sentences. - -.. literalinclude:: ../../examples/char-lstm/lstm.jl - :language: julia - :start-after: #--LSTM-part3 - :end-before: #--/LSTM-part3 + +Using the LSTM cell defined above, we are now ready to define a function +to unfold a LSTM network with L layers and T time steps. The first part +of the function is just defining all the symbolic variables for the +shared weights and states. + +The `embed_W` is the weights used for character embedding --- i.e. +mapping the one-hot encoded characters into real vectors. The `pred_W` +and `pred_b` are weights and bias for the final prediction at each time +step. + +Then we define the weights for each LSTM cell. Note there is one cell +for each layer, and it will be replicated (unrolled) over time. The +states are, however, *not* shared over time. Instead, here we define the +initial states here at the beginning of a sequence, and we will update +them with the output states at each time step as we explicitly unroll +the LSTM. 
+ +Unrolling over time is a straightforward procedure of stacking the +embedding layer, and then LSTM cells, on top of which the prediction +layer. During unrolling, we update the states and collect all the +outputs. Note each time step takes data and label as inputs. If the LSTM +is named as `:ptb`, the data and label at step `t` will be named +`:ptb_data_$t` and `:ptb_label_$t`. Later on when we prepare the data, we +will define the data provider to match those names. + +Note at each time step, the prediction is connected to a SoftmaxOutput +operator, which could back propagate when corresponding labels are +provided. The states are then connected to the next time step, which +allows back propagation through time. However, at the end of the sequence, +the final states are not connected to anything. These dangling outputs are +problematic, so we explicitly connect each of them to a BlockGrad +operator, which simply back propagates 0-gradient and closes the +computation graph. + +In the end, we just group all the prediction outputs at each time step +as a single SymbolicNode and return. Optionally we will also group the +final states, this is used when we use the trained LSTM to sample +sentences. Data Provider for Text Sequences -------------------------------- -Now we need to construct a data provider that takes a text file, divide the text -into mini-batches of fixed-length character-sequences, and provide them as -one-hot encoded vectors. - -Note the is no fancy feature extraction at all. Each character is simply encoded -as a one-hot vector: a 0-1 vector of the size given by the vocabulary. Here we -just construct the vocabulary by collecting all the unique characters in the -training text -- there are not too many of them (including punctuations and -whitespace) for English text. Each input character is then encoded as a vector -of 0s on all coordinates, and 1 on the coordinate corresponding to that -character.
The character-to-coordinate mapping is giving by the vocabulary. - -The text sequence data provider implement the :doc:`data provider API -`. We define the ``CharSeqProvider`` as below: - -.. literalinclude:: ../../examples/char-lstm/seq-data.jl - :language: julia - :start-after: #--CharSeqProvider - :end-before: #--/CharSeqProvider - -The provided data and labels follow the naming convention of inputs used when -unrolling the LSTM. Note in the code below, apart from ``$name_data_$t`` and -``$name_label_$t``, we also provides the initial ``c`` and ``h`` states for each -layer. This is because we are using the high-level :class:`FeedForward` API, -which has no idea about time and states. So we will feed the initial states for -each sequence from the data provider. Since the initial states is always zero, -we just need to always provide constant zero blobs. - -.. literalinclude:: ../../examples/char-lstm/seq-data.jl - :language: julia - :start-after: #--provide - :end-before: #--/provide - -Next we implement the :func:`AbstractDataProvider.eachbatch` interface for the provider. -We start by defining the data and label arrays, and the ``DataBatch`` object we -will provide in each iteration. - -.. literalinclude:: ../../examples/char-lstm/seq-data.jl - :language: julia - :start-after: #--eachbatch-part1 - :end-before: #--/eachbatch-part1 - -The actual data providing iteration is implemented as a Julia **coroutine**. In this -way, we can write the data loading logic as a simple coherent ``for`` loop, and -do not need to implement the interface functions like :func:`Base.start`, -:func:`Base.next`, etc. - -Basically, we partition the text into -batches, each batch containing several contiguous text sequences. Note at each -time step, the LSTM is trained to predict the next character, so the label is -the same as the data, but shifted ahead by one index. - -.. 
literalinclude:: ../../examples/char-lstm/seq-data.jl - :language: julia - :start-after: #--eachbatch-part2 - :end-before: #--/eachbatch-part2 - +Now we need to construct a data provider that takes a text file, divides +the text into mini-batches of fixed-length character-sequences, and +provides them as one-hot encoded vectors. + +Note there is no fancy feature extraction at all. Each character is simply +encoded as a one-hot vector: a 0-1 vector of the size given by the +vocabulary. Here we just construct the vocabulary by collecting all the +unique characters in the training text -- there are not too many of them +(including punctuations and whitespace) for English text. Each input +character is then encoded as a vector of 0s on all coordinates, and 1 on +the coordinate corresponding to that character. The +character-to-coordinate mapping is given by the vocabulary. + +The text sequence data provider implements the data provider API +(see `/api/io`). We define the `CharSeqProvider` as below: + +The provided data and labels follow the naming convention of inputs used +when unrolling the LSTM. Note in the code below, apart from +`$name_data_$t` and `$name_label_$t`, we also provide the initial `c` +and `h` states for each layer. This is because we are using the +high-level FeedForward API, which has no idea about time and states. So +we will feed the initial states for each sequence from the data +provider. Since the initial states are always zero, we just need to +always provide constant zero blobs. + +Next we implement the AbstractDataProvider.eachbatch interface for the +provider. We start by defining the data and label arrays, and the +`DataBatch` object we will provide in each iteration. + +The actual data providing iteration is implemented as a Julia +**coroutine**. In this way, we can write the data loading logic as a +simple coherent `for` loop, and do not need to implement the interface +functions like Base.start, Base.next, etc.
+ +Basically, we partition the text into batches, each batch containing +several contiguous text sequences. Note at each time step, the LSTM is +trained to predict the next character, so the label is the same as the +data, but shifted ahead by one index. Training the LSTM ----------------- -Now we have implemented all the supporting infrastructures for our char-lstm. -To train the model, we just follow the standard high-level API. Firstly, we -construct a LSTM symbolic architecture: - -.. literalinclude:: ../../examples/char-lstm/train.jl - :language: julia - :start-after: #--LSTM - :end-before: #--/LSTM - -Note all the parameters are defined in `examples/char-lstm/config.jl -`_. -Now we load the text file and define the data provider. The data ``input.txt`` -we used in this example is `a tiny Shakespeare dataset -`_. But you -can try with other text files. - -.. literalinclude:: ../../examples/char-lstm/train.jl - :language: julia - :start-after: #--data - :end-before: #--/data - -The last step is to construct a model, an optimizer and fit the mode to the -data. We are using the :class:`ADAM` optimizer [Adam]_ in this example. - -.. literalinclude:: ../../examples/char-lstm/train.jl - :language: julia - :start-after: #--train - :end-before: #--/train - -Note we are also using a customized ``NLL`` evaluation metric, which calculate -the negative log-likelihood during training. Here is an output sample at the end of -the training process. - -.. code-block:: text - - ... 
- INFO: Speed: 357.72 samples/sec - INFO: == Epoch 020 ========== - INFO: ## Training summary - INFO: NLL = 1.4672 - INFO: perplexity = 4.3373 - INFO: time = 87.2631 seconds - INFO: ## Validation summary - INFO: NLL = 1.6374 - INFO: perplexity = 5.1418 - INFO: Saved checkpoint to 'char-lstm/checkpoints/ptb-0020.params' - INFO: Speed: 368.74 samples/sec - INFO: Speed: 361.04 samples/sec - INFO: Speed: 360.02 samples/sec - INFO: Speed: 362.34 samples/sec - INFO: Speed: 360.80 samples/sec - INFO: Speed: 362.77 samples/sec - INFO: Speed: 357.18 samples/sec - INFO: Speed: 355.30 samples/sec - INFO: Speed: 362.33 samples/sec - INFO: Speed: 359.23 samples/sec - INFO: Speed: 358.09 samples/sec - INFO: Speed: 356.89 samples/sec - INFO: Speed: 371.91 samples/sec - INFO: Speed: 372.24 samples/sec - INFO: Speed: 356.59 samples/sec - INFO: Speed: 356.64 samples/sec - INFO: Speed: 360.24 samples/sec - INFO: Speed: 360.32 samples/sec - INFO: Speed: 362.38 samples/sec - INFO: == Epoch 021 ========== - INFO: ## Training summary - INFO: NLL = 1.4655 - INFO: perplexity = 4.3297 - INFO: time = 86.9243 seconds - INFO: ## Validation summary - INFO: NLL = 1.6366 - INFO: perplexity = 5.1378 - INFO: Saved checkpoint to 'examples/char-lstm/checkpoints/ptb-0021.params' - - -.. [Adam] Diederik Kingma and Jimmy Ba: *Adam: A Method for Stochastic - Optimization*. `arXiv:1412.6980 `_ - [cs.LG]. - +Now we have implemented all the supporting infrastructures for our +char-lstm. To train the model, we just follow the standard high-level +API. Firstly, we construct a LSTM symbolic architecture: + +Note all the parameters are defined in +[examples/char-lstm/config.jl](https://github.com/dmlc/MXNet.jl/blob/master/examples/char-lstm/config.jl). +Now we load the text file and define the data provider. The data +`input.txt` we used in this example is [a tiny Shakespeare +dataset](https://github.com/dmlc/web-data/tree/master/mxnet/tinyshakespeare). +But you can try with other text files. 
+ +The last step is to construct a model, an optimizer and fit the model to +the data. We are using the ADAM optimizer (Kingma & Ba, arXiv:1412.6980) in this example. + +Note we are also using a customized `NLL` evaluation metric, which +calculates the negative log-likelihood during training. Here is an output +sample at the end of the training process. + +``` {.sourceCode .text} +... +INFO: Speed: 357.72 samples/sec +INFO: == Epoch 020 ========== +INFO: ## Training summary +INFO: NLL = 1.4672 +INFO: perplexity = 4.3373 +INFO: time = 87.2631 seconds +INFO: ## Validation summary +INFO: NLL = 1.6374 +INFO: perplexity = 5.1418 +INFO: Saved checkpoint to 'char-lstm/checkpoints/ptb-0020.params' +INFO: Speed: 368.74 samples/sec +INFO: Speed: 361.04 samples/sec +INFO: Speed: 360.02 samples/sec +INFO: Speed: 362.34 samples/sec +INFO: Speed: 360.80 samples/sec +INFO: Speed: 362.77 samples/sec +INFO: Speed: 357.18 samples/sec +INFO: Speed: 355.30 samples/sec +INFO: Speed: 362.33 samples/sec +INFO: Speed: 359.23 samples/sec +INFO: Speed: 358.09 samples/sec +INFO: Speed: 356.89 samples/sec +INFO: Speed: 371.91 samples/sec +INFO: Speed: 372.24 samples/sec +INFO: Speed: 356.59 samples/sec +INFO: Speed: 356.64 samples/sec +INFO: Speed: 360.24 samples/sec +INFO: Speed: 360.32 samples/sec +INFO: Speed: 362.38 samples/sec +INFO: == Epoch 021 ========== +INFO: ## Training summary +INFO: NLL = 1.4655 +INFO: perplexity = 4.3297 +INFO: time = 86.9243 seconds +INFO: ## Validation summary +INFO: NLL = 1.6366 +INFO: perplexity = 5.1378 +INFO: Saved checkpoint to 'examples/char-lstm/checkpoints/ptb-0021.params' +``` Sampling Random Sentences ------------------------- -After training the LSTM, we can now sample random sentences from the trained -model. The sampler works in the following way: - -- Starting from some fixed character, take ``a`` for example, and feed it as input to the LSTM. -- The LSTM will produce an output distribution over the vocabulary and a state - in the first time step.
We sample a character from the output distribution, - fix it as the second character. -- In the next time step, we feed the previously sampled character as input and - continue running the LSTM by also taking the previous states (instead of the - 0 initial states). -- Continue running until we sampled enough characters. +After training the LSTM, we can now sample random sentences from the +trained model. The sampler works in the following way: -Note we are running with mini-batches, so several sentences could be sampled -simultaneously. Here are some sampled outputs from a network I trained for -around half an hour on the Shakespeare dataset. Note all the line-breaks, -punctuations and upper-lower case letters are produced by the sampler itself. -I did not do any post-processing. +- Starting from some fixed character, take `a` for example, and feed + it as input to the LSTM. +- The LSTM will produce an output distribution over the vocabulary and + a state in the first time step. We sample a character from the + output distribution, fix it as the second character. +- In the next time step, we feed the previously sampled character as + input and continue running the LSTM by also taking the previous + states (instead of the 0 initial states). +- Continue running until we sampled enough characters. -.. code-block:: text +Note we are running with mini-batches, so several sentences could be +sampled simultaneously. Here are some sampled outputs from a network I +trained for around half an hour on the Shakespeare dataset. Note all the +line-breaks, punctuations and upper-lower case letters are produced by +the sampler itself. I did not do any post-processing. - ## Sample 1 - all have sir, - Away will fill'd in His time, I'll keep her, do not madam, if they here? Some more ha? +``` {.sourceCode .text} +## Sample 1 +all have sir, +Away will fill'd in His time, I'll keep her, do not madam, if they here? Some more ha? - ## Sample 2 - am. +## Sample 2 +am. 
- CLAUDIO: - Hone here, let her, the remedge, and I know not slept a likely, thou some soully free? +CLAUDIO: +Hone here, let her, the remedge, and I know not slept a likely, thou some soully free? - ## Sample 3 - arrel which noble thing - The exchnachsureding worns: I ne'er drunken Biancas, fairer, than the lawfu? +## Sample 3 +arrel which noble thing +The exchnachsureding worns: I ne'er drunken Biancas, fairer, than the lawfu? - ## Sample 4 - augh assalu, you'ld tell me corn; - Farew. First, for me of a loved. Has thereat I knock you presents? +## Sample 4 +augh assalu, you'ld tell me corn; +Farew. First, for me of a loved. Has thereat I knock you presents? - ## Sample 5 - ame the first answer. +## Sample 5 +ame the first answer. - MARIZARINIO: - Door of Angelo as her lord, shrield liken Here fellow the fool ? +MARIZARINIO: +Door of Angelo as her lord, shrield liken Here fellow the fool ? - ## Sample 6 - ad well. +## Sample 6 +ad well. - CLAUDIO: - Soon him a fellows here; for her fine edge in a bogms' lord's wife. +CLAUDIO: +Soon him a fellows here; for her fine edge in a bogms' lord's wife. - LUCENTIO: - I? +LUCENTIO: +I? - ## Sample 7 - adrezilian measure. +## Sample 7 +adrezilian measure. - LUCENTIO: - So, help'd you hath nes have a than dream's corn, beautio, I perchas? +LUCENTIO: +So, help'd you hath nes have a than dream's corn, beautio, I perchas? - ## Sample 8 - as eatter me; - The girlly: and no other conciolation! +## Sample 8 +as eatter me; +The girlly: and no other conciolation! - BISTRUMIO: - I have be rest girl. O, that I a h? +BISTRUMIO: +I have be rest girl. O, that I a h? - ## Sample 9 - and is intend you sort: - What held her all 'clama's for maffice. Some servant.' what I say me the cu? +## Sample 9 +and is intend you sort: +What held her all 'clama's for maffice. Some servant.' what I say me the cu? - ## Sample 10 - an thoughts will said in our pleasue, - Not scanin on him that you live; believaries she. 
+## Sample 10 +an thoughts will said in our pleasue, +Not scanin on him that you live; believaries she. - ISABELLLLL? +ISABELLLLL? +``` -See `Andrej Karpathy's blog post -`_ on more examples and -links including Linux source codes, Algebraic Geometry Theorems, and even -cooking recipes. The code for sampling can be found in -`examples/char-lstm/sampler.jl -`_. +See [Andrej Karpathy's blog +post](http://karpathy.github.io/2015/05/21/rnn-effectiveness/) on more +examples and links including Linux source codes, Algebraic Geometry +Theorems, and even cooking recipes. The code for sampling can be found +in +[examples/char-lstm/sampler.jl](https://github.com/dmlc/MXNet.jl/blob/master/examples/char-lstm/sampler.jl). Visualizing the LSTM -------------------- -Finally, you could visualize the LSTM by calling :func:`to_graphviz` on the -constructed LSTM symbolic architecture. We only show an example of 1-layer and -2-time-step LSTM below. The automatic layout produced by GraphViz is definitely -much less clear than `Christopher Olah's illustrations -`_, but could -otherwise be very useful for debugging. As we can see, the LSTM unfolded over -time is just a (very) deep neural network. The complete code for producing this -visualization can be found in `examples/char-lstm/visualize.jl -`_. - -.. image:: images/char-lstm-vis.svg +Finally, you could visualize the LSTM by calling to\_graphviz on the +constructed LSTM symbolic architecture. We only show an example of +1-layer and 2-time-step LSTM below. The automatic layout produced by +GraphViz is definitely much less clear than [Christopher Olah's +illustrations](http://colah.github.io/posts/2015-08-Understanding-LSTMs/), +but could otherwise be very useful for debugging. As we can see, the +LSTM unfolded over time is just a (very) deep neural network. 
The +complete code for producing this visualization can be found in +[examples/char-lstm/visualize.jl](https://github.com/dmlc/MXNet.jl/blob/master/examples/char-lstm/visualize.jl). + +![image](images/char-lstm-vis.svg) diff --git a/docs/src/tutorial/mnist.md b/docs/src/tutorial/mnist.md index fc2e548dd1c2..b4e7a3be89ee 100644 --- a/docs/src/tutorial/mnist.md +++ b/docs/src/tutorial/mnist.md @@ -1,253 +1,270 @@ Digit Recognition on MNIST ========================== -In this tutorial, we will work through examples of training a simple multi-layer -perceptron and then a convolutional neural network (the LeNet architecture) on -the `MNIST handwritten digit dataset `_. The -code for this tutorial could be found in `examples/mnist -`_. +In this tutorial, we will work through examples of training a simple +multi-layer perceptron and then a convolutional neural network (the +LeNet architecture) on the [MNIST handwritten digit +dataset](http://yann.lecun.com/exdb/mnist/). The code for this tutorial +could be found in +[examples/mnist](https://github.com/dmlc/MXNet.jl/tree/master/examples/mnist). Simple 3-layer MLP ------------------ -This is a tiny 3-layer MLP that could be easily trained on CPU. The script starts with +This is a tiny 3-layer MLP that could be easily trained on CPU. The +script starts with -.. code-block:: julia +``` {.sourceCode .julia} +using MXNet +``` - using MXNet +to load the `MXNet` module. Then we are ready to define the network +architecture via the symbolic API </user-guide/overview>. We start +with a placeholder `data` symbol, -to load the ``MXNet`` module. Then we are ready to define the network -architecture via the :doc:`symbolic API `. We start with -a placeholder ``data`` symbol, - -.. code-block:: julia - - data = mx.Variable(:data) +``` {.sourceCode .julia} +data = mx.Variable(:data) +``` and then cascading fully-connected layers and activation functions: -.. 
code-block:: julia - - fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) - act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) - fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) - act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) - fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) - -Note each composition we take the previous symbol as the `data` argument, forming a feedforward chain. The architecture looks like - -.. code-block:: julia - - Input --> 128 units (ReLU) --> 64 units (ReLU) --> 10 units - -where the last 10 units correspond to the 10 output classes (digits 0,...,9). We -then add a final :class:`SoftmaxOutput` operation to turn the 10-dimensional prediction to proper probability values for the 10 classes: - -.. code-block:: julia - - mlp = mx.SoftmaxOutput(data = fc3, name=:softmax) - -As we can see, the MLP is just a chain of layers. For this case, we can also use -the ``mx.chain`` macro. The same architecture above can be defined as - -.. code-block:: julia - - mlp = @mx.chain mx.Variable(:data) => - mx.FullyConnected(name=:fc1, num_hidden=128) => - mx.Activation(name=:relu1, act_type=:relu) => - mx.FullyConnected(name=:fc2, num_hidden=64) => - mx.Activation(name=:relu2, act_type=:relu) => - mx.FullyConnected(name=:fc3, num_hidden=10) => - mx.SoftmaxOutput(name=:softmax) - -After defining the architecture, we are ready to load the MNIST data. MXNet.jl -provide built-in data providers for the MNIST dataset, which could automatically -download the dataset into ``Pkg.dir("MXNet")/data/mnist`` if necessary. We wrap -the code to construct the data provider into ``mnist-data.jl`` so that it could be shared by both the MLP example and the LeNet ConvNets example. - -.. 
code-block:: julia - - batch_size = 100 - include("mnist-data.jl") - train_provider, eval_provider = get_mnist_providers(batch_size) - -If you need to write your own data providers for customized data format, please -refer to :class:`AbstractDataProvider`. - -Given the architecture and data, we can instantiate an *model* to do the actual -training. ``mx.FeedForward`` is the built-in model that is suitable for most feed-forward architectures. When constructing the model, we also specify the *context* on which the computation should be carried out. Because this is a really tiny MLP, we will just run on a single CPU device. - -.. code-block:: julia - - model = mx.FeedForward(mlp, context=mx.cpu()) - -You can use a ``mx.gpu()`` or if a list of devices (e.g. ``[mx.gpu(0), -mx.gpu(1)]``) is provided, data-parallelization will be used automatically. But for this tiny example, using a GPU device might not help. - -The last thing we need to specify is the optimization algorithm (a.k.a. *optimizer*) to use. We use the basic SGD with a fixed learning rate 0.1 and momentum 0.9: - -.. code-block:: julia - - optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) - -Now we can do the training. Here the ``n_epoch`` parameter specifies that we -want to train for 20 epochs. We also supply a ``eval_data`` to monitor validation accuracy on the validation set. - -.. code-block:: julia - - mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +``` {.sourceCode .julia} +fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) +act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) +fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) +act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) +fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) +``` + +Note each composition we take the previous symbol as the data argument, +forming a feedforward chain. 
The architecture looks like + +``` {.sourceCode .julia} +Input --> 128 units (ReLU) --> 64 units (ReLU) --> 10 units +``` + +where the last 10 units correspond to the 10 output classes (digits +0,...,9). We then add a final SoftmaxOutput operation to turn the +10-dimensional prediction to proper probability values for the 10 +classes: + +``` {.sourceCode .julia} +mlp = mx.SoftmaxOutput(data = fc3, name=:softmax) +``` + +As we can see, the MLP is just a chain of layers. For this case, we can +also use the `mx.chain` macro. The same architecture above can be +defined as + +``` {.sourceCode .julia} +mlp = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=128) => + mx.Activation(name=:relu1, act_type=:relu) => + mx.FullyConnected(name=:fc2, num_hidden=64) => + mx.Activation(name=:relu2, act_type=:relu) => + mx.FullyConnected(name=:fc3, num_hidden=10) => + mx.SoftmaxOutput(name=:softmax) +``` + +After defining the architecture, we are ready to load the MNIST data. +MXNet.jl provide built-in data providers for the MNIST dataset, which +could automatically download the dataset into +`Pkg.dir("MXNet")/data/mnist` if necessary. We wrap the code to +construct the data provider into `mnist-data.jl` so that it could be +shared by both the MLP example and the LeNet ConvNets example. + +``` {.sourceCode .julia} +batch_size = 100 +include("mnist-data.jl") +train_provider, eval_provider = get_mnist_providers(batch_size) +``` + +If you need to write your own data providers for customized data format, +please refer to AbstractDataProvider. + +Given the architecture and data, we can instantiate an *model* to do the +actual training. `mx.FeedForward` is the built-in model that is suitable +for most feed-forward architectures. When constructing the model, we +also specify the *context* on which the computation should be carried +out. Because this is a really tiny MLP, we will just run on a single CPU +device. 
+ +``` {.sourceCode .julia} +model = mx.FeedForward(mlp, context=mx.cpu()) +``` + +You can use a `mx.gpu()` or if a list of devices (e.g. +`[mx.gpu(0), mx.gpu(1)]`) is provided, data-parallelization will be used +automatically. But for this tiny example, using a GPU device might not +help. + +The last thing we need to specify is the optimization algorithm (a.k.a. +*optimizer*) to use. We use the basic SGD with a fixed learning rate 0.1 +and momentum 0.9: + +``` {.sourceCode .julia} +optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) +``` + +Now we can do the training. Here the `n_epoch` parameter specifies that +we want to train for 20 epochs. We also supply a `eval_data` to monitor +validation accuracy on the validation set. + +``` {.sourceCode .julia} +mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +``` Here is a sample output -.. code-block:: text - - INFO: Start training on [CPU0] - INFO: Initializing parameters... - INFO: Creating KVStore... - INFO: == Epoch 001 ========== - INFO: ## Training summary - INFO: :accuracy = 0.7554 - INFO: time = 1.3165 seconds - INFO: ## Validation summary - INFO: :accuracy = 0.9502 - ... - INFO: == Epoch 020 ========== - INFO: ## Training summary - INFO: :accuracy = 0.9949 - INFO: time = 0.9287 seconds - INFO: ## Validation summary - INFO: :accuracy = 0.9775 - +``` {.sourceCode .text} +INFO: Start training on [CPU0] +INFO: Initializing parameters... +INFO: Creating KVStore... +INFO: == Epoch 001 ========== +INFO: ## Training summary +INFO: :accuracy = 0.7554 +INFO: time = 1.3165 seconds +INFO: ## Validation summary +INFO: :accuracy = 0.9502 +... +INFO: == Epoch 020 ========== +INFO: ## Training summary +INFO: :accuracy = 0.9949 +INFO: time = 0.9287 seconds +INFO: ## Validation summary +INFO: :accuracy = 0.9775 +``` Convolutional Neural Networks ----------------------------- -In the second example, we show a slightly more complicated architecture that -involves convolution and pooling. 
This architecture for the MNIST is usually -called the [LeNet]_. The first part of the architecture is listed below: - -.. code-block:: julia +In the second example, we show a slightly more complicated architecture +that involves convolution and pooling. This architecture for the MNIST +is usually called the \[LeNet\]\_. The first part of the architecture is +listed below: - # input - data = mx.Variable(:data) +``` {.sourceCode .julia} +# input +data = mx.Variable(:data) - # first conv - conv1 = @mx.chain mx.Convolution(data=data, kernel=(5,5), num_filter=20) => - mx.Activation(act_type=:tanh) => - mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) +# first conv +conv1 = @mx.chain mx.Convolution(data=data, kernel=(5,5), num_filter=20) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) - # second conv - conv2 = @mx.chain mx.Convolution(data=conv1, kernel=(5,5), num_filter=50) => - mx.Activation(act_type=:tanh) => - mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) +# second conv +conv2 = @mx.chain mx.Convolution(data=conv1, kernel=(5,5), num_filter=50) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) +``` We basically defined two convolution modules. Each convolution module is -actually a chain of ``Convolution``, ``tanh`` activation and then max ``Pooling`` operations. - -Each sample in the MNIST dataset is a 28x28 single-channel grayscale image. In -the tensor format used by ``NDArray``, a batch of 100 samples is a tensor of -shape ``(28,28,1,100)``. The convolution and pooling operates in the spatial -axis, so ``kernel=(5,5)`` indicate a square region of 5-width and 5-height. -The rest of the architecture follows as: - -.. 
code-block:: julia - - # first fully-connected - fc1 = @mx.chain mx.Flatten(data=conv2) => - mx.FullyConnected(num_hidden=500) => - mx.Activation(act_type=:tanh) - - # second fully-connected - fc2 = mx.FullyConnected(data=fc1, num_hidden=10) - - # softmax loss - lenet = mx.Softmax(data=fc2, name=:softmax) - -Note a fully-connected operator expects the input to be a matrix. However, the -results from spatial convolution and pooling are 4D tensors. So we explicitly -used a ``Flatten`` operator to flat the tensor, before connecting it to the -``FullyConnected`` operator. - -The rest of the network is the same as the previous MLP example. As before, we can now load the MNIST dataset: - -.. code-block:: julia - - batch_size = 100 - include("mnist-data.jl") - train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) - -Note we specified ``flat=false`` to tell the data provider to provide 4D tensors instead of 2D matrices because the convolution operators needs correct spatial shape information. We then construct a feedforward model on GPU, and train it. - -.. code-block:: julia - - #-------------------------------------------------------------------------------- - # fit model - model = mx.FeedForward(lenet, context=mx.gpu()) - - # optimizer - optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) - - # fit parameters - mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +actually a chain of `Convolution`, `tanh` activation and then max +`Pooling` operations. + +Each sample in the MNIST dataset is a 28x28 single-channel grayscale +image. In the tensor format used by `NDArray`, a batch of 100 samples is +a tensor of shape `(28,28,1,100)`. The convolution and pooling operates +in the spatial axis, so `kernel=(5,5)` indicate a square region of +5-width and 5-height. 
The rest of the architecture follows as: + +``` {.sourceCode .julia} +# first fully-connected +fc1 = @mx.chain mx.Flatten(data=conv2) => + mx.FullyConnected(num_hidden=500) => + mx.Activation(act_type=:tanh) + +# second fully-connected +fc2 = mx.FullyConnected(data=fc1, num_hidden=10) + +# softmax loss +lenet = mx.Softmax(data=fc2, name=:softmax) +``` + +Note a fully-connected operator expects the input to be a matrix. +However, the results from spatial convolution and pooling are 4D +tensors. So we explicitly used a `Flatten` operator to flat the tensor, +before connecting it to the `FullyConnected` operator. + +The rest of the network is the same as the previous MLP example. As +before, we can now load the MNIST dataset: + +``` {.sourceCode .julia} +batch_size = 100 +include("mnist-data.jl") +train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) +``` + +Note we specified `flat=false` to tell the data provider to provide 4D +tensors instead of 2D matrices because the convolution operators needs +correct spatial shape information. We then construct a feedforward model +on GPU, and train it. + +``` {.sourceCode .julia} +#-------------------------------------------------------------------------------- +# fit model +model = mx.FeedForward(lenet, context=mx.gpu()) + +# optimizer +optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) + +# fit parameters +mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) +``` And here is a sample of running outputs: -.. code-block:: text - - INFO: == Epoch 001 ========== - INFO: ## Training summary - INFO: :accuracy = 0.6750 - INFO: time = 4.9814 seconds - INFO: ## Validation summary - INFO: :accuracy = 0.9712 - ... - INFO: == Epoch 020 ========== - INFO: ## Training summary - INFO: :accuracy = 1.0000 - INFO: time = 4.0086 seconds - INFO: ## Validation summary - INFO: :accuracy = 0.9915 - - -.. 
[LeNet] Lecun, Y.; Bottou, L.; Bengio, Y.; Haffner, P., - *Gradient-based learning applied to document recognition*, - Proceedings of the IEEE, vol.86, no.11, pp.2278-2324, - Nov 1998. +``` {.sourceCode .text} +INFO: == Epoch 001 ========== +INFO: ## Training summary +INFO: :accuracy = 0.6750 +INFO: time = 4.9814 seconds +INFO: ## Validation summary +INFO: :accuracy = 0.9712 +... +INFO: == Epoch 020 ========== +INFO: ## Training summary +INFO: :accuracy = 1.0000 +INFO: time = 4.0086 seconds +INFO: ## Validation summary +INFO: :accuracy = 0.9915 +``` Predicting with a trained model ------------------------------- -Predicting with a trained model is very simple. By calling ``mx.predict`` with the -model and a data provider, we get the model output as a Julia Array: - -.. code-block:: julia - - probs = mx.predict(model, eval_provider) - -The following code shows a stupid way of getting all the labels from the data -provider, and compute the prediction accuracy manually: - -.. code-block:: julia - - # collect all labels from eval data - labels = Array[] - for batch in eval_provider - push!(labels, copy(mx.get_label(batch))) - end - labels = cat(1, labels...) - - # Now we use compute the accuracy - correct = 0 - for i = 1:length(labels) - # labels are 0...9 - if indmax(probs[:,i]) == labels[i]+1 - correct += 1 - end - end - println(mx.format("Accuracy on eval set: {1:.2f}%", 100correct/length(labels))) +Predicting with a trained model is very simple. By calling `mx.predict` +with the model and a data provider, we get the model output as a Julia +Array: + +``` {.sourceCode .julia} +probs = mx.predict(model, eval_provider) +``` + +The following code shows a stupid way of getting all the labels from the +data provider, and compute the prediction accuracy manually: + +``` {.sourceCode .julia} +# collect all labels from eval data +labels = Array[] +for batch in eval_provider + push!(labels, copy(mx.get_label(batch))) +end +labels = cat(1, labels...) 
+ +# Now we use compute the accuracy +correct = 0 +for i = 1:length(labels) + # labels are 0...9 + if indmax(probs[:,i]) == labels[i]+1 + correct += 1 + end +end +println(mx.format("Accuracy on eval set: {1:.2f}%", 100correct/length(labels))) +``` Alternatively, when the dataset is huge, one can provide a callback to -``mx.predict``, then the callback function will be invoked with the outputs of -each mini-batch. The callback could, for example, write the data to disk for -future inspection. In this case, no value is returned from ``mx.predict``. See -also :func:`predict`. +`mx.predict`, then the callback function will be invoked with the +outputs of each mini-batch. The callback could, for example, write the +data to disk for future inspection. In this case, no value is returned +from `mx.predict`. See also predict. diff --git a/docs/src/user-guide/faq.md b/docs/src/user-guide/faq.md new file mode 100644 index 000000000000..8fd8a6b34551 --- /dev/null +++ b/docs/src/user-guide/faq.md @@ -0,0 +1,8 @@ +FAQ +=== + +Running MXNet on AWS GPU instances +---------------------------------- + +See the discussions and notes +[here](https://github.com/dmlc/MXNet.jl/issues/43). diff --git a/docs/src/user-guide/faq.rst b/docs/src/user-guide/faq.rst deleted file mode 100644 index 602c8ab9fda5..000000000000 --- a/docs/src/user-guide/faq.rst +++ /dev/null @@ -1,7 +0,0 @@ -FAQ -=== - -Running MXNet on AWS GPU instances ----------------------------------- -See the discussions and notes `here -`_. diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md new file mode 100644 index 000000000000..9c66a84204da --- /dev/null +++ b/docs/src/user-guide/install.md @@ -0,0 +1,67 @@ +Installation Guide +================== + +Automatic Installation +---------------------- + +To install MXNet.jl, simply type + +``` {.sourceCode .julia} +Pkg.add("MXNet") +``` + +in the Julia REPL. 
Or to use the latest git version of MXNet.jl, use the +following command instead + +``` {.sourceCode .julia} +Pkg.checkout("MXNet") +``` + +MXNet.jl is built on top of [libmxnet](https://github.com/dmlc/mxnet). +Upon installation, Julia will try to automatically download and build +libmxnet. + +The libmxnet source is downloaded to `Pkg.dir("MXNet")/deps/src/mxnet`. +The automatic build is using default configurations, with OpenCV and CUDA +disabled. If the compilation fails due to unresolved dependencies, or if +you want to customize the build, it is recommended to compile and +install libmxnet manually. Please see [Manual Compilation](#manual-compilation) below +for more details. + +Manual Compilation +------------------ + +It is possible to compile libmxnet separately and point MXNet.jl to +the existing library in case automatic compilation fails due to +unresolved dependencies in a non-standard environment, or when one wants +to work with a separate, maybe customized libmxnet. + +To build libmxnet, please refer to [the installation guide of +libmxnet](http://mxnet.readthedocs.org/en/latest/build.html). After +successfully installing libmxnet, set the `MXNET_HOME` environment +variable to the location of libmxnet. In other words, the compiled +`libmxnet.so` should be found in `$MXNET_HOME/lib`. + +> **note** +> +> The constant `MXNET_HOME` is pre-compiled in MXNet.jl package cache. +> If you updated the environment variable after installing MXNet.jl, +> make sure to update the pre-compilation cache by +> `Base.compilecache("MXNet")`. + +When the `MXNET_HOME` environment variable is detected and the +corresponding `libmxnet.so` could be loaded successfully, MXNet.jl will +skip automatic building during installation and use the specified +libmxnet instead.
+ +Basically, MXNet.jl will search `libmxnet.so` or `libmxnet.dll` in the +following paths (and in that order): + +- `$MXNET_HOME/lib`: customized libmxnet builds +- `Pkg.dir("MXNet")/deps/usr/lib`: automatic builds +- Any system wide library search path + +Note that MXNet.jl will not find `libmxnet.so` even if it is on one of +the paths above if a library it depends upon is missing from the +`LD_LIBRARY_PATH`. Thus, if you are going to compile to add CUDA, the +path to the CUDA libraries will have to be added to `LD_LIBRARY_PATH`. diff --git a/docs/src/user-guide/install.rst b/docs/src/user-guide/install.rst deleted file mode 100644 index d53830a0cb37..000000000000 --- a/docs/src/user-guide/install.rst +++ /dev/null @@ -1,56 +0,0 @@ -Installation Guide -================== - -Automatic Installation ----------------------- - -To install MXNet.jl, simply type - -.. code-block:: julia - - Pkg.add("MXNet") - -in the Julia REPL. Or to use the latest git version of MXNet.jl, use the following command instead - -.. code-block:: julia - - Pkg.checkout("MXNet") - -MXNet.jl is built on top of `libmxnet -`_. Upon installation, Julia will try to -automatically download and build libmxnet. - -The libmxnet source is downloaded to ``Pkg.dir("MXNet")/deps/src/mxnet``. The -automatic build is using default configurations, with OpenCV, CUDA disabled. -If the compilation failed due to unresolved dependency, or if you want to -customize the build, it is recommended to compile and install libmxnet manually. -Please see :ref:`below ` for more details. - - -Manual Compilation ------------------- - -It is possible to compile libmxnet separately and point MXNet.jl to a the existing library in case automatic compilation fails due to unresolved dependencies in an un-standard environment; Or when one want to work with a seperate, maybe customized libmxnet. - -To build libmxnet, please refer to `the installation guide of libmxnet -`_. 
After successfully -installing libmxnet, set the ``MXNET_HOME`` environment variable to the location -of libmxnet. In other words, the compiled ``libmxnet.so`` should be found in -``$MXNET_HOME/lib``. - -.. note:: - - The constant ``MXNET_HOME`` is pre-compiled in MXNet.jl package cache. If you - updated the environment variable after installing MXNet.jl, make sure to - update the pre-compilation cache by ``Base.compilecache("MXNet")``. - -When the ``MXNET_HOME`` environment variable is detected and the corresponding -``libmxnet.so`` could be loaded successfully, MXNet.jl will skip automatic building during installation and use the specified libmxnet instead. - -Basically, MXNet.jl will search ``libmxnet.so`` or ``libmxnet.dll`` in the following paths (and in that order): - -* ``$MXNET_HOME/lib``: customized libmxnet builds -* ``Pkg.dir("MXNet")/deps/usr/lib``: automatic builds -* Any system wide library search path - -Note that MXNet.jl will not find ``libmxnet.so`` even if it is on one of the paths above if a library it depends upon is missing from the ``LD_LIBRARY_PATH``. Thus, if you are going to compile to add CUDA, the path to the CUDA libraries will have to be added to ``LD_LIBRARY_PATH``. diff --git a/docs/src/user-guide/overview.md b/docs/src/user-guide/overview.md new file mode 100644 index 000000000000..6197fc417a7e --- /dev/null +++ b/docs/src/user-guide/overview.md @@ -0,0 +1,412 @@ +Overview +======== + +MXNet.jl Namespace +------------------ + +Most the functions and types in MXNet.jl are organized in a flat +namespace. Because many some functions are conflicting with existing +names in the Julia Base module, we wrap them all in a `mx` module. 
The +convention of accessing the MXNet.jl interface is the to use the `mx.` +prefix explicitly: + +``` {.sourceCode .julia} +using MXNet + +x = mx.zeros(2,3) # MXNet NDArray +y = zeros(eltype(x), size(x)) # Julia Array +copy!(y, x) # Overloaded function in Julia Base +z = mx.ones(size(x), mx.gpu()) # MXNet NDArray on GPU +mx.copy!(z, y) # Same as copy!(z, y) +``` + +Note functions like `size`, `copy!` that is extensively overloaded for +various types works out of the box. But functions like `zeros` and +`ones` will be ambiguous, so we always use the `mx.` prefix. If you +prefer, the `mx.` prefix can be used explicitly for all MXNet.jl +functions, including `size` and `copy!` as shown in the last line. + +Low Level Interface +------------------- + +### NDArrays + +NDArray is the basic building blocks of the actual computations in +MXNet. It is like a Julia `Array` object, with some important +differences listed here: + +- The actual data could live on different `Context` (e.g. GPUs). For + some contexts, iterating into the elements one by one is very slow, + thus indexing into NDArray is not supported in general. The easiest + way to inspect the contents of an NDArray is to use the `copy` + function to copy the contents as a Julia `Array`. +- Operations on NDArray (including basic arithmetics and neural + network related operators) are executed in parallel with automatic + dependency tracking to ensure correctness. +- There is no generics in NDArray, the `eltype` is always + `mx.MX_float`. Because for applications in machine learning, single + precision floating point numbers are typical a best choice balancing + between precision, speed and portability. Also since libmxnet is + designed to support multiple languages as front-ends, it is much + simpler to implement with a fixed data type. + +While most of the computation is hidden in libmxnet by operators +corresponding to various neural network layers. 
Getting familiar with +the NDArray API is useful for implementing `Optimizer` or customized +operators in Julia directly. + +The following are common ways to create NDArray objects: + +- `mx.empty(shape[, context])`: create an uninitialized array of a + given shape on a specific device. For example, + `mx.empty(2,3)`, `mx.empty((2,3), mx.gpu(2))`. +- `mx.zeros(shape[, context])` and `mx.ones(shape[, context])`: + similar to Julia's built-in `zeros` and `ones`. +- `mx.copy(jl_arr, context)`: copy the contents of a Julia `Array` to + a specific device. + +Most of the convenient functions like `size`, `length`, `ndims`, +`eltype` on array objects should work out-of-the-box. Although indexing +is not supported, it is possible to take *slices*: + +``` {.sourceCode .julia} +a = mx.ones(2,3) +b = mx.slice(a, 1:2) +b[:] = 2 +println(copy(a)) +# => +# Float32[2.0 2.0 1.0 +# 2.0 2.0 1.0] +``` + +A slice is a sub-region sharing the same memory with the original +NDArray object. A slice is always a contiguous piece of memory, so only +slicing on the *last* dimension is supported. The example above also +shows a way to set the contents of an NDArray. + +``` {.sourceCode .julia} +a = mx.empty(2,3) +a[:] = 0.5 # set all elements to a scalar +a[:] = rand(size(a)) # set contents with a Julia Array +copy!(a, rand(size(a))) # set value by copying a Julia Array +b = mx.empty(size(a)) +b[:] = a # copying and assignment between NDArrays +``` + +Note that due to the intrinsic design of the Julia language, a normal +assignment + +``` {.sourceCode .julia} +a = b +``` + +does **not** mean copying the contents of `b` to `a`. Instead, it just +makes the variable `a` point to a new object, which is `b`.
Similarly, +in-place arithmetic does not work as expected: + +``` {.sourceCode .julia} +a = mx.ones(2) +r = a # keep a reference to a +b = mx.ones(2) +a += b # translates to a = a + b +println(copy(a)) +# => Float32[2.0f0,2.0f0] +println(copy(r)) +# => Float32[1.0f0,1.0f0] +``` + +As we can see, `a` has the expected value, but instead of in-place updating, +a new NDArray is created and `a` is set to point to this new object. If +we look at `r`, which still refers to the old `a`, its content has +not changed. There is currently no way in Julia to overload the +operators like `+=` to get customized behavior. + +Instead, you will need to write `a[:] = a+b`, or if you want a *real* +in-place `+=` operation, MXNet.jl provides a simple macro `@mx.inplace`: + +``` {.sourceCode .julia} +@mx.inplace a += b +macroexpand(:(@mx.inplace a += b)) +# => :(MXNet.mx.add_to!(a,b)) +``` + +As we can see, it translates the `+=` operator to an explicit `add_to!` +function call, which calls into libmxnet to add the contents of `b` +into `a` directly. For example, the following is the update rule in the +SGD `Optimizer` (both `grad` and `weight` are NDArray objects): + +``` {.sourceCode .julia} +@inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) +``` + +Note there is not much magic in `mx.inplace`: it only does a shallow +translation. In the SGD update rule example above, the computation like +scaling the gradient by `grad_scale` and adding the weight decay all +create temporary NDArray objects. To mitigate this issue, libmxnet has a +customized memory allocator designed specifically to handle this kind of +situation. The following snippet does a simple benchmark on allocating +temp NDArray vs.
pre-allocating: + +``` {.sourceCode .julia} +using Benchmark +using MXNet + +N_REP = 1000 +SHAPE = (128, 64) +CTX = mx.cpu() +LR = 0.1 + +function inplace_op() + weight = mx.zeros(SHAPE, CTX) + grad = mx.ones(SHAPE, CTX) + + # pre-allocate temp objects + grad_lr = mx.empty(SHAPE, CTX) + + for i = 1:N_REP + copy!(grad_lr, grad) + @mx.inplace grad_lr .*= LR + @mx.inplace weight -= grad_lr + end + return weight +end + +function normal_op() + weight = mx.zeros(SHAPE, CTX) + grad = mx.ones(SHAPE, CTX) + + for i = 1:N_REP + weight[:] -= LR * grad + end + return weight +end + +# make sure the results are the same +@assert(maximum(abs(copy(normal_op() - inplace_op()))) < 1e-6) + +println(compare([inplace_op, normal_op], 100)) +``` + +The comparison on my laptop shows that `normal_op` while allocating a +lot of temp NDArray in the loop (the performance gets worse when +increasing `N_REP`), is only about twice slower than the pre-allocated +one. + + Row Function Average Relative Replications + ------ --------------- ------------ ----------- --------------- + 1 "inplace\_op" 0.0074854 1.0 100 + 2 "normal\_op" 0.0174202 2.32723 100 + +So it will usually not be a big problem unless you are at the bottleneck +of the computation. + +### Distributed Key-value Store + +The type `KVStore` and related methods are used for data sharing across +different devices or machines. It provides a simple and efficient +integer - NDArray key-value storage system that each device can pull or +push. + +The following example shows how to create a local `KVStore`, initialize +a value and then pull it back. 
+ +``` {.sourceCode .julia} +kv = mx.KVStore(:local) +shape = (2,3) +key = 3 + +mx.init!(kv, key, mx.ones(shape)*2) +a = mx.empty(shape) +mx.pull!(kv, key, a) # pull value into a +println(copy(a)) +# => +# Float32[2.0 2.0 2.0 +# 2.0 2.0 2.0] +``` + +Intermediate Level Interface +---------------------------- + +### Symbols and Composition + +The way we build deep learning models in MXNet.jl is to use the powerful +symbolic composition system. It is like +[Theano](http://deeplearning.net/software/theano/), except that we +avoided long expression compiliation time by providing *larger* neural +network related building blocks to guarantee computation performance. +See also [this +note](http://mxnet.readthedocs.org/en/latest/program_model.html) for the +design and trade-off of the MXNet symbolic composition system. + +The basic type is `mx.Symbol`. The following is a trivial example of +composing two symbols with the `+` operation. + +``` {.sourceCode .julia} +A = mx.Variable(:A) +B = mx.Variable(:B) +C = A + B +``` + +We get a new *symbol* by composing existing *symbols* by some +*operations*. A hierarchical architecture of a deep neural network could +be realized by recursive composition. For example, the following code +snippet shows a simple 2-layer MLP construction, using a hidden layer of +128 units and a ReLU activation function. + +``` {.sourceCode .julia} +net = mx.Variable(:data) +net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) +net = mx.Activation(data=net, name=:relu1, act_type=:relu) +net = mx.FullyConnected(data=net, name=:fc2, num_hidden=64) +net = mx.Softmax(data=net, name=:out) +``` + +Each time we take the previous symbol, and compose with an operation. +Unlike the simple `+` example above, the *operations* here are "bigger" +ones, that correspond to common computation layers in deep neural +networks. + +Each of those operation takes one or more input symbols for composition, +with optional hyper-parameters (e.g. 
`num_hidden`, `act_type`) to +further customize the composition results. + +When applying those operations, we can also specify a `name` for the +result symbol. This is convenient if we want to refer to this symbol +later on. If not supplied, a name will be automatically generated. + +Each symbol takes some arguments. For example, in the `+` case above, to +compute the value of `C`, we will need to know the values of the two +inputs `A` and `B`. For neural networks, the arguments are primarily two +categories: *inputs* and *parameters*. *inputs* are data and labels for +the networks, while *parameters* are typically trainable *weights*, +*bias*, *filters*. + +When composing symbols, their arguments accumulates. We can list all the +arguments by + +``` {.sourceCode .julia} +julia> mx.list_arguments(net) +6-element Array{Symbol,1}: + :data # Input data, name from the first data variable + :fc1_weight # Weights of the fully connected layer named :fc1 + :fc1_bias # Bias of the layer :fc1 + :fc2_weight # Weights of the layer :fc2 + :fc2_bias # Bias of the layer :fc2 + :out_label # Input label, required by the softmax layer named :out +``` + +Note the names of the arguments are generated according to the provided +name for each layer. We can also specify those names explicitly: + +``` {.sourceCode .julia} +net = mx.Variable(:data) +w = mx.Variable(:myweight) +net = mx.FullyConnected(data=data, weight=w, name=:fc1, num_hidden=128) +mx.list_arguments(net) +# => +# 3-element Array{Symbol,1}: +# :data +# :myweight +# :fc1_bias +``` + +The simple fact is that a `Variable` is just a placeholder `mx.Symbol`. +In composition, we can use arbitrary symbols for arguments. 
For example: + +``` {.sourceCode .julia} +net = mx.Variable(:data) +net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) +net2 = mx.Variable(:data2) +net2 = mx.FullyConnected(data=net2, name=:net2, num_hidden=128) +mx.list_arguments(net2) +# => +# 3-element Array{Symbol,1}: +# :data2 +# :net2_weight +# :net2_bias +composed_net = net2(data2=net, name=:composed) +mx.list_arguments(composed_net) +# => +# 5-element Array{Symbol,1}: +# :data +# :fc1_weight +# :fc1_bias +# :net2_weight +# :net2_bias +``` + +Note we use a composed symbol, `net` as the argument `data2` for `net2` +to get a new symbol, which we named `:composed`. It also shows that a +symbol itself is a call-able object, which can be invoked to fill in +missing arguments and get more complicated symbol compositions. + +### Shape Inference + +Given enough information, the shapes of all arguments in a composed +symbol could be inferred automatically. For example, given the input +shape, and some hyper-parameters like `num_hidden`, the shapes for the +weights and bias in a neural network could be inferred. + +``` {.sourceCode .julia} +net = mx.Variable(:data) +net = mx.FullyConnected(data=net, name=:fc1, num_hidden=10) +arg_shapes, out_shapes, aux_shapes = mx.infer_shape(net, data=(10, 64)) +``` + +The returned shapes corresponds to arguments with the same order as +returned by `mx.list_arguments`. The `out_shapes` are shapes for +outputs, and `aux_shapes` can be safely ignored for now. + +``` {.sourceCode .julia} +for (n,s) in zip(mx.list_arguments(net), arg_shapes) + println("$n => $s") +end +# => +# data => (10,64) +# fc1_weight => (10,10) +# fc1_bias => (10,) +for (n,s) in zip(mx.list_outputs(net), out_shapes) + println("$n => $s") +end +# => +# fc1_output => (10,64) +``` + +### Binding and Executing + +In order to execute the computation graph specified a composed symbol, +we will *bind* the free variables to concrete values, specified as +`mx.NDArray`. 
This will create an `mx.Executor` on a given `mx.Context`. +A context describes the computation devices (CPUs, GPUs, etc.) and an +executor will carry out the computation (forward/backward) specified in +the corresponding symbolic composition. + +``` {.sourceCode .julia} +A = mx.Variable(:A) +B = mx.Variable(:B) +C = A .* B +a = mx.ones(3) * 4 +b = mx.ones(3) * 2 +c_exec = mx.bind(C, context=mx.cpu(), args=Dict(:A => a, :B => b)) + +mx.forward(c_exec) +copy(c_exec.outputs[1]) # copy turns NDArray into Julia Array +# => +# 3-element Array{Float32,1}: +# 8.0 +# 8.0 +# 8.0 +``` + +For neural networks, it is easier to use `simple_bind`. By providing the +shape for input arguments, it will perform a shape inference for the +rest of the arguments and create the NDArray automatically. In practice, +the binding and executing steps are hidden under the `Model` interface. + +**TODO** Provide pointers to model tutorial and further details about +binding and symbolic API. + +High Level Interface +-------------------- + +The high level interface include model training and prediction API, etc. diff --git a/docs/src/user-guide/overview.rst b/docs/src/user-guide/overview.rst deleted file mode 100644 index b93de48fed7f..000000000000 --- a/docs/src/user-guide/overview.rst +++ /dev/null @@ -1,376 +0,0 @@ -Overview -======== - -MXNet.jl Namespace ------------------- - -Most the functions and types in MXNet.jl are organized in a flat namespace. -Because many some functions are conflicting with existing names in the Julia -Base module, we wrap them all in a ``mx`` module. The convention of accessing -the MXNet.jl interface is the to use the ``mx.`` prefix explicitly: - -.. 
code-block:: julia - - using MXNet - - x = mx.zeros(2,3) # MXNet NDArray - y = zeros(eltype(x), size(x)) # Julia Array - copy!(y, x) # Overloaded function in Julia Base - z = mx.ones(size(x), mx.gpu()) # MXNet NDArray on GPU - mx.copy!(z, y) # Same as copy!(z, y) - -Note functions like ``size``, ``copy!`` that is extensively overloaded for -various types works out of the box. But functions like ``zeros`` and ``ones`` -will be ambiguous, so we always use the ``mx.`` prefix. If you prefer, the -``mx.`` prefix can be used explicitly for all MXNet.jl functions, including -``size`` and ``copy!`` as shown in the last line. - -Low Level Interface -------------------- - -NDArrays -~~~~~~~~ - -:class:`NDArray` is the basic building blocks of the actual computations in MXNet. It -is like a Julia ``Array`` object, with some important differences listed here: - -* The actual data could live on different ``Context`` (e.g. GPUs). For some - contexts, iterating into the elements one by one is very slow, thus indexing - into :class:`NDArray` is not supported in general. The easiest way to inspect the - contents of an :class:`NDArray` is to use the ``copy`` function to copy the - contents as a Julia ``Array``. -* Operations on :class:`NDArray` (including basic arithmetics and neural network related operators) are executed in parallel with automatic dependency tracking to ensure correctness. -* There is no generics in :class:`NDArray`, the ``eltype`` is always ``mx.MX_float``. Because for applications in machine learning, single precision floating point numbers are typical a best choice balancing between precision, speed and portability. Also since libmxnet is designed to support multiple languages as front-ends, it is much simpler to implement with a fixed data type. - -While most of the computation is hidden in libmxnet by operators corresponding -to various neural network layers. 
Getting familiar with the :class:`NDArray` API is -useful for implementing ``Optimizer`` or customized operators in Julia directly. - -The followings are common ways to create :class:`NDArray` objects: - -* ``mx.empty(shape[, context])``: create on uninitialized array of a given shape - on a specific device. For example, ``mx.empty(2,3)`, `mx.((2,3), mx.gpu(2))``. -* ``mx.zeros(shape[, context])`` and ``mx.ones(shape[, context])``: similar to - the Julia's built-in ``zeros`` and ``ones``. -* ``mx.copy(jl_arr, context)``: copy the contents of a Julia ``Array`` to a specific device. - -Most of the convenient functions like ``size``, ``length``, ``ndims``, ``eltype`` on array objects should work out-of-the-box. Although indexing is not supported, it is possible to take *slices*: - -.. code-block:: julia - - a = mx.ones(2,3) - b = mx.slice(a, 1:2) - b[:] = 2 - println(copy(a)) - # => - # Float32[2.0 2.0 1.0 - # 2.0 2.0 1.0] - -A slice is a sub-region sharing the same memory with the original :class:`NDArray` -object. A slice is always a contiguous piece of memory, so only slicing on the -*last* dimension is supported. The example above also shows a way to set the -contents of an :class:`NDArray`. - -.. code-block:: julia - - a = mx.empty(2,3) - a[:] = 0.5 # set all elements to a scalar - a[:] = rand(size(a)) # set contents with a Julia Array - copy!(a, rand(size(a))) # set value by copying a Julia Array - b = mx.empty(size(a)) - b[:] = a # copying and assignment between NDArrays - -Note due to the intrinsic design of the Julia language, a normal assignment - -.. code-block:: julia - - a = b - -does **not** mean copying the contents of ``b`` to ``a``. Instead, it just make -the variable ``a`` pointing to a new object, which is ``b``. Similarly, inplace arithmetics does not work as expected: - -.. 
code-block:: julia - - a = mx.ones(2) - r = a # keep a reference to a - b = mx.ones(2) - a += b # translates to a = a + b - println(copy(a)) - # => Float32[2.0f0,2.0f0] - println(copy(r)) - # => Float32[1.0f0,1.0f0] - -As we can see, ``a`` has expected value, but instead of inplace updating, a new -:class:`NDArray` is created and ``a`` is set to point to this new object. If we look -at ``r``, which still reference to the old ``a``, its content has not changed. -There is currently no way in Julia to overload the operators like ``+=`` to get customized behavior. - -Instead, you will need to write ``a[:] = a+b``, or if you want *real* inplace -``+=`` operation, MXNet.jl provides a simple macro ``@mx.inplace``: - -.. code-block:: julia - - @mx.inplace a += b - macroexpand(:(@mx.inplace a += b)) - # => :(MXNet.mx.add_to!(a,b)) - -As we can see, it translate the ``+=`` operator to an explicit ``add_to!`` -function call, which invokes into libmxnet to add the contents of ``b`` into -``a`` directly. For example, the following is the update rule in the SGD -``Optimizer`` (both ``grad`` and ``weight`` are :class:`NDArray` objects): - -.. code-block:: julia - - @inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) - -Note there is no much magic in ``mx.inplace``: it only does a shallow -translation. In the SGD update rule example above, the computation like scaling -the gradient by ``grad_scale`` and adding the weight decay all create temporary -:class:`NDArray` objects. To mitigate this issue, libmxnet has a customized memory -allocator designed specifically to handle this kind of situations. The following -snippet does a simple benchmark on allocating temp :class:`NDArray` vs. pre-allocating: - -.. 
code-block:: julia - - using Benchmark - using MXNet - - N_REP = 1000 - SHAPE = (128, 64) - CTX = mx.cpu() - LR = 0.1 - - function inplace_op() - weight = mx.zeros(SHAPE, CTX) - grad = mx.ones(SHAPE, CTX) - - # pre-allocate temp objects - grad_lr = mx.empty(SHAPE, CTX) - - for i = 1:N_REP - copy!(grad_lr, grad) - @mx.inplace grad_lr .*= LR - @mx.inplace weight -= grad_lr - end - return weight - end - - function normal_op() - weight = mx.zeros(SHAPE, CTX) - grad = mx.ones(SHAPE, CTX) - - for i = 1:N_REP - weight[:] -= LR * grad - end - return weight - end - - # make sure the results are the same - @assert(maximum(abs(copy(normal_op() - inplace_op()))) < 1e-6) - - println(compare([inplace_op, normal_op], 100)) - -The comparison on my laptop shows that ``normal_op`` while allocating a lot of -temp :class:`NDArray` in the loop (the performance gets worse when increasing -``N_REP``), is only about twice slower than the pre-allocated one. - -+-----+--------------+-----------+----------+--------------+ -| Row | Function | Average | Relative | Replications | -+=====+==============+===========+==========+==============+ -| 1 | "inplace_op" | 0.0074854 | 1.0 | 100 | -+-----+--------------+-----------+----------+--------------+ -| 2 | "normal_op" | 0.0174202 | 2.32723 | 100 | -+-----+--------------+-----------+----------+--------------+ - -So it will usually not be a big problem unless you are at the bottleneck of the computation. - -Distributed Key-value Store -~~~~~~~~~~~~~~~~~~~~~~~~~~~ - -The type ``KVStore`` and related methods are used for data sharing across -different devices or machines. It provides a simple and efficient -integer - :class:`NDArray` key-value storage system that each device can pull or push. - -The following example shows how to create a local ``KVStore``, initialize a value and then pull it back. - -.. 
code-block:: julia - - kv = mx.KVStore(:local) - shape = (2,3) - key = 3 - - mx.init!(kv, key, mx.ones(shape)*2) - a = mx.empty(shape) - mx.pull!(kv, key, a) # pull value into a - println(copy(a)) - # => - # Float32[2.0 2.0 2.0 - # 2.0 2.0 2.0] - -Intermediate Level Interface ----------------------------- - -Symbols and Composition -~~~~~~~~~~~~~~~~~~~~~~~ - -The way we build deep learning models in MXNet.jl is to use the powerful -symbolic composition system. It is like `Theano -`_, except that we avoided long -expression compiliation time by providing *larger* neural network related -building blocks to guarantee computation performance. See also `this note -`_ for the design and trade-off of the MXNet symbolic composition system. - -The basic type is ``mx.Symbol``. The following is a trivial example of composing -two symbols with the ``+`` operation. - -.. code-block:: julia - - A = mx.Variable(:A) - B = mx.Variable(:B) - C = A + B - -We get a new *symbol* by composing existing *symbols* by some *operations*. A hierarchical architecture of a deep neural network could be realized by recursive composition. For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of 128 units and a ReLU activation function. - -.. code-block:: julia - - net = mx.Variable(:data) - net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) - net = mx.Activation(data=net, name=:relu1, act_type=:relu) - net = mx.FullyConnected(data=net, name=:fc2, num_hidden=64) - net = mx.Softmax(data=net, name=:out) - -Each time we take the previous symbol, and compose with an operation. Unlike the -simple ``+`` example above, the *operations* here are "bigger" ones, that correspond to common computation layers in deep neural networks. - -Each of those operation takes one or more input symbols for composition, with -optional hyper-parameters (e.g. ``num_hidden``, ``act_type``) to further customize the composition results. 
- -When applying those operations, we can also specify a ``name`` for the result symbol. This is convenient if we want to refer to this symbol later on. If not supplied, a name will be automatically generated. - -Each symbol takes some arguments. For example, in the ``+`` case above, to -compute the value of ``C``, we will need to know the values of the two inputs -``A`` and ``B``. For neural networks, the arguments are primarily two categories: *inputs* and *parameters*. *inputs* are data and labels for the networks, while *parameters* are typically trainable *weights*, *bias*, *filters*. - -When composing symbols, their arguments accumulates. We can list all the arguments by - -.. code-block:: julia - - julia> mx.list_arguments(net) - 6-element Array{Symbol,1}: - :data # Input data, name from the first data variable - :fc1_weight # Weights of the fully connected layer named :fc1 - :fc1_bias # Bias of the layer :fc1 - :fc2_weight # Weights of the layer :fc2 - :fc2_bias # Bias of the layer :fc2 - :out_label # Input label, required by the softmax layer named :out - -Note the names of the arguments are generated according to the provided name for each layer. We can also specify those names explicitly: - -.. code-block:: julia - - net = mx.Variable(:data) - w = mx.Variable(:myweight) - net = mx.FullyConnected(data=data, weight=w, name=:fc1, num_hidden=128) - mx.list_arguments(net) - # => - # 3-element Array{Symbol,1}: - # :data - # :myweight - # :fc1_bias - -The simple fact is that a ``Variable`` is just a placeholder ``mx.Symbol``. In composition, we can use arbitrary symbols for arguments. For example: - -.. 
code-block:: julia - - net = mx.Variable(:data) - net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) - net2 = mx.Variable(:data2) - net2 = mx.FullyConnected(data=net2, name=:net2, num_hidden=128) - mx.list_arguments(net2) - # => - # 3-element Array{Symbol,1}: - # :data2 - # :net2_weight - # :net2_bias - composed_net = net2(data2=net, name=:composed) - mx.list_arguments(composed_net) - # => - # 5-element Array{Symbol,1}: - # :data - # :fc1_weight - # :fc1_bias - # :net2_weight - # :net2_bias - -Note we use a composed symbol, ``net`` as the argument ``data2`` for ``net2`` to -get a new symbol, which we named ``:composed``. It also shows that a symbol itself is a call-able object, which can be invoked to fill in missing arguments and get more complicated symbol compositions. - -Shape Inference -~~~~~~~~~~~~~~~ - -Given enough information, the shapes of all arguments in a composed symbol could -be inferred automatically. For example, given the input shape, and some -hyper-parameters like ``num_hidden``, the shapes for the weights and bias in a neural network could be inferred. - -.. code-block:: julia - - net = mx.Variable(:data) - net = mx.FullyConnected(data=net, name=:fc1, num_hidden=10) - arg_shapes, out_shapes, aux_shapes = mx.infer_shape(net, data=(10, 64)) - -The returned shapes corresponds to arguments with the same order as returned by -``mx.list_arguments``. The ``out_shapes`` are shapes for outputs, and -``aux_shapes`` can be safely ignored for now. - -.. code-block:: julia - - for (n,s) in zip(mx.list_arguments(net), arg_shapes) - println("$n => $s") - end - # => - # data => (10,64) - # fc1_weight => (10,10) - # fc1_bias => (10,) - for (n,s) in zip(mx.list_outputs(net), out_shapes) - println("$n => $s") - end - # => - # fc1_output => (10,64) - - -Binding and Executing -~~~~~~~~~~~~~~~~~~~~~ - -In order to execute the computation graph specified a composed symbol, we will -*bind* the free variables to concrete values, specified as ``mx.NDArray``. 
This -will create an ``mx.Executor`` on a given ``mx.Context``. A context describes the computation devices (CPUs, GPUs, etc.) and an executor will carry out the computation (forward/backward) specified in the corresponding symbolic composition. - -.. code-block:: julia - - A = mx.Variable(:A) - B = mx.Variable(:B) - C = A .* B - a = mx.ones(3) * 4 - b = mx.ones(3) * 2 - c_exec = mx.bind(C, context=mx.cpu(), args=Dict(:A => a, :B => b)) - - mx.forward(c_exec) - copy(c_exec.outputs[1]) # copy turns NDArray into Julia Array - # => - # 3-element Array{Float32,1}: - # 8.0 - # 8.0 - # 8.0 - -For neural networks, it is easier to use ``simple_bind``. By providing the shape -for input arguments, it will perform a shape inference for the rest of the -arguments and create the :class:`NDArray` automatically. In practice, the binding and -executing steps are hidden under the ``Model`` interface. - -**TODO** Provide pointers to model tutorial and further details about binding and symbolic API. - - -High Level Interface --------------------- - -The high level interface include model training and prediction API, etc. 
From d7d4d9028e8e63d339ed2dd48c9026ab72a0683c Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 13 Jul 2016 06:31:50 +0900 Subject: [PATCH 352/630] finish mkdocs support --- docs/mkdocs.yml | 41 ++++++++++++++++++++++++++ docs/src/api/{ndarry.md => ndarray.md} | 0 docs/src/index.md | 23 ++++++++++++--- docs/src/tutorial.md | 0 docs/src/user-guide.md | 0 5 files changed, 60 insertions(+), 4 deletions(-) create mode 100644 docs/mkdocs.yml rename docs/src/api/{ndarry.md => ndarray.md} (100%) delete mode 100644 docs/src/tutorial.md delete mode 100644 docs/src/user-guide.md diff --git a/docs/mkdocs.yml b/docs/mkdocs.yml new file mode 100644 index 000000000000..287119257604 --- /dev/null +++ b/docs/mkdocs.yml @@ -0,0 +1,41 @@ +site_name: MXNet.jl +repo_url: https://github.com/dmlc/MXNet.jl + +theme: readthedocs + +extra_css: + - assets/Documenter.css + +extra_javascript: + - https://cdn.mathjax.org/mathjax/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML + - assets/mathjaxhelper.js + +markdown_extensions: + - extra + - tables + - fenced_code + +docs_dir: 'build' + +pages: + - Home: index.md + - Tutorial: + - Digit Recognition on MNIST: tutorial/mnist.md + - Generating Random Sentence with LSTM RNN: tutorial/char-lstm.md + - User Guide: + - Installation Guide: user-guide/install.md + - Overview: user-guide/overview.md + - FAQ: user-guide/faq.md + - API Documentation: + - Context: api/context.md + - Models: api/model.md + - Initializers: api/initializer.md + - Optimizers: api/optimizer.md + - Callbacks in training: api/callback.md + - Evaluation Metrics: api/metric.md + - Data Providers: api/io.md + - NDArray API: api/ndarray.md + - Symbolic API: api/symbolic-node.md + - Neural Networks Factory: api/nn-factory.md + - Executor: api/executor.md + - Network Visualization: api/visualize.md diff --git a/docs/src/api/ndarry.md b/docs/src/api/ndarray.md similarity index 100% rename from docs/src/api/ndarry.md rename to docs/src/api/ndarray.md diff --git a/docs/src/index.md
b/docs/src/index.md index 0ad69711e41c..93e3fa49660a 100644 --- a/docs/src/index.md +++ b/docs/src/index.md @@ -1,8 +1,8 @@ # MXNet Documentation -[`MXNet.jl`](https://github.com/dmlc/MXNet.jl>) is the -[`Julia`](http://julialang.org/) package of -[`dmlc/mxnet`](https://github.com/dmlc/mxnet). `MXNet.jl` brings flexible and efficient GPU +[MXNet.jl](https://github.com/dmlc/MXNet.jl) is the +[Julia](http://julialang.org/) package of +[dmlc/mxnet](https://github.com/dmlc/mxnet). `MXNet.jl` brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of features include: @@ -12,7 +12,22 @@ include: For more details, see documentation below. Please also checkout the [examples](https://github.com/dmlc/MXNet.jl/tree/master/examples) directory. +## Tutorials + +```@contents +Pages = ["tutorial/mnist.md", "tutorial/char-lstm.md"] +Depth = 2 +``` + +## User's Guide + ```@contents -Pages = ["tutorial.md", "user-guide.md", "api.md"] +Pages = ["user-guide/install.md", "user-guide/overview.md", "user-guide/faq.md"] Depth = 2 ``` + +## API Documentation + +```@contents +Pages = ["api/context.md", "api/model.md", "api/initializer.md", "api/optimizer.md", "api/callback.md", "api/metric.md", "api/io.md", "api/ndarray.md", "api/symbolic-node.md", "api/nn-factory.md", "api/executor.md", "api/visualize.md"] +``` diff --git a/docs/src/tutorial.md b/docs/src/tutorial.md deleted file mode 100644 index e69de29bb2d1..000000000000 diff --git a/docs/src/user-guide.md b/docs/src/user-guide.md deleted file mode 100644 index e69de29bb2d1..000000000000 From 3dbec0f8d66b8d8bf617f2f6cfd35bfb0ada25f0 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 19 Jul 2016 03:52:06 +0900 Subject: [PATCH 353/630] cleanup docs --- docs/src/tutorial/char-lstm.md | 14 +++++------- docs/src/tutorial/mnist.md | 39 ++++++++++++++++----------------- docs/src/user-guide/install.md | 4 ++-- docs/src/user-guide/overview.md | 34 ++++++++++++++-------------- 4 files
changed, 44 insertions(+), 47 deletions(-) diff --git a/docs/src/tutorial/char-lstm.md b/docs/src/tutorial/char-lstm.md index 5c20c8f05830..369bcddd53e9 100644 --- a/docs/src/tutorial/char-lstm.md +++ b/docs/src/tutorial/char-lstm.md @@ -16,7 +16,7 @@ We will be using fixed-length input sequence for training. The code is adapted from the [char-rnn example for MXNet's Python binding](https://github.com/dmlc/mxnet/blob/master/example/rnn/char_lstm.ipynb), which demonstrates how to use low-level -symbolic APIs </api/symbolic-node> to build customized neural +[Symbolic API](@ref) to build customized neural network models directly. The most important code snippets of this example is shown and explained @@ -30,8 +30,7 @@ example. LSTM Cells ---------- -Christopher Olah has a [great blog post about -LSTM](http://colah.github.io/posts/2015-08-Understanding-LSTMs/) with +Christopher Olah has a [great blog post about LSTM](http://colah.github.io/posts/2015-08-Understanding-LSTMs/) with beautiful and clear illustrations. So we will not repeat the definition and explanation of what an LSTM cell is here. Basically, an LSTM cell takes input `x`, as well as previous states (including `c` and `h`), and @@ -116,8 +115,7 @@ character is then encoded as a vector of 0s on all coordinates, and 1 on the coordinate corresponding to that character. The character-to-coordinate mapping is giving by the vocabulary. -The text sequence data provider implement the data provider API -</api/io>. We define the `CharSeqProvider` as below: +The text sequence data provider implements the [Data Providers](@ref) api. We define the `CharSeqProvider` as below: The provided data and labels follow the naming convention of inputs used when unrolling the LSTM. Note in the code below, apart from @@ -128,7 +126,7 @@ we will feed the initial states for each sequence from the data provider. Since the initial states is always zero, we just need to always provide constant zero blobs. 
-Next we implement the AbstractDataProvider.eachbatch interface for the +Next we implement the `eachbatch` method from the [`mx.AbstractDataProvider`](@ref) interface for the provider. We start by defining the data and label arrays, and the `DataBatch` object we will provide in each iteration. @@ -163,7 +161,7 @@ Note we are also using a customized `NLL` evaluation metric, which calculate the negative log-likelihood during training. Here is an output sample at the end of the training process. -``` {.sourceCode .text} +``` ... INFO: Speed: 357.72 samples/sec INFO: == Epoch 020 ========== @@ -227,7 +225,7 @@ trained for around half an hour on the Shakespeare dataset. Note all the line-breaks, punctuations and upper-lower case letters are produced by the sampler itself. I did not do any post-processing. -``` {.sourceCode .text} +``` ## Sample 1 all have sir, Away will fill'd in His time, I'll keep her, do not madam, if they here? Some more ha? diff --git a/docs/src/tutorial/mnist.md b/docs/src/tutorial/mnist.md index b4e7a3be89ee..8282f48ac8ca 100644 --- a/docs/src/tutorial/mnist.md +++ b/docs/src/tutorial/mnist.md @@ -14,7 +14,7 @@ Simple 3-layer MLP This is a tiny 3-layer MLP that could be easily trained on CPU. The script starts with -``` {.sourceCode .julia} +```julia using MXNet ``` @@ -22,7 +22,7 @@ to load the `MXNet` module. Then we are ready to define the network architecture via the symbolic API </user-guide/overview>. We start with a placeholder `data` symbol, -``` {.sourceCode .julia} +```julia data = mx.Variable(:data) ``` @@ -39,16 +39,16 @@ fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) Note each composition we take the previous symbol as the data argument, forming a feedforward chain. The architecture looks like -``` {.sourceCode .julia} +``` Input --> 128 units (ReLU) --> 64 units (ReLU) --> 10 units ``` where the last 10 units correspond to the 10 output classes (digits -0,...,9). 
We then add a final SoftmaxOutput operation to turn the +0,...,9). We then add a final `SoftmaxOutput` operation to turn the 10-dimensional prediction to proper probability values for the 10 classes: -``` {.sourceCode .julia} +```julia mlp = mx.SoftmaxOutput(data = fc3, name=:softmax) ``` @@ -56,7 +56,7 @@ As we can see, the MLP is just a chain of layers. For this case, we can also use the `mx.chain` macro. The same architecture above can be defined as -``` {.sourceCode .julia} +```julia mlp = @mx.chain mx.Variable(:data) => mx.FullyConnected(name=:fc1, num_hidden=128) => mx.Activation(name=:relu1, act_type=:relu) => @@ -73,14 +73,14 @@ could automatically download the dataset into construct the data provider into `mnist-data.jl` so that it could be shared by both the MLP example and the LeNet ConvNets example. -``` {.sourceCode .julia} +```julia batch_size = 100 include("mnist-data.jl") train_provider, eval_provider = get_mnist_providers(batch_size) ``` If you need to write your own data providers for customized data format, -please refer to AbstractDataProvider. +please refer to [`mx.AbstractDataProvider`](@ref). Given the architecture and data, we can instantiate an *model* to do the actual training. `mx.FeedForward` is the built-in model that is suitable @@ -89,7 +89,7 @@ also specify the *context* on which the computation should be carried out. Because this is a really tiny MLP, we will just run on a single CPU device. -``` {.sourceCode .julia} +```julia model = mx.FeedForward(mlp, context=mx.cpu()) ``` @@ -102,7 +102,7 @@ The last thing we need to specify is the optimization algorithm (a.k.a. *optimizer*) to use. We use the basic SGD with a fixed learning rate 0.1 and momentum 0.9: -``` {.sourceCode .julia} +```julia optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) ``` @@ -110,13 +110,13 @@ Now we can do the training. Here the `n_epoch` parameter specifies that we want to train for 20 epochs. 
We also supply a `eval_data` to monitor validation accuracy on the validation set. -``` {.sourceCode .julia} +```julia mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) ``` Here is a sample output -``` {.sourceCode .text} +``` INFO: Start training on [CPU0] INFO: Initializing parameters... INFO: Creating KVStore... @@ -143,7 +143,7 @@ that involves convolution and pooling. This architecture for the MNIST is usually called the \[LeNet\]\_. The first part of the architecture is listed below: -``` {.sourceCode .julia} +```julia # input data = mx.Variable(:data) @@ -168,7 +168,7 @@ a tensor of shape `(28,28,1,100)`. The convolution and pooling operates in the spatial axis, so `kernel=(5,5)` indicate a square region of 5-width and 5-height. The rest of the architecture follows as: -``` {.sourceCode .julia} +```julia # first fully-connected fc1 = @mx.chain mx.Flatten(data=conv2) => mx.FullyConnected(num_hidden=500) => @@ -189,7 +189,7 @@ before connecting it to the `FullyConnected` operator. The rest of the network is the same as the previous MLP example. As before, we can now load the MNIST dataset: -``` {.sourceCode .julia} +```julia batch_size = 100 include("mnist-data.jl") train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) @@ -200,8 +200,7 @@ tensors instead of 2D matrices because the convolution operators needs correct spatial shape information. We then construct a feedforward model on GPU, and train it. -``` {.sourceCode .julia} -#-------------------------------------------------------------------------------- +```julia # fit model model = mx.FeedForward(lenet, context=mx.gpu()) @@ -214,7 +213,7 @@ mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) And here is a sample of running outputs: -``` {.sourceCode .text} +``` INFO: == Epoch 001 ========== INFO: ## Training summary INFO: :accuracy = 0.6750 @@ -237,14 +236,14 @@ Predicting with a trained model is very simple.
By calling `mx.predict` with the model and a data provider, we get the model output as a Julia Array: -``` {.sourceCode .julia} +```julia probs = mx.predict(model, eval_provider) ``` The following code shows a stupid way of getting all the labels from the data provider, and compute the prediction accuracy manually: -``` {.sourceCode .julia} +```julia # collect all labels from eval data labels = Array[] for batch in eval_provider diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md index 9c66a84204da..fe586c248da3 100644 --- a/docs/src/user-guide/install.md +++ b/docs/src/user-guide/install.md @@ -6,14 +6,14 @@ Automatic Installation To install MXNet.jl, simply type -``` {.sourceCode .julia} +```julia Pkg.add("MXNet") ``` in the Julia REPL. Or to use the latest git version of MXNet.jl, use the following command instead -``` {.sourceCode .julia} +```julia Pkg.checkout("MXNet") ``` diff --git a/docs/src/user-guide/overview.md b/docs/src/user-guide/overview.md index 6197fc417a7e..691ab93e9acb 100644 --- a/docs/src/user-guide/overview.md +++ b/docs/src/user-guide/overview.md @@ -10,7 +10,7 @@ names in the Julia Base module, we wrap them all in a `mx` module. The convention of accessing the MXNet.jl interface is the to use the `mx.` prefix explicitly: -``` {.sourceCode .julia} +```julia using MXNet x = mx.zeros(2,3) # MXNet NDArray @@ -69,7 +69,7 @@ Most of the convenient functions like `size`, `length`, `ndims`, `eltype` on array objects should work out-of-the-box. Although indexing is not supported, it is possible to take *slices*: -``` {.sourceCode .julia} +```julia a = mx.ones(2,3) b = mx.slice(a, 1:2) b[:] = 2 @@ -84,7 +84,7 @@ NDArray object. A slice is always a contiguous piece of memory, so only slicing on the *last* dimension is supported. The example above also shows a way to set the contents of an NDArray. 
-``` {.sourceCode .julia} +```julia a = mx.empty(2,3) a[:] = 0.5 # set all elements to a scalar a[:] = rand(size(a)) # set contents with a Julia Array @@ -96,7 +96,7 @@ b[:] = a # copying and assignment between NDArrays Note due to the intrinsic design of the Julia language, a normal assignment -``` {.sourceCode .julia} +```julia a = b ``` @@ -104,7 +104,7 @@ does **not** mean copying the contents of `b` to `a`. Instead, it just make the variable `a` pointing to a new object, which is `b`. Similarly, inplace arithmetics does not work as expected: -``` {.sourceCode .julia} +```julia a = mx.ones(2) r = a # keep a reference to a b = mx.ones(2) @@ -124,7 +124,7 @@ operators like `+=` to get customized behavior. Instead, you will need to write `a[:] = a+b`, or if you want *real* inplace `+=` operation, MXNet.jl provides a simple macro `@mx.inplace`: -``` {.sourceCode .julia} +```julia @mx.inplace a += b macroexpand(:(@mx.inplace a += b)) # => :(MXNet.mx.add_to!(a,b)) @@ -135,7 +135,7 @@ function call, which invokes into libmxnet to add the contents of `b` into `a` directly. For example, the following is the update rule in the SGD `Optimizer` (both `grad` and `weight` are NDArray objects): -``` {.sourceCode .julia} +```julia @inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) ``` @@ -147,7 +147,7 @@ customized memory allocator designed specifically to handle this kind of situations. The following snippet does a simple benchmark on allocating temp NDArray vs. pre-allocating: -``` {.sourceCode .julia} +```julia using Benchmark using MXNet @@ -210,7 +210,7 @@ push. The following example shows how to create a local `KVStore`, initialize a value and then pull it back. -``` {.sourceCode .julia} +```julia kv = mx.KVStore(:local) shape = (2,3) key = 3 @@ -241,7 +241,7 @@ design and trade-off of the MXNet symbolic composition system. The basic type is `mx.Symbol`. The following is a trivial example of composing two symbols with the `+` operation. 
-``` {.sourceCode .julia} +```julia A = mx.Variable(:A) B = mx.Variable(:B) C = A + B @@ -253,7 +253,7 @@ be realized by recursive composition. For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of 128 units and a ReLU activation function. -``` {.sourceCode .julia} +```julia net = mx.Variable(:data) net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) net = mx.Activation(data=net, name=:relu1, act_type=:relu) @@ -284,7 +284,7 @@ the networks, while *parameters* are typically trainable *weights*, When composing symbols, their arguments accumulates. We can list all the arguments by -``` {.sourceCode .julia} +```julia julia> mx.list_arguments(net) 6-element Array{Symbol,1}: :data # Input data, name from the first data variable @@ -298,7 +298,7 @@ julia> mx.list_arguments(net) Note the names of the arguments are generated according to the provided name for each layer. We can also specify those names explicitly: -``` {.sourceCode .julia} +```julia net = mx.Variable(:data) w = mx.Variable(:myweight) net = mx.FullyConnected(data=data, weight=w, name=:fc1, num_hidden=128) @@ -313,7 +313,7 @@ mx.list_arguments(net) The simple fact is that a `Variable` is just a placeholder `mx.Symbol`. In composition, we can use arbitrary symbols for arguments. For example: -``` {.sourceCode .julia} +```julia net = mx.Variable(:data) net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) net2 = mx.Variable(:data2) @@ -347,7 +347,7 @@ symbol could be inferred automatically. For example, given the input shape, and some hyper-parameters like `num_hidden`, the shapes for the weights and bias in a neural network could be inferred. 
-``` {.sourceCode .julia} +```julia net = mx.Variable(:data) net = mx.FullyConnected(data=net, name=:fc1, num_hidden=10) arg_shapes, out_shapes, aux_shapes = mx.infer_shape(net, data=(10, 64)) @@ -357,7 +357,7 @@ The returned shapes corresponds to arguments with the same order as returned by `mx.list_arguments`. The `out_shapes` are shapes for outputs, and `aux_shapes` can be safely ignored for now. -``` {.sourceCode .julia} +```julia for (n,s) in zip(mx.list_arguments(net), arg_shapes) println("$n => $s") end @@ -381,7 +381,7 @@ A context describes the computation devices (CPUs, GPUs, etc.) and an executor will carry out the computation (forward/backward) specified in the corresponding symbolic composition. -``` {.sourceCode .julia} +```julia A = mx.Variable(:A) B = mx.Variable(:B) C = A .* B From c74594f6f27eae02936d2265a243ce9f208e7395 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 2 Aug 2016 02:14:13 +0900 Subject: [PATCH 354/630] enable travis to build docs --- .travis.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/.travis.yml b/.travis.yml index 9f08e176eed2..1f827371a6a8 100644 --- a/.travis.yml +++ b/.travis.yml @@ -37,3 +37,6 @@ script: after_success: - source $TRAVIS/run_coverage.sh + - julia -e 'Pkg.add("Documenter")' + - julia -e 'cd(Pkg.dir("PACKAGE_NAME")); include(joinpath("docs", "make.jl"))' + From 85ec1112333a5dd6432c6a54b1308feea4d2a3b4 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 2 Aug 2016 03:24:46 +0900 Subject: [PATCH 355/630] finalize mkdocs setup --- docs/make.jl | 8 +++++++- docs/mkdocs.yml | 9 ++++++++- 2 files changed, 15 insertions(+), 2 deletions(-) diff --git a/docs/make.jl b/docs/make.jl index f5569035bc69..06bbef0466cd 100644 --- a/docs/make.jl +++ b/docs/make.jl @@ -1,5 +1,11 @@ using Documenter, MXNet makedocs( - modules = [MXNet] + modules = MXNet, + doctest = false +) + +deploydocs( + deps = Deps.pip("pygments", "mkdocs", "mkdocs-material", "python-markdown-math"), + repo = 
"github.com/dmlc/MXNet.jl.git", ) diff --git a/docs/mkdocs.yml b/docs/mkdocs.yml index 287119257604..bf604818027e 100644 --- a/docs/mkdocs.yml +++ b/docs/mkdocs.yml @@ -1,7 +1,12 @@ site_name: MXNet.jl repo_url: https://github.com/dmlc/MXNet.jl -theme: readthedocs +theme: material + +extra: + palette: + primary: 'indigo' + accent: 'blue' extra_css: - assets/Documenter.css @@ -14,6 +19,8 @@ markdown_extensions: - extra - tables - fenced_code + - mdx_math + - admonition docs_dir: 'build' From 789bb6b16367c4fd7fc818ff254b2bcba67f40d3 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 2 Aug 2016 11:36:17 -0700 Subject: [PATCH 356/630] setup Documenter.jl --- docs/.documenter.enc | Bin 0 -> 1680 bytes 1 file changed, 0 insertions(+), 0 deletions(-) create mode 100644 docs/.documenter.enc diff --git a/docs/.documenter.enc b/docs/.documenter.enc new file mode 100644 index 0000000000000000000000000000000000000000..48bd92bc4742234f2364e62fe899efdf64a1f5d8 GIT binary patch literal 1680 zcmV;B25rWS<*O0{K{-TA^4}R}MY#~pBnC~nXf)$xi`VgJ=(}CLo z99B@ySk*kZH{=OD%kZt*$@gI0bE~V&8IFr)?w5O6@f*MXO1rRL!8xs5b~i-YSaAz8 z?Oa!ONEJ)LuTIWymjXYs=Oi>jHonzG$sc;Z*bK0{asSaCl)K8Dt9hwefjeLh>CozO zqh;;QUGT7%|V}q;lmM@=0X9JJ!pB?v8#q`2cOu+ zU@YKi4jzn?`JhZiTmUfQFk4;S}Pw~t=F}U z$%Rz&t@nw^pFcHC2L-yI$Y*cB3#7Rxc^W0K%)Ks79+Uzgm`KXYOBtz%nbUK)6W{GD z6vGFcsUm(_XRIWEX3zin!FjO}Sz?&zh2<}q#6!7T#mDR*Upz5b8j3x4wws>0y8d2U zgr4|K1?&yV3gZfVwYp8Mk)r^>44lPXYH~*@OrgnM4=fOdZBZK!f2-)hDy5ti9w|to z3b(Q=|AHjoLA#w>fJ(S+W#2{r*t{_IpAvCG#Dzda4Y6A710Z2cBun5P^+T7Tm*oQd z1GpiOufpgUcuJQvxFw|HHB`nA_*$k*K{RRaP4)YfMu!gzCr!upY4?3CSKuLt4nsHk z7GV%hH^^e+!1|r&n~=xskC>gi03^36$z|~i_qZ2JUcTV%POTl65g}~L$K<+;J@wUSt;2vLL4Ojd?W zBFdaPoa|QQmU>G641cN1B)OdmcaScG-0Zu4 zafkd|kBaQySh0;{(bK&+u)17jYVSCTLTJ3Yud0x;nOIIGq{LUyoxoez_PJcAA=DK< znsoy=qR64tOErR%#{xT9UVX&!%X)SR<|qo_MO@5o2!lje^^fxFuyLo!EM`7@P9Z(`Iqdg=4#^%Q8z=!DfcOz&iz zHt+S7=xTE<>f>P?R*4NHpCz5FiKsVp^Ld zd5$9(3lZ3}iDb`iIty37map_wc;xQPUfE59I#tt(Kp2#wv?ea~%%2gdJ4%Mt(%~9d 
zRHCY}3szlG0?5myNXNw9CBbPl_uoPVNqr%~LyW*k;fnaIS6ZXp9i@{Y}u8$kaBHuAgSBe z29Hcga%%BupHsJhkLpmccg5yF!GveSFS*-xYBpnpNO-TiIzIo+%#)oUKoVD`UI~HO z$TkJN-PR>vZr&d{r9ca1?@0Y3U{V?O`WSuiW!9;0Uh2#KbU_q{C38*|0zxhApkC&X zeUx~}r7VL8qdBHi48~Lh&rPXZviPvjgScMatjU&#pKvk^C8E`Wu{OUd>%v70GDn2S aF;ziPu#v|oq3fM$n|LCvE&l?FaMg<7X*&S` literal 0 HcmV?d00001 From 2c651ff096fd60bee1b8f0c29e42c136358a7240 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 2 Aug 2016 12:10:42 -0700 Subject: [PATCH 357/630] fix documenter config bug --- .travis.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.travis.yml b/.travis.yml index 1f827371a6a8..651ba9640f8b 100644 --- a/.travis.yml +++ b/.travis.yml @@ -38,5 +38,5 @@ script: after_success: - source $TRAVIS/run_coverage.sh - julia -e 'Pkg.add("Documenter")' - - julia -e 'cd(Pkg.dir("PACKAGE_NAME")); include(joinpath("docs", "make.jl"))' + - julia -e 'cd(Pkg.dir("MXNet")); include(joinpath("docs", "make.jl"))' From f442c4916fd107c436d85a02cfd2d8fa4502faad Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 2 Aug 2016 12:57:47 -0700 Subject: [PATCH 358/630] switch doc to new location. 
--- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 855680ae6d1a..bdfbcc3e1148 100644 --- a/README.md +++ b/README.md @@ -2,7 +2,7 @@ [![Build Status](https://travis-ci.org/dmlc/MXNet.jl.svg?branch=master)](https://travis-ci.org/dmlc/MXNet.jl) [![codecov.io](https://codecov.io/github/dmlc/MXNet.jl/coverage.svg?branch=master)](https://codecov.io/github/dmlc/MXNet.jl?branch=master) -[![Documentation Status](https://readthedocs.org/projects/mxnetjl/badge/?version=latest)](http://mxnetjl.readthedocs.org/en/latest/?badge=latest) +[![](https://img.shields.io/badge/docs-latest-blue.svg)](https://dmlc.github.io/MXNet.jl/latest) [![MXNet](http://pkg.julialang.org/badges/MXNet_0.4.svg)](http://pkg.julialang.org/?pkg=MXNet) [![License](http://dmlc.github.io/img/apache2.svg)](LICENSE.md) [![Join the chat at https://gitter.im/dmlc/mxnet](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/dmlc/mxnet?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge) From 79f51e6532b4673d3b7fbbc810a59bb4904c1984 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 2 Aug 2016 12:59:24 -0700 Subject: [PATCH 359/630] fix URL to Windows building instruction (#111) --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 9449c6337102..86c79905b889 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -24,7 +24,7 @@ if !libmxnet_detected @windows_only begin info("Please follow the libmxnet documentation on how to build manually") info("or to install pre-build packages:") - info("http://mxnet.readthedocs.org/en/latest/build.html#building-on-windows") + info("http://mxnet.readthedocs.io/en/latest/how_to/build.html#building-on-windows") error("Automatic building libxmnet on Windows is currently not supported yet.") end From b54620b342b1016a4782eb1ff85c45c9cea77a99 Mon Sep 17 00:00:00 2001 From: Scott Lundberg Date: Wed, 3 Aug 2016 11:13:39 -0700 Subject: 
[PATCH 360/630] Fix broken documentation link. --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index bdfbcc3e1148..06313473c060 100644 --- a/README.md +++ b/README.md @@ -65,4 +65,4 @@ accuracy = 100correct/length(labels) println(mx.format("Accuracy on eval set: {1:.2f}%", accuracy)) ``` -For more details, please refer to the [documentation](http://mxnetjl.readthedocs.org/) and [examples](examples). +For more details, please refer to the [documentation](https://dmlc.github.io/MXNet.jl/latest) and [examples](examples). From a7b1c65b96ba91878d4902cb5b526c5b4640f40d Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 11 Aug 2016 05:44:21 +0900 Subject: [PATCH 361/630] fix deprecations in build.jl --- deps/build.jl | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 86c79905b889..1736bf9eb0a2 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -1,3 +1,4 @@ +using Compat ################################################################################ # First try to detect and load existing libmxnet ################################################################################ @@ -21,7 +22,7 @@ if !libmxnet_detected ################################################################################ # If not found, try to build automatically using BinDeps ################################################################################ - @windows_only begin + if is_windows() info("Please follow the libmxnet documentation on how to build manually") info("or to install pre-build packages:") info("http://mxnet.readthedocs.io/en/latest/how_to/build.html#building-on-windows") @@ -60,7 +61,9 @@ if !libmxnet_detected FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin ChangeDirectory("$_mxdir") `cp make/config.mk config.mk` - @osx_only `cp make/osx.mk config.mk` + if is_apple() + `cp make/osx.mk config.mk` + end `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' 
config.mk` `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` `cp ../../cblas.h include/cblas.h` From 0408e3e7cdfa4c14897fe01ccf36c11da0b10aaa Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 11 Aug 2016 06:15:51 +0900 Subject: [PATCH 362/630] fix String deprecations --- src/base.jl | 2 +- src/executor.jl | 4 ++-- src/io.jl | 10 +++++----- src/kvstore.jl | 2 +- src/ndarray.jl | 11 +++++------ src/symbolic-node.jl | 38 +++++++++++++++++++------------------- src/util.jl | 18 +++++++++--------- 7 files changed, 42 insertions(+), 43 deletions(-) diff --git a/src/base.jl b/src/base.jl index 32968ea0afb6..d35a1bec3818 100644 --- a/src/base.jl +++ b/src/base.jl @@ -43,7 +43,7 @@ function mx_get_last_error() if msg == C_NULL throw(MXError("Failed to get last error message")) end - return @compat String(msg) + return unsafe_string(msg) end "Utility macro to call MXNet API functions" diff --git a/src/executor.jl b/src/executor.jl index edebc79907c7..0bdccc942d22 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -23,7 +23,7 @@ function Executor(hdr :: MX_ExecutorHandle, symbol :: SymbolicNode, ref_hdrs = Ref{Ptr{MX_handle}}(0) @mxcall(:MXExecutorOutputs, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_handle}}), hdr, ref_size, ref_hdrs) - out_hdrs = pointer_to_array(ref_hdrs[], ref_size[]) + out_hdrs = unsafe_wrap(Array, ref_hdrs[], ref_size[]) out_arrays = [NDArray(MX_NDArrayHandle(x)) for x in out_hdrs] arg_names = list_arguments(symbol) @@ -217,5 +217,5 @@ Can be used to get an estimated about the memory cost. 
function debug_str(self :: Executor) s_ref = Ref{Cstring}() @mxcall(:MXExecutorPrint, (MX_handle, Ptr{Cstring}), self.handle, s_ref) - @compat String(s_ref[]) + unsafe_string(s_ref[]) end diff --git a/src/io.jl b/src/io.jl index 0e7d5c22490c..f240388ffbda 100644 --- a/src/io.jl +++ b/src/io.jl @@ -559,7 +559,7 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) - iter_name = Symbol(String(ref_name[])) + iter_name = Symbol(unsafe_wrap(String, ref_name[])) if gen_docs if endswith(string(iter_name), "Iter") @@ -567,7 +567,7 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) else f_desc = "" end - f_desc *= String(ref_desc[]) * "\n\n" + f_desc *= unsafe_string(ref_desc[]) * "\n\n" f_desc *= ":param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data.\n" f_desc *= ":param Base.Symbol label_name: keyword argument, default ``:softmax_label``. " * "The name of the label. Could be ``nothing`` if no label is presented in this dataset.\n\n" @@ -578,8 +578,8 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) defun = quote function $iter_name(; kwargs...) 
- arg_keys = AbstractString[string(k) for (k,v) in kwargs] - arg_vals = AbstractString[dump_mx_param(v) for (k,v) in kwargs] + arg_keys = String[string(k) for (k,v) in kwargs] + arg_vals = String[dump_mx_param(v) for (k,v) in kwargs] ref_hdr = Ref{MX_handle}(0) @mxcall(:MXDataIterCreateIter, (MX_handle, MX_uint, char_pp, char_pp, Ref{MX_handle}), @@ -603,7 +603,7 @@ function _import_io_iterators(;gen_docs::Bool=false) @mxcall(:MXListDataIters, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) n_creators = n_ref[] - h_creators = pointer_to_array(h_ref[], n_creators) + h_creators = unsafe_wrap(Array, h_ref[], n_creators) if gen_docs docs = Dict{Base.Symbol, AbstractString}() diff --git a/src/kvstore.jl b/src/kvstore.jl index bc2e65c6fdd3..03da58197d70 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -87,7 +87,7 @@ end function get_type(self :: KVStore) type_ref = Ref{char_p}(0) @mxcall(:MXKVStoreGetType, (MX_handle, Ref{char_p}), self, type_ref) - return Symbol(@compat String(type_ref[])) + return Symbol(unsafe_wrap(String, type_ref[])) end function get_num_workers(self :: KVStore) diff --git a/src/ndarray.jl b/src/ndarray.jl index dacee56d7281..1d7619a2ad3e 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -251,7 +251,7 @@ function size(arr :: NDArray) ref_shape = Ref{Ptr{MX_uint}}(0) @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), arr, ref_ndim, ref_shape) - tuple(map(Int, flipdim(pointer_to_array(ref_shape[], ref_ndim[]),1))...) + tuple(map(Int, flipdim(unsafe_wrap(Array, ref_shape[], ref_ndim[]),1))...) 
end function size(arr :: NDArray, dim :: Int) size(arr)[dim] @@ -824,8 +824,7 @@ end function try_get_shared(arr :: NDArray) if context(arr).device_type == CPU # try to do data sharing - vec = pointer_to_array(pointer(arr), length(arr)) - return reshape(vec, size(arr)) + return unsafe_wrap(Array, pointer(arr), size(arr)) else # impossible to share, just copying return copy(arr) @@ -876,11 +875,11 @@ function load(filename::AbstractString, ::Type{NDArray}) out_name_size = out_name_size[] out_size = out_size[] if out_name_size == 0 - return [NDArray(MX_NDArrayHandle(hdr)) for hdr in pointer_to_array(out_hdrs[], out_size)] + return [NDArray(MX_NDArrayHandle(hdr)) for hdr in unsafe_wrap(Array, out_hdrs[], out_size)] else @assert out_size == out_name_size - return Dict([(Symbol(@compat String(k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in - zip(pointer_to_array(out_names[], out_size), pointer_to_array(out_hdrs[], out_size))]) + return @compat Dict((Symbol(unsafe_wrap(String, k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in + zip(unsafe_wrap(Array, out_names[], out_size), unsafe_wrap(Array, out_hdrs[], out_size))) end end diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 850379899642..94e7bb10c128 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -55,8 +55,8 @@ macro _list_symbol_info(self, func_name) @mxcall($func_name, (MX_handle, Ref{MX_uint}, Ref{char_pp}), $self, ref_sz, ref_names) narg = ref_sz[] - names = pointer_to_array(ref_names[], narg) - names = [Symbol(@compat String(x)) for x in names] + names = unsafe_wrap(Array, ref_names[], narg) + names = [Symbol(unsafe_wrap(String, x)) for x in names] return names end end @@ -123,13 +123,13 @@ Get attribute attached to this :class:`SymbolicNode` belonging to key. :return: The value belonging to key as a :class:`Nullable`. 
""" function get_attr(self :: SymbolicNode, key :: Symbol) - key_s = @compat String(string(key)) + key_s = string(key) ref_out = Ref{Cstring}() ref_success = Ref{Cint}(-1) @mxcall(:MXSymbolGetAttr, (MX_handle, Cstring, Ref{Cstring}, Ref{Cint}), self, key_s, ref_out, ref_success) if ref_success[] == 1 - return Nullable{String}(@compat String(ref_out[])) + return Nullable{String}(unsafe_string(ref_out[])) else return Nullable{String}() end @@ -147,11 +147,11 @@ function list_attr(self :: SymbolicNode) @mxcall(:MXSymbolListAttrShallow, (MX_handle, Ref{MX_uint}, Ref{char_pp}), self, ref_sz, ref_strings) narg = 2*ref_sz[] - strings = pointer_to_array(ref_strings[], narg) + strings = unsafe_wrap(Array, ref_strings[], narg) out = Dict{Symbol, String}() for i in 1:2:narg - key = Symbol(@compat String(strings[i])) - value = @compat String(strings[i+1]) + key = Symbol(unsafe_wrap(String, strings[i])) + value = unsafe_string(strings[i+1]) # Creates a copy of string out[key] = value end return out @@ -169,11 +169,11 @@ function list_all_attr(self :: SymbolicNode) @mxcall(:MXSymbolListAttr, (MX_handle, Ref{MX_uint}, Ref{char_pp}), self, ref_sz, ref_strings) narg = 2*ref_sz[] - strings = pointer_to_array(ref_strings[], narg) + strings = unsafe_wrap(Array, ref_strings[], narg) out = Dict{Symbol, String}() for i in 1:2:narg - key = Symbol(@compat String(strings[i])) - value = @compat String(strings[i+1]) + key = Symbol(unsafe_wrap(String, strings[i])) + value = unsafe_string(strings[i+1]) out[key] = value end return out @@ -191,8 +191,8 @@ the attributes of a :class:`SymbolicNode` that is already been used somewhere el cause unexpected behavior and inconsistency. 
""" function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) - key_s = @compat String(string(key)) - value_s = @compat String(value) + key_s = string(key) + value_s = String(value) @mxcall(:MXSymbolSetAttr, (MX_handle, Cstring, Cstring), self, key_s, value_s) end @@ -231,10 +231,10 @@ function Group(nodes :: SymbolicNode...) end function _build_shapes(shape_size::MX_uint, shape_ndim::Ptr{MX_uint}, shape_data::Ptr{Ptr{MX_uint}}) - shape_ndim = pointer_to_array(shape_ndim, shape_size) - shape_data = pointer_to_array(shape_data, shape_size) + shape_ndim = unsafe_wrap(Array, shape_ndim, shape_size) + shape_data = unsafe_wrap(Array, shape_data, shape_size) shapes = map(1:shape_size) do i - my_shape = pointer_to_array(shape_data[i], shape_ndim[i]) + my_shape = unsafe_wrap(Array, shape_data[i], shape_ndim[i]) tuple(flipdim(Int[my_shape...],1)...) end convert(Vector{Tuple}, shapes) @@ -332,9 +332,9 @@ function _infer_type(self, keys, arg_type_data) if ref_complete[] == 0 return (nothing, nothing, nothing) else - in_type = pointer_to_array(ref_in_type_data[], ref_in_type_size[]) - out_type = pointer_to_array(ref_out_type_data[], ref_out_type_size[]) - aux_type = pointer_to_array(ref_aux_type_data[], ref_aux_type_size[]) + in_type = unsafe_wrap(Array, ref_in_type_data[], ref_in_type_size[]) + out_type = unsafe_wrap(Array, ref_out_type_data[], ref_out_type_size[]) + aux_type = unsafe_wrap(Array, ref_aux_type_data[], ref_aux_type_size[]) return ([fromTypeFlag(TypeFlag(t)) for t in in_type], [fromTypeFlag(TypeFlag(t)) for t in out_type], [fromTypeFlag(TypeFlag(t)) for t in aux_type]) @@ -528,7 +528,7 @@ Convert a :class:`SymbolicNode` into a JSON string. 
function to_json(self :: SymbolicNode) ref_json = Ref{char_p}(0) @mxcall(:MXSymbolSaveToJSON, (MX_handle, Ref{char_p}), self, ref_json) - return @compat String(ref_json[]) + return unsafe_string(ref_json[]) end """ diff --git a/src/util.jl b/src/util.jl index 13ce10f58a77..402f633a8567 100644 --- a/src/util.jl +++ b/src/util.jl @@ -15,7 +15,7 @@ function get_mnist_ubyte() :train_label => "train-labels-idx1-ubyte", :test_data => "t10k-images-idx3-ubyte", :test_label => "t10k-labels-idx1-ubyte") - filenames = [k => joinpath(mnist_dir, v) for (k,v) in filenames] + filenames = @compat Dict(k => joinpath(mnist_dir, v) for (k,v) in filenames) if !all(isfile, values(filenames)) cd(mnist_dir) do mnist_dir = download("http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip", "mnist.zip") @@ -38,7 +38,7 @@ function get_cifar10() cifar10_dir = joinpath(data_dir, "cifar10") mkpath(cifar10_dir) filenames = Dict(:train => "cifar/train.rec", :test => "cifar/test.rec") - filenames = [k => joinpath(cifar10_dir, v) for (k,v) in filenames] + filenames = @compat Dict(k => joinpath(cifar10_dir, v) for (k,v) in filenames) if !all(isfile, values(filenames)) cd(cifar10_dir) do run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/cifar10.zip`) @@ -63,26 +63,26 @@ end # Internal Utilities ################################################################################ const DOC_EMBED_ANCHOR = "**autogen:EMBED:{1}:EMBED:autogen**" -function _format_typestring(typestr :: AbstractString) +function _format_typestring(typestr :: String) replace(typestr, r"\bSymbol\b", "SymbolicNode") end function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{char_pp}, arg_descs::Ref{char_pp}, remove_dup::Bool=true) param_keys = Set{String}() - arg_names = pointer_to_array(arg_names[], narg) - arg_types = pointer_to_array(arg_types[], narg) - arg_descs = pointer_to_array(arg_descs[], narg) + arg_names = unsafe_wrap(Array, arg_names[], narg) + arg_types = unsafe_wrap(Array, arg_types[], narg) + 
arg_descs = unsafe_wrap(Array, arg_descs[], narg) docstrings = String[] for i = 1:narg - arg_name = @compat String(arg_names[i]) + arg_name = unsafe_string(arg_names[i]) if arg_name ∈ param_keys && remove_dup continue end push!(param_keys, arg_name) - arg_type = _format_typestring(@compat String(arg_types[i])) - arg_desc = @compat String(arg_descs[i]) + arg_type = _format_typestring(unsafe_string(arg_types[i])) + arg_desc = unsafe_string(arg_descs[i]) push!(docstrings, "* `$arg_name::$arg_type`: $arg_desc\n") end return join(docstrings, "\n") From 31459739c244a3d38a69b8f68ee01a893ed9bf60 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 11 Aug 2016 06:27:50 +0900 Subject: [PATCH 363/630] Change back to dict comprehension syntax for v0.4 0.4 doesn't support the generator syntax (even through Compat). This commit should be reverted once we are v0.5 only. --- src/model.jl | 4 ++-- src/ndarray.jl | 4 ++-- src/util.jl | 4 ++-- 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/src/model.jl b/src/model.jl index ac96d047b668..f47d49d1a82d 100644 --- a/src/model.jl +++ b/src/model.jl @@ -385,8 +385,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra train_execs = Array(Executor, num_dev) for i = 1:num_dev - data_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)] - label_shapes = [k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)] + data_shapes = Dict([k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)]) + label_shapes = Dict([k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)]) train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=grad_req, data_shapes..., label_shapes...) 
dbg_str = mx.debug_str(train_execs[i]) info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[i])) diff --git a/src/ndarray.jl b/src/ndarray.jl index 1d7619a2ad3e..5a4bac527d9d 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -878,8 +878,8 @@ function load(filename::AbstractString, ::Type{NDArray}) return [NDArray(MX_NDArrayHandle(hdr)) for hdr in unsafe_wrap(Array, out_hdrs[], out_size)] else @assert out_size == out_name_size - return @compat Dict((Symbol(unsafe_wrap(String, k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in - zip(unsafe_wrap(Array, out_names[], out_size), unsafe_wrap(Array, out_hdrs[], out_size))) + return Dict([(Symbol(unsafe_wrap(String, k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in + zip(unsafe_wrap(Array, out_names[], out_size), unsafe_wrap(Array, out_hdrs[], out_size))]) end end diff --git a/src/util.jl b/src/util.jl index 402f633a8567..73ee877973f3 100644 --- a/src/util.jl +++ b/src/util.jl @@ -15,7 +15,7 @@ function get_mnist_ubyte() :train_label => "train-labels-idx1-ubyte", :test_data => "t10k-images-idx3-ubyte", :test_label => "t10k-labels-idx1-ubyte") - filenames = @compat Dict(k => joinpath(mnist_dir, v) for (k,v) in filenames) + filenames = Dict([k => joinpath(mnist_dir, v) for (k,v) in filenames]) if !all(isfile, values(filenames)) cd(mnist_dir) do mnist_dir = download("http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip", "mnist.zip") @@ -38,7 +38,7 @@ function get_cifar10() cifar10_dir = joinpath(data_dir, "cifar10") mkpath(cifar10_dir) filenames = Dict(:train => "cifar/train.rec", :test => "cifar/test.rec") - filenames = @compat Dict(k => joinpath(cifar10_dir, v) for (k,v) in filenames) + filenames = Dict([k => joinpath(cifar10_dir, v) for (k,v) in filenames]) if !all(isfile, values(filenames)) cd(cifar10_dir) do run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/cifar10.zip`) From 016efd6dc8b002f717c65f093cdac4c4aa2fe650 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 11 Aug 2016 06:55:53 
+0900 Subject: [PATCH 364/630] improve docstrings --- src/ndarray.jl | 6 ++++-- src/util.jl | 7 +++++++ 2 files changed, 11 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 5a4bac527d9d..713b446864ac 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -997,8 +997,10 @@ function _get_function_description(handle :: MX_handle) ref_arg_types, ref_arg_descs, ref_ret_type) name = Symbol(unsafe_wrap(String, ref_name[])) - - desc = unsafe_wrap(String, ref_desc[]) * "\n\n" + signature = _format_signature(Int(ref_narg[]), ref_arg_names) + desc = " " * string(name) * "(" * signature * ")\n\n" + desc *= unsafe_wrap(String, ref_desc[]) * "\n\n" + desc *= "# Arguments\n" desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) return name, desc end diff --git a/src/util.jl b/src/util.jl index 73ee877973f3..5c50d20357e7 100644 --- a/src/util.jl +++ b/src/util.jl @@ -87,3 +87,10 @@ function _format_docstring(narg::Int, arg_names::Ref{char_pp}, arg_types::Ref{ch end return join(docstrings, "\n") end + +function _format_signature(narg::Int, arg_names::Ref{char_pp}) + arg_names = unsafe_wrap(Array, arg_names[], narg) + + return join([unsafe_string(name) for name in arg_names] , ", ") +end + From 50882421bb357a88370c328edc7c5a3aef1d90f5 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 11 Aug 2016 07:04:33 +0900 Subject: [PATCH 365/630] Don't override help for already defined methods --- src/ndarray.jl | 14 +++++++++++--- src/symbolic-node.jl | 11 ++++++++--- 2 files changed, 19 insertions(+), 6 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 713b446864ac..49555b50f09b 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1082,9 +1082,17 @@ macro _import_ndarray_functions() name, desc = _get_function_description(handle) exprs = _get_function_expressions(handle, name) - expr = quote - $(exprs...) 
- @doc $desc $name + # TODO(vchuravy): Fix this in a more elegant way once we only support + # v0.5 + if isdefined(Base, name) || isdefined(name) + expr = quote + $(exprs...) + end + else + expr = quote + $(exprs...) + @doc $desc $name + end end push!(func_exprs, expr) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 94e7bb10c128..bd2dd54c6282 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -675,9 +675,14 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) end func_def = Expr(:function, func_head, Expr(:block, func_body)) - quote - $func_def - @doc $f_desc $func_name + # TODO(vchuravy) find a more elegant solution for v0.5 + if isdefined(Base, func_name) || isdefined(func_name) + return func_def + else + return quote + $func_def + @doc $f_desc $func_name + end end end From 3bc93fe33395c3c571b9ccf96956d579c573f880 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 11 Aug 2016 07:18:29 +0900 Subject: [PATCH 366/630] improve documentation formatting for SymbolicNodes --- src/symbolic-node.jl | 11 +++++++---- 1 file changed, 7 insertions(+), 4 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index bd2dd54c6282..32be8f63a7ea 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -586,14 +586,17 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) kv_nargs_s = unsafe_wrap(String, ref_kv_nargs[]) kv_nargs = Symbol(kv_nargs_s) + signature = _format_signature(Int(ref_nargs[]), ref_arg_names) + f_desc = " " * func_name_s * "(" * signature * ")\n\n" f_desc = unsafe_wrap(String, ref_desc[]) * "\n\n" if !isempty(kv_nargs_s) - f_desc *= "This function support variable length positional :class:`SymbolicNode` inputs.\n\n" + f_desc *= "This function support variable length positional `SymbolicNode` inputs.\n\n" end + f_desc *= "# Arguments\n" f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":param Symbol name: The name of the 
:class:`SymbolicNode`. (e.g. `:my_symbol`), optional.\n" - f_desc *= ":param Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`SymbolicNode`.\n\n" - f_desc *= ":return: $(_format_typestring(unsafe_wrap(String, ref_ret_type[]))).\n\n" + f_desc *= "* `name::Symbol`: The name of the `SymbolicNode`. (e.g. `:my_symbol`), optional.\n" + f_desc *= "* `attrs::Dict{Symbol, AbstractString}`: The attributes associated with this `SymbolicNode`.\n\n" + f_desc *= "Returns `$(_format_typestring(unsafe_wrap(String, ref_ret_type[])))`." # function $func_name(args...; kwargs...) func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) From b328f242028696fe6b21e8db01480b3aff3e9fe1 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 11 Aug 2016 07:45:16 +0900 Subject: [PATCH 367/630] fix deprecation for call --- src/callback.jl | 4 ++-- src/symbolic-node.jl | 5 +++-- 2 files changed, 5 insertions(+), 4 deletions(-) diff --git a/src/callback.jl b/src/callback.jl index 3aca66a7bbf0..c3e1d299403e 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -51,7 +51,7 @@ For example, the :func:`speedometer` callback is defined as function every_n_batch(callback :: Function, n :: Int; call_on_0 :: Bool = false) BatchCallback(n, call_on_0, callback) end -function Base.call(cb :: BatchCallback, state :: OptimizationState) +@compat function (cb :: BatchCallback)(state :: OptimizationState) if state.curr_batch == 0 if cb.call_on_0 cb.callback(state) @@ -107,7 +107,7 @@ A convenient function to construct a callback that runs every ``n`` full data-pa function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end -function Base.call{T<:Real}(cb :: EpochCallback, model :: Any, state :: OptimizationState, metric :: Vector{Tuple{Base.Symbol, T}}) +@compat function (cb :: EpochCallback){T<:Real}(model :: Any, state :: OptimizationState, metric :: Vector{Tuple{Base.Symbol, 
T}}) if state.curr_epoch == 0 if cb.call_on_0 cb.callback(model, state, metric) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 32be8f63a7ea..600bc75b3aeb 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -32,6 +32,7 @@ function Base.copy(self :: SymbolicNode) Base.deepcopy(self) end +# TODO(vchuravy) How to add documentation to the v0.5 style call overloading """ call(self :: SymbolicNode, args :: SymbolicNode...) call(self :: SymbolicNode; kwargs...) @@ -39,11 +40,11 @@ end Make a new node by composing ``self`` with ``args``. Or the arguments can be specified using keyword arguments. """ -function Base.call(self :: SymbolicNode, args :: SymbolicNode...) +@compat function (self::SymbolicNode)(args :: SymbolicNode...) s = deepcopy(self) _compose!(s, args...) end -function Base.call(self :: SymbolicNode; kwargs...) +@compat function (self::SymbolicNode)(;kwargs...) s = deepcopy(self) _compose!(s; kwargs...) end From 2c36a5debbfb7122ea68b65807d7e5a911669fd2 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 11 Aug 2016 07:56:08 +0900 Subject: [PATCH 368/630] nightly is v0.6 --- .travis.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.travis.yml b/.travis.yml index 651ba9640f8b..08c7db10e0ab 100644 --- a/.travis.yml +++ b/.travis.yml @@ -6,6 +6,7 @@ os: - osx julia: - 0.4 + - 0.5 - nightly # dependent apt packages From 63e6063d9d99af2e4b1ecc3108128fe43203cd0e Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 11 Aug 2016 11:37:48 -0700 Subject: [PATCH 369/630] fix Inception URL #113 --- models/Inception/get.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/models/Inception/get.sh b/models/Inception/get.sh index 392403a82703..dfd3701bd0b4 100755 --- a/models/Inception/get.sh +++ b/models/Inception/get.sh @@ -1,4 +1,4 @@ #!/bin/bash -wget -c http://webdocs.cs.ualberta.ca/~bx3/data/Inception.zip +wget -c http://data.dmlc.ml/mxnet/data/Inception.zip unzip Inception.zip From 
513c030fad4a734983a143e51b10630fdf5e658d Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 16 Aug 2016 12:50:37 -0700 Subject: [PATCH 370/630] fix link in doc --- docs/src/index.md | 4 ++-- docs/src/tutorial/mnist.md | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/docs/src/index.md b/docs/src/index.md index 93e3fa49660a..a41b77478631 100644 --- a/docs/src/index.md +++ b/docs/src/index.md @@ -1,8 +1,8 @@ # MXNet Documentation -[MXNet.jl](https://github.com/dmlc/MXNet.jl>) is the +[MXNet.jl](https://github.com/dmlc/MXNet.jl) is the [Julia](http://julialang.org/) package of -[dmlc/mxnet](https://github.com/dmlc/mxnet). `MXNet.jl` brings flexible and efficient GPU +[dmlc/mxnet](https://github.com/dmlc/mxnet). MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of features include: diff --git a/docs/src/tutorial/mnist.md b/docs/src/tutorial/mnist.md index 8282f48ac8ca..3047a9c1d3ca 100644 --- a/docs/src/tutorial/mnist.md +++ b/docs/src/tutorial/mnist.md @@ -19,7 +19,7 @@ using MXNet ``` to load the `MXNet` module. Then we are ready to define the network -architecture via the symbolic API </user-guide/overview>. We start +architecture via the [symbolic API](../user-guide/overview.md). We start with a placeholder `data` symbol, ```julia From 3a7913f18a1ab977ae9bb980c1b78fa85a238dec Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 16 Aug 2016 12:56:00 -0700 Subject: [PATCH 371/630] fix some formatting errors in docs --- docs/src/user-guide/overview.md | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/docs/src/user-guide/overview.md b/docs/src/user-guide/overview.md index 691ab93e9acb..85814cdc63fe 100644 --- a/docs/src/user-guide/overview.md +++ b/docs/src/user-guide/overview.md @@ -192,10 +192,10 @@ lot of temp NDArray in the loop (the performance gets worse when increasing `N_REP`), is only about twice slower than the pre-allocated one. 
- Row Function Average Relative Replications - ------ --------------- ------------ ----------- --------------- - 1 "inplace\_op" 0.0074854 1.0 100 - 2 "normal\_op" 0.0174202 2.32723 100 +| Row | Function | Average | Relative | Replications | +| ------ | --------------- | ------------ | ----------- | --------------- | +| 1 | "inplace\_op" | 0.0074854 | 1.0 | 100 | +| 2 | "normal\_op" | 0.0174202 | 2.32723 | 100 | So it will usually not be a big problem unless you are at the bottleneck of the computation. From 63772b8e1a6685c09085b739fae98ba5243a39d1 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 16 Aug 2016 13:03:07 -0700 Subject: [PATCH 372/630] fix typos in doc --- docs/src/api/nn-factory.md | 2 +- docs/src/user-guide/install.md | 13 ++++++------- 2 files changed, 7 insertions(+), 8 deletions(-) diff --git a/docs/src/api/nn-factory.md b/docs/src/api/nn-factory.md index 41474383aa76..833d9a3efd53 100644 --- a/docs/src/api/nn-factory.md +++ b/docs/src/api/nn-factory.md @@ -1,4 +1,4 @@ -# Neural Network Factora +# Neural Network Factory Neural network factory provide convenient helper functions to define common neural networks. diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md index fe586c248da3..34c532321ef7 100644 --- a/docs/src/user-guide/install.md +++ b/docs/src/user-guide/install.md @@ -24,9 +24,8 @@ libmxnet. The libmxnet source is downloaded to `Pkg.dir("MXNet")/deps/src/mxnet`. The automatic build is using default configurations, with OpenCV, CUDA disabled. If the compilation failed due to unresolved dependency, or if -you want to customize the build, it is recommended to compile and -install libmxnet manually. Please see below <manual-compilation> -for more details. +you want to customize the build, you can compile and +install libmxnet manually. Please see below for more details. Manual Compilation ------------------ @@ -38,8 +37,8 @@ to work with a seperate, maybe customized libmxnet. 
To build libmxnet, please refer to [the installation guide of libmxnet](http://mxnet.readthedocs.org/en/latest/build.html). After -successfully installing libmxnet, set the `MXNET_HOME` environment -variable to the location of libmxnet. In other words, the compiled +successfully installing libmxnet, set the `MXNET_HOME` *environment +variable* to the location of libmxnet. In other words, the compiled `libmxnet.so` should be found in `$MXNET_HOME/lib`. > **note** @@ -61,7 +60,7 @@ following paths (and in that order): - `Pkg.dir("MXNet")/deps/usr/lib`: automatic builds - Any system wide library search path -Note that MXNet.jl will not find `libmxnet.so` even if it is on one of -the paths above if a library it depends upon is missing from the +Note that MXNet.jl can not load `libmxnet.so` even if it is on one of +the paths above in case a library it depends upon is missing from the `LD_LIBRARY_PATH`. Thus, if you are going to compile to add CUDA, the path to the CUDA libraries will have to be added to `LD_LIBRARY_PATH`. 
From 50a294611fc93ef5170318b03b38e76509fc6247 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 18 Aug 2016 11:28:25 +0900 Subject: [PATCH 373/630] documentation cleanup --- docs/src/tutorial/mnist.md | 2 +- src/ndarray.jl | 268 ++++++++++++++++++------------------- src/nn-factory.jl | 17 +-- 3 files changed, 143 insertions(+), 144 deletions(-) diff --git a/docs/src/tutorial/mnist.md b/docs/src/tutorial/mnist.md index 3047a9c1d3ca..096d7dd0310f 100644 --- a/docs/src/tutorial/mnist.md +++ b/docs/src/tutorial/mnist.md @@ -28,7 +28,7 @@ data = mx.Variable(:data) and then cascading fully-connected layers and activation functions: -``` {.sourceCode .julia} +```julia fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) diff --git a/src/ndarray.jl b/src/ndarray.jl index 49555b50f09b..14fdee01564f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -70,13 +70,10 @@ end """ NDArray - Wrapper of the ``NDArray`` type in ``libmxnet``. This is the basic building block - of tensor-based computation. - - .. _ndarray-shape-note: - - .. note:: +Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block +of tensor-based computation. +!!! note since C/C++ use row-major ordering for arrays while Julia follows a column-major ordering. To keep things consistent, we keep the underlying data in their original layout, but use *language-native* convention when we talk @@ -113,7 +110,7 @@ Base.cconvert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) """ context(arr :: NDArray) - Get the context that this :class:`NDArray` lives on. +Get the context that this `NDArray` lives on. """ function context(arr :: NDArray) ref_typeid = Ref{Cint}(0) @@ -130,7 +127,7 @@ end empty(DType, shape :: Tuple) empty(DType, dim1, dim2, ...) - Allocate memory for an uninitialized :class:`NDArray` with a specified type. 
+Allocate memory for an uninitialized `NDArray` with a specified type. """ function empty{N,T<:DType}(::Type{T}, shape :: NTuple{N, Int}) empty(T, shape, cpu()) @@ -148,7 +145,7 @@ end empty(shape :: Tuple) empty(dim1, dim2, ...) - Allocate memory for an uninitialized :class:`NDArray` with specific shape of type Float32. +Allocate memory for an uninitialized `NDArray` with specific shape of type Float32. """ function empty{N}(shape :: NTuple{N, Int}) empty(shape, cpu()) @@ -165,7 +162,7 @@ end zeros(DType, shape :: Tuple) zeros(DType, dim1, dim2, ...) -Create zero-ed :class:`NDArray` with specific shape and type +Create zero-ed `NDArray` with specific shape and type """ function zeros{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}) zeros(T, shape, cpu()) @@ -184,7 +181,7 @@ end zeros(shape :: Tuple) zeros(dim1, dim2, ...) -Create zero-ed :class:`NDArray` with specific shape. +Create zero-ed `NDArray` with specific shape. """ function zeros{N}(shape :: NTuple{N, Int}) zeros(shape, cpu()) @@ -203,7 +200,7 @@ end ones(DType, shape :: Tuple) ones(DType, dim1, dim2, ...) -Create an :class:`NDArray` with specific shape & type, and initialize with 1. +Create an `NDArray` with specific shape & type, and initialize with 1. """ function ones{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}) ones(T, shape, cpu()) @@ -222,7 +219,7 @@ end ones(shape :: Tuple) ones(dim1, dim2, ...) -Create an :class:`NDArray` with specific shape and initialize with 1. +Create an `NDArray` with specific shape and initialize with 1. """ function ones{N}(shape :: NTuple{N, Int}) ones(shape, cpu()) @@ -243,8 +240,8 @@ import Base: size, length, ndims, eltype size(arr :: NDArray) size(arr :: NDArray, dim :: Int) - Get the shape of an :class:`NDArray`. The shape is in Julia's column-major convention. See - also the :ref:`notes on NDArray shapes `. +Get the shape of an `NDArray`. The shape is in Julia's column-major convention. See +also the notes on NDArray shapes [`NDArray`](@ref). 
""" function size(arr :: NDArray) ref_ndim = Ref{MX_uint}(0) @@ -260,7 +257,7 @@ end """ length(arr :: NDArray) - Get the number of elements in an :class:`NDArray`. +Get the number of elements in an `NDArray`. """ function length(arr :: NDArray) prod(size(arr)) @@ -269,7 +266,7 @@ end """ ndims(arr :: NDArray) - Get the number of dimensions of an :class:`NDArray`. Is equivalent to ``length(size(arr))``. +Get the number of dimensions of an `NDArray`. Is equivalent to `length(size(arr))`. """ function ndims(arr :: NDArray) length(size(arr)) @@ -278,7 +275,7 @@ end """ eltype(arr :: NDArray) - Get the element type of an :class:`NDArray`. +Get the element type of an `NDArray`. """ function eltype{T <: Union{NDArray, MX_NDArrayHandle}}(arr :: T) dtype_ref = Ref{Cint}(0) @@ -299,11 +296,11 @@ import Base: slice """ slice(arr :: NDArray, start:stop) - Create a view into a sub-slice of an :class:`NDArray`. Note only slicing at the slowest - changing dimension is supported. In Julia's column-major perspective, this is the last - dimension. For example, given an :class:`NDArray` of shape (2,3,4), ``slice(array, 2:3)`` will create - a :class:`NDArray` of shape (2,3,2), sharing the data with the original array. This operation is - used in data parallelization to split mini-batch into sub-batches for different devices. +Create a view into a sub-slice of an `NDArray`. Note only slicing at the slowest +changing dimension is supported. In Julia's column-major perspective, this is the last +dimension. For example, given an `NDArray` of shape (2,3,4), `slice(array, 2:3)` will create +a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is +used in data parallelization to split mini-batch into sub-batches for different devices. """ function slice(arr :: NDArray, ::Colon) arr @@ -329,13 +326,13 @@ import Base: setindex! """ setindex!(arr :: NDArray, val, idx) - Assign values to an :class:`NDArray`. 
Elementwise assignment is not implemented, only the following - scenarios are supported +Assign values to an `NDArray`. Elementwise assignment is not implemented, only the following +scenarios are supported - - ``arr[:] = val``: whole array assignment, ``val`` could be a scalar or an array (Julia ``Array`` - or :class:`NDArray`) of the same shape. - - ``arr[start:stop] = val``: assignment to a *slice*, ``val`` could be a scalar or an array of - the same shape to the slice. See also :func:`slice`. +* `arr[:] = val`: whole array assignment, `val` could be a scalar or an array (Julia `Array` + or `NDArray`) of the same shape. +* `arr[start:stop] = val`: assignment to a *slice*, `val` could be a scalar or an array of + the same shape to the slice. See also [`slice`](@ref). """ function setindex!(arr :: NDArray, val :: Real, ::Colon) @assert(arr.writable) @@ -356,36 +353,35 @@ import Base: getindex """ getindex(arr :: NDArray, idx) -Shortcut for :func:`slice`. A typical use is to write - - .. code-block:: julia - - arr[:] += 5 +Shortcut for [`slice`](@ref). A typical use is to write - which translates into +```julia + arr[:] += 5 +``` - .. code-block:: julia +which translates into - arr[:] = arr[:] + 5 +```julia + arr[:] = arr[:] + 5 +``` - which furthur translates into +which further translates into - .. code-block:: julia +```julia + setindex!(getindex(arr, Colon()), 5, Colon()) +``` - setindex!(getindex(arr, Colon()), 5, Colon()) - - .. note:: - - The behavior is quite different from indexing into Julia's ``Array``. For example, ``arr[2:5]`` - create a **copy** of the sub-array for Julia ``Array``, while for :class:`NDArray`, this is - a *slice* that shares the memory. +!!! note + The behavior is quite different from indexing into Julia's `Array`. For example, `arr[2:5]` + create a **copy** of the sub-array for Julia `Array`, while for `NDArray`, this is + a *slice* that shares the memory. 
""" function getindex(arr :: NDArray, ::Colon) return arr end """ -Shortcut for `slice`. **NOTE** the behavior for Julia's built-in index slicing is to create a +Shortcut for [`slice`](@ref). **NOTE** the behavior for Julia's built-in index slicing is to create a copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. """ function getindex(arr :: NDArray, idx::UnitRange{Int}) @@ -397,7 +393,7 @@ import Base: copy!, copy, convert .. function:: copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) - Copy contents of ``src`` into ``dst``. +Copy contents of `src` into `dst`. """ function copy!(dst :: NDArray, src :: NDArray) @assert(dst.writable) @@ -441,13 +437,12 @@ end """ -.. function:: - copy(arr :: NDArray) - copy(arr :: NDArray, ctx :: Context) - copy(arr :: Array, ctx :: Context) + copy(arr :: NDArray) + copy(arr :: NDArray, ctx :: Context) + copy(arr :: Array, ctx :: Context) - Create a copy of an array. When no :class:`Context` is given, create a Julia ``Array``. - Otherwise, create an :class:`NDArray` on the specified context. +Create a copy of an array. When no `Context` is given, create a Julia `Array`. +Otherwise, create an `NDArray` on the specified context. """ # Create copy: NDArray -> Julia Array function copy(arr :: NDArray) @@ -470,7 +465,7 @@ end """ convert(::Type{Array{T}}, arr :: NDArray) - Convert an :class:`NDArray` into a Julia ``Array`` of specific type. Data will be copied. +Convert an `NDArray` into a Julia `Array` of specific type. Data will be copied. """ # Convert copy: NDArray -> Julia Array function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) @@ -480,25 +475,25 @@ end """ @inplace -Julia does not support re-definiton of ``+=`` operator (like ``__iadd__`` in python), -When one write ``a += b``, it gets translated to ``a = a+b``. 
``a+b`` will allocate new -memory for the results, and the newly allocated :class:`NDArray` object is then assigned +Julia does not support re-definition of `+=` operator (like `__iadd__` in python). +When one writes `a += b`, it gets translated to `a = a+b`. `a+b` will allocate new +memory for the results, and the newly allocated `NDArray` object is then assigned back to a, while the original contents in a is discarded. This is very inefficient when we want to do inplace update. This macro is a simple utility to implement this behavior. Write - .. code-block:: julia +```julia + @mx.inplace a += b +``` - @mx.inplace a += b +will translate into - will translate into +```julia + mx.add_to!(a, b) +``` - .. code-block:: julia - - mx.add_to!(a, b) - - which will do inplace adding of the contents of ``b`` into ``a``. +which will do inplace adding of the contents of `b` into `a`. """ macro inplace(stmt) if stmt.head == :+= || stmt.head == :.+= @@ -517,7 +512,7 @@ end """ add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) -Add a bunch of arguments into ``dst``. Inplace updating. +Add a bunch of arguments into `dst`. Inplace updating. """ function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) @assert dst.writable @@ -537,8 +532,8 @@ import Base: +, .+ +(args...) .+(args...) -Summation. Multiple arguments of either scalar or :class:`NDArray` could be -added together. Note at least the first or second argument needs to be an :class:`NDArray` to +Summation. Multiple arguments of either scalar or `NDArray` could be +added together. Note at least the first or second argument needs to be an `NDArray` to avoid ambiguity of built-in summation. """ function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) @@ -558,7 +553,7 @@ end """ sub_from!(dst :: NDArray, args :: Union{Real, NDArray}...) - Subtract a bunch of arguments from ``dst``. Inplace updating. +Subtract a bunch of arguments from `dst`. Inplace updating. 
""" function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable @@ -576,8 +571,8 @@ import Base: -, .- -(arg0) .-(arg0, arg1) -Subtraction ``arg0 - arg1``, of scalar types or :class:`NDArray`. Or create -the negative of ``arg0``. +Subtraction `arg0 - arg1`, of scalar types or `NDArray`. Or create +the negative of `arg0`. """ function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) @@ -602,8 +597,8 @@ end """ mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) - Elementwise multiplication into ``dst`` of either a scalar or an :class:`NDArray` of the same shape. - Inplace updating. +Elementwise multiplication into `dst` of either a scalar or an `NDArray` of the same shape. +Inplace updating. """ function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable @@ -620,7 +615,7 @@ import Base: .*, * """ .*(arg0, arg1) -Elementwise multiplication of ``arg0`` and ``arg``, could be either scalar or :class:`NDArray`. +Elementwise multiplication of `arg0` and `arg`, could be either scalar or `NDArray`. """ function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) @@ -633,7 +628,7 @@ end """ *(arg0, arg1) -Currently only multiplication a scalar with an :class:`NDArray` is implemented. Matrix multiplication +Currently only multiplication a scalar with an `NDArray` is implemented. Matrix multiplication is to be added soon. """ function *(arg0 :: NDArray, arg :: Real) @@ -647,7 +642,7 @@ end """ div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) -Elementwise divide a scalar or an :class:`NDArray` of the same shape from ``dst``. Inplace updating. +Elementwise divide a scalar or an `NDArray` of the same shape from `dst`. Inplace updating. 
""" function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable @@ -662,7 +657,7 @@ import Base: ./, / """ ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) -Elementwise dividing an :class:`NDArray` by a scalar or another :class:`NDArray` of the same shape. +Elementwise dividing an `NDArray` by a scalar or another `NDArray` of the same shape. """ function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) @@ -672,7 +667,7 @@ end """ /(arg0 :: NDArray, arg :: Real) -Divide an :class:`NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. +Divide an `NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. """ function /(arg0 :: NDArray, arg :: Real) ./(arg0, arg) @@ -685,42 +680,41 @@ Manipulating as Julia Arrays @nd_as_jl(captures..., statement) - A convenient macro that allows to operate :class:`NDArray` as Julia Arrays. For example, +A convenient macro that allows to operate `NDArray` as Julia Arrays. For example, - .. code-block:: julia +```julia + x = mx.zeros(3,4) + y = mx.ones(3,4) + z = mx.zeros((3,4), mx.gpu()) - x = mx.zeros(3,4) - y = mx.ones(3,4) - z = mx.zeros((3,4), mx.gpu()) - - @mx.nd_as_jl ro=(x,y) rw=z begin - # now x, y, z are just ordinary Julia Arrays - z[:,1] = y[:,2] - z[:,2] = 5 - end - - Under the hood, the macro convert all the declared captures from :class:`NDArray` into Julia - Arrays, by using :func:`try_get_shared`. And automatically commit the modifications back into - the :class:`NDArray` that is declared as ``rw``. This is useful for fast prototyping and when - implement non-critical computations, such as :class:`AbstractEvalMetric`. - - .. note:: - - - Multiple ``rw`` and / or ``ro`` capture declaration could be made. - - The macro does **not** check to make sure that ``ro`` captures are not modified. 
If the - original :class:`NDArray` lives in CPU memory, then it is very likely the corresponding - Julia Array shares data with the :class:`NDArray`, so modifying the Julia Array will also - modify the underlying :class:`NDArray`. - - More importantly, since the :class:`NDArray` is - asynchronized, we will wait for *writing* for ``rw`` variables but wait only for *reading* - in ``ro`` variables. If we write into those ``ro`` variables, **and** if the memory is - shared, racing condition might happen, and the behavior is undefined. - - When an :class:`NDArray` is declared to be captured as ``rw``, its contents is always sync - back in the end. - - The execution results of the expanded macro is always ``nothing``. - - The statements are wrapped in a ``let``, thus locally introduced new variables will not be - available after the statements. So you will need to declare the variables before calling the - macro if needed. + @mx.nd_as_jl ro=(x,y) rw=z begin + # now x, y, z are just ordinary Julia Arrays + z[:,1] = y[:,2] + z[:,2] = 5 + end +``` + +Under the hood, the macro convert all the declared captures from `NDArray` into Julia +Arrays, by using `try_get_shared`. And automatically commit the modifications back into +the `NDArray` that is declared as `rw`. This is useful for fast prototyping and when +implement non-critical computations, such as `AbstractEvalMetric`. + +!!! note +* Multiple `rw` and / or `ro` capture declaration could be made. +* The macro does **not** check to make sure that `ro` captures are not modified. If the + original `NDArray` lives in CPU memory, then it is very likely the corresponding + Julia Array shares data with the `NDArray`, so modifying the Julia Array will also + modify the underlying `NDArray`. +* More importantly, since the `NDArray` is + asynchronized, we will wait for *writing* for `rw` variables but wait only for *reading* + in `ro` variables. 
If we write into those `ro` variables, **and** if the memory is + shared, racing condition might happen, and the behavior is undefined. +* When an `NDArray` is declared to be captured as `rw`, its contents is always sync + back in the end. +* The execution results of the expanded macro is always `nothing`. +* The statements are wrapped in a `let`, thus locally introduced new variables will not be + available after the statements. So you will need to declare the variables before calling the + macro if needed. """ macro nd_as_jl(m_args...) @assert(length(m_args) > 0) @@ -812,14 +806,15 @@ end """ try_get_shared(arr) - Try to create a Julia array by sharing the data with the underlying :class:`NDArray`. +Try to create a Julia array by sharing the data with the underlying `NDArray`. -* NDArray arr: the array to be shared. +# Arguments: +* `arr::NDArray`: the array to be shared. .. warning:: - The returned array does not guarantee to share data with the underlying :class:`NDArray`. - In particular, data sharing is possible only when the :class:`NDArray` lives on CPU. + The returned array does not guarantee to share data with the underlying `NDArray`. + In particular, data sharing is possible only when the `NDArray` lives on CPU. """ function try_get_shared(arr :: NDArray) if context(arr).device_type == CPU @@ -834,10 +829,11 @@ end """ is_shared(j_arr, arr) - Test whether ``j_arr`` is sharing data with ``arr``. +Test whether `j_arr` is sharing data with `arr`. +# Arguments: * Array j_arr: the Julia Array. -* NDArray arr: the :class:`NDArray`. +* NDArray arr: the `NDArray`. """ function is_shared(j_arr :: Array, arr :: NDArray) false @@ -857,13 +853,16 @@ end Load NDArrays from binary file. -* AbstractString filename: the path of the file to load. It could be S3 or HDFS address. - :return: Either ``Dict{Base.Symbol, NDArray}`` or ``Vector{NDArray}``. +# Arguments: +* `filename::String`: the path of the file to load. It could be S3 or HDFS address. 
+ +Returns either `Dict{Symbol, NDArray}` or `Vector{NDArray}`. -If the ``libmxnet`` is built with the corresponding component enabled. Examples -* ``s3://my-bucket/path/my-s3-ndarray`` -* ``hdfs://my-bucket/path/my-hdfs-ndarray`` -* ``/path-to/my-local-ndarray`` +`filename` can point to `s3` or `hdfs` resources if the `libmxnet` is built with the +corresponding components enabled. Examples: +* `s3://my-bucket/path/my-s3-ndarray` +* `hdfs://my-bucket/path/my-hdfs-ndarray` +* `/path-to/my-local-ndarray` """ function load(filename::AbstractString, ::Type{NDArray}) out_size = Ref{MX_uint}(0) @@ -886,12 +885,11 @@ end """ save(filename :: AbstractString, data) -Save NDarrays to binary file. Filename could be S3 or HDFS address, if ``libmxnet`` is built -with corresponding support. +Save NDarrays to binary file. Filename could be S3 or HDFS address, if `libmxnet` is built +with corresponding support (see `load`). -* AbstractString filename: path to the binary file to write to. -* data: data to save to file. - :type data: :class:`NDArray`, or a ``Vector{NDArray}`` or a ``Dict{Base.Symbol, NDArray}``. +* `filename::String`: path to the binary file to write to. +* `data`: data to save to file. Data can be a`NDArray`, a `Vector{NDArray}`, or a `Dict{Base.Symbol, NDArray}`. """ function save(filename::AbstractString, data::NDArray) save(filename, [data]) @@ -928,22 +926,22 @@ end import Base: sqrt """ -The libxmnet APIs are automatically imported from ``libmxnet.so``. The functions listed -here operate on :class:`NDArray` objects. The arguments to the functions are typically ordered +The libxmnet APIs are automatically imported from `libmxnet.so`. The functions listed +here operate on `NDArray` objects. The arguments to the functions are typically ordered as .. code-block:: julia func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) -unless ``NDARRAY_ARG_BEFORE_SCALAR`` is not set. 
In this case, the scalars are put before the input arguments: +unless `NDARRAY_ARG_BEFORE_SCALAR` is not set. In this case, the scalars are put before the input arguments: .. code-block:: julia func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) -If ``ACCEPT_EMPTY_MUTATE_TARGET`` is set. An overloaded function without the output arguments will also be defined: +If `ACCEPT_EMPTY_MUTATE_TARGET` is set. An overloaded function without the output arguments will also be defined: .. code-block:: julia @@ -952,7 +950,7 @@ If ``ACCEPT_EMPTY_MUTATE_TARGET`` is set. An overloaded function without the out Upon calling, the output arguments will be automatically initialized with empty NDArrays. Those functions always return the output arguments. If there is only one output (the typical situation), that -object (:class:`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. +object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. """ function _get_ndarray_functions() diff --git a/src/nn-factory.jl b/src/nn-factory.jl index b170214a1af9..a60a4716bfef 100644 --- a/src/nn-factory.jl +++ b/src/nn-factory.jl @@ -1,24 +1,25 @@ """ - MLP(input, spec) + MLP(input, spec; hidden_activation = :relu, prefix) Construct a multi-layer perceptron. A MLP is a multi-layer neural network with fully connected layers. -* SymbolicNode input: the input to the mlp. -* spec: the mlp specification, a list of hidden dimensions. For example, - ``[128, (512, :sigmoid), 10]``. The number in the list indicate the +# Arguments: +* `input::SymbolicNode`: the input to the mlp. +* `spec`: the mlp specification, a list of hidden dimensions. For example, + `[128, (512, :sigmoid), 10]`. The number in the list indicate the number of hidden units in each layer. A tuple could be used to specify the activation of each layer. Otherwise, the default activation will be used (except for the last layer). 
-* Base.Symbol hidden_activation: keyword argument, default ``:relu``, indicating +* `hidden_activation::Symbol`: keyword argument, default `:relu`, indicating the default activation for hidden layers. The specification here could be overwritten - by layer-wise specification in the ``spec`` argument. Also activation is not + by layer-wise specification in the `spec` argument. Also activation is not applied to the last, i.e. the prediction layer. See :func:`Activation` for a list of supported activation types. -* prefix: keyword argument, default ``gensym()``, used as the prefix to +* `prefix`: keyword argument, default `gensym()`, used as the prefix to name the constructed layers. - :return: the constructed MLP. +Returns the constructed MLP. """ function MLP(input, spec; hidden_activation::Base.Symbol=:relu, prefix=gensym()) spec = convert(Vector{Union{Int,Tuple}}, spec) From 71eefbbbc4ea20e123abf63fdfdf21b6b96cdf55 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 18 Aug 2016 21:44:27 +0900 Subject: [PATCH 374/630] Remove `` and :class: --- docs/src/user-guide/overview.md | 2 +- src/callback.jl | 8 ++--- src/context.jl | 2 +- src/executor.jl | 6 ++-- src/initializer.jl | 10 +++--- src/io.jl | 42 ++++++++++++------------- src/metric.jl | 4 +-- src/model.jl | 44 +++++++++++++------------- src/optimizer.jl | 6 ++-- src/symbolic-node.jl | 55 +++++++++++++++++---------------- src/visualize.jl | 4 +-- 11 files changed, 93 insertions(+), 90 deletions(-) diff --git a/docs/src/user-guide/overview.md b/docs/src/user-guide/overview.md index 85814cdc63fe..9a7d8e514894 100644 --- a/docs/src/user-guide/overview.md +++ b/docs/src/user-guide/overview.md @@ -59,7 +59,7 @@ The followings are common ways to create NDArray objects: - `mx.empty(shape[, context])`: create on uninitialized array of a given shape on a specific device. For example, - `` mx.empty(2,3)`, `mx.((2,3), mx.gpu(2)) ``. + `mx.empty(2,3)`, `mx.empty((2,3), mx.gpu(2))`. 
- `mx.zeros(shape[, context])` and `mx.ones(shape[, context])`: similar to the Julia's built-in `zeros` and `ones`. - `mx.copy(jl_arr, context)`: copy the contents of a Julia `Array` to diff --git a/src/callback.jl b/src/callback.jl index c3e1d299403e..6203f9f51f87 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -28,7 +28,7 @@ end """ every_n_batch(callback :: Function, n :: Int; call_on_0 = false) -A convenient function to construct a callback that runs every ``n`` mini-batches. +A convenient function to construct a callback that runs every `n` mini-batches. # Arguments * `call_on_0::Bool`: keyword argument, default false. Unless set, the callback @@ -64,7 +64,7 @@ end """ speedometer(; frequency=50) -Create an :class:`AbstractBatchCallback` that measure the training speed +Create an `AbstractBatchCallback` that measure the training speed (number of samples processed per second) every k mini-batches. # Arguments @@ -95,7 +95,7 @@ end """ every_n_epoch(callback :: Function, n :: Int; call_on_0 = false) -A convenient function to construct a callback that runs every ``n`` full data-passes. +A convenient function to construct a callback that runs every `n` full data-passes. * Int call_on_0: keyword argument, default false. Unless set, the callback will **not** be run on epoch 0. Epoch 0 means no training has been performed @@ -120,7 +120,7 @@ end """ do_checkpoint(prefix; frequency=1, save_epoch_0=false) -Create an :class:`AbstractEpochCallback` that save checkpoints of the model to disk. +Create an `AbstractEpochCallback` that save checkpoints of the model to disk. The checkpoints can be loaded back later on. # Arguments diff --git a/src/context.jl b/src/context.jl index 908d542f5ba3..410a80ca8b4c 100644 --- a/src/context.jl +++ b/src/context.jl @@ -19,7 +19,7 @@ end """ cpu(dev_id) -Get a CPU context with a specific id. ``cpu()`` is usually the default context for many +Get a CPU context with a specific id. 
`cpu()` is usually the default context for many operations when no context is specified. # Arguments diff --git a/src/executor.jl b/src/executor.jl index 0bdccc942d22..8e8bdd3bec93 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -1,7 +1,7 @@ """ Executor -An executor is a realization of a symbolic architecture defined by a :class:`SymbolicNode`. +An executor is a realization of a symbolic architecture defined by a `SymbolicNode`. The actual forward and backward computation specified by the network architecture can be carried out with an executor. """ @@ -68,12 +68,12 @@ end """ bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) -Create an :class:`Executor` by binding a :class:`SymbolicNode` to concrete :class:`NDArray`. +Create an `Executor` by binding a `SymbolicNode` to concrete `NDArray`. # Arguments * `sym::SymbolicNode`: the network architecture describing the computation graph. * `ctx::Context`: the context on which the computation should run. -* `args`: either a list of :class:`NDArray` or a dictionary of name-array pairs. Concrete +* `args`: either a list of `NDArray` or a dictionary of name-array pairs. Concrete arrays for all the inputs in the network architecture. The inputs typically include network parameters (weights, bias, filters, etc.), data and labels. See :func:`list_arguments` and :func:`infer_shape`. diff --git a/src/initializer.jl b/src/initializer.jl index 7ee9920a9d12..dacb06f349c3 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -64,7 +64,7 @@ end """ UniformInitializer(scale=0.07) -Construct a :class:`UniformInitializer` with the specified scale. +Construct a `UniformInitializer` with the specified scale. """ UniformInitializer() = UniformInitializer(0.07) @@ -84,7 +84,7 @@ end """ NormalIninitializer(; mu=0, sigma=0.01) -Construct a :class:`NormalInitializer` with mean ``mu`` and variance ``sigma``. +Construct a `NormalInitializer` with mean `mu` and variance `sigma`. 
""" NormalInitializer(; mu=0, sigma=0.01) = NormalInitializer(mu, sigma) @@ -106,9 +106,9 @@ a normal distribution with μ = 0 and σ² or a uniform distribution from -σ to Several different ways of calculating the variance are given in the literature or are used by various libraries. -* [Bengio and Glorot 2010]: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1)`` -* [K. He, X. Zhang, S. Ren, and J. Sun 2015]: ``mx.XavierInitializer(distribution = mx.xv_gaussian, regularization = mx.xv_in, magnitude = 2)`` -* caffe_avg: ``mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 3)`` +* [Bengio and Glorot 2010]: `mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1)` +* [K. He, X. Zhang, S. Ren, and J. Sun 2015]: `mx.XavierInitializer(distribution = mx.xv_gaussian, regularization = mx.xv_in, magnitude = 2)` +* caffe_avg: `mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 3)` """ @enum XavierDistribution xv_uniform xv_normal diff --git a/src/io.jl b/src/io.jl index f240388ffbda..56b463a1a6c3 100644 --- a/src/io.jl +++ b/src/io.jl @@ -25,7 +25,7 @@ The root type for all data provider. A data provider should implement the follow training stage, both *data* and *label* will be feeded into the model, while during prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and of any shapes. The provided data and label names here should match the input names in a target - :class:`SymbolicNode`. + `SymbolicNode`. A data provider should also implement the Julia iteration interface, in order to allow iterating through the data set. The provider will be called in the following way: @@ -48,7 +48,7 @@ The root type for all data provider. 
A data provider should implement the follow By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface is implemented on the provider type itself. But the extra layer of abstraction allows us to - implement a data provider easily via a Julia ``Task`` coroutine. See the + implement a data provider easily via a Julia `Task` coroutine. See the data provider defined in :doc:`the char-lstm example ` for an example of using coroutine to define data providers. @@ -58,7 +58,7 @@ The detailed interface functions for the iterator API is listed below: Base.eltype(provider) -> AbstractDataBatch :param AbstractDataProvider provider: the data provider. - :return: the specific subtype representing a data batch. See :class:`AbstractDataBatch`. + :return: the specific subtype representing a data batch. See `AbstractDataBatch`. Base.start(provider) -> AbstractDataProviderState @@ -91,7 +91,7 @@ case, you can safely assume that not be called. With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation -of the built-in :class:`MXDataProvider` for example. +of the built-in `MXDataProvider` for example. .. caution:: @@ -137,7 +137,7 @@ abstract AbstractDataProviderState :return: a vector of data in this batch, should be in the same order as declared in :func:`provide_data() `. - The last dimension of each :class:`NDArray` should always match the batch_size, even when + The last dimension of each `NDArray` should always match the batch_size, even when :func:`count_samples` returns a value less than the batch size. In this case, the data provider is free to pad the remaining contents with any value. @@ -167,7 +167,7 @@ abstract AbstractDataProviderState :type targets: Vector{Vector{SlicedNDArray}} The targets is a list of the same length as number of data provided by this provider. - Each element in the list is a list of :class:`SlicedNDArray`. 
This list described a + Each element in the list is a list of `SlicedNDArray`. This list described a spliting scheme of this data batch into different slices, each slice is specified by a slice-ndarray pair, where *slice* specify the range of samples in the mini-batch that should be loaded into the corresponding *ndarray*. @@ -189,7 +189,7 @@ abstract AbstractDataBatch """ DataBatch - A basic subclass of :class:`AbstractDataBatch`, that implement the interface by + A basic subclass of `AbstractDataBatch`, that implement the interface by accessing member fields. """ type DataBatch <: AbstractDataBatch @@ -204,7 +204,7 @@ get_label{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batc """ SlicedNDArray - A alias type of ``Tuple{UnitRange{Int},NDArray}``. + A alias type of `Tuple{UnitRange{Int},NDArray}`. """ typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} @@ -257,7 +257,7 @@ eachbatch(provider :: AbstractDataProvider) = provider """ ArrayDataProvider - A convenient tool to iterate :class:`NDArray` or Julia ``Array``. + A convenient tool to iterate `NDArray` or Julia `Array`. """ type ArrayDataProvider <: AbstractDataProvider data_arrays :: Vector{Array{MX_float}} @@ -277,16 +277,16 @@ end """ ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) - Construct a data provider from :class:`NDArray` or Julia Arrays. + Construct a data provider from `NDArray` or Julia Arrays. :param data: the data, could be - - a :class:`NDArray`, or a Julia Array. This is equivalent to ``:data => data``. - - a name-data pair, like ``:mydata => array``, where ``:mydata`` is the name of the data - and ``array`` is an :class:`NDArray` or a Julia Array. + - a `NDArray`, or a Julia Array. This is equivalent to `:data => data`. + - a name-data pair, like `:mydata => array`, where `:mydata` is the name of the data + and `array` is an `NDArray` or a Julia Array. - a list of name-data pairs. - :param label: the same as the ``data`` parameter. 
When this argument is omitted, the constructed + :param label: the same as the `data` parameter. When this argument is omitted, the constructed provider will provide no labels. :param Int batch_size: the batch size, default is 0, which means treating the whole array as a single mini-batch. @@ -294,9 +294,9 @@ end :param Real data_padding: when the mini-batch goes beyond the dataset boundary, there might be less samples to include than a mini-batch. This value specify a scalar to pad the contents of all the missing data points. - :param Real label_padding: the same as ``data_padding``, except for the labels. + :param Real label_padding: the same as `data_padding`, except for the labels. - TODO: remove ``data_padding`` and ``label_padding``, and implement rollover that copies + TODO: remove `data_padding` and `label_padding`, and implement rollover that copies the last or first several training samples to feed the padding. """ # Julia's type system is sometimes very frustrating. You cannot specify a function @@ -563,16 +563,16 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) if gen_docs if endswith(string(iter_name), "Iter") - f_desc = "Can also be called with the alias ``$(string(iter_name)[1:end-4] * "Provider")``.\n" + f_desc = "Can also be called with the alias `$(string(iter_name)[1:end-4] * "Provider")`.\n" else f_desc = "" end f_desc *= unsafe_string(ref_desc[]) * "\n\n" - f_desc *= ":param Base.Symbol data_name: keyword argument, default ``:data``. The name of the data.\n" - f_desc *= ":param Base.Symbol label_name: keyword argument, default ``:softmax_label``. " * - "The name of the label. Could be ``nothing`` if no label is presented in this dataset.\n\n" + f_desc *= ":param Base.Symbol data_name: keyword argument, default `:data`. The name of the data.\n" + f_desc *= ":param Base.Symbol label_name: keyword argument, default `:softmax_label`. " * + "The name of the label. 
Could be `nothing` if no label is presented in this dataset.\n\n" f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":return: the constructed :class:`MXDataProvider`." + f_desc *= ":return: the constructed `MXDataProvider`." return (iter_name, f_desc) end diff --git a/src/metric.jl b/src/metric.jl index 21d5e4e34b14..aea8a0af628e 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -22,8 +22,8 @@ interfaces. Get the accumulated metrics. - :return: ``Vector{Tuple{Base.Symbol, Real}}``, a list of name-value pairs. For - example, ``[(:accuracy, 0.9)]``. + :return: `Vector{Tuple{Base.Symbol, Real}}`, a list of name-value pairs. For + example, `[(:accuracy, 0.9)]`. """ abstract AbstractEvalMetric diff --git a/src/model.jl b/src/model.jl index f47d49d1a82d..d6752e24ebd3 100644 --- a/src/model.jl +++ b/src/model.jl @@ -48,9 +48,9 @@ end FeedForward(arch :: SymbolicNode, ctx) * arch: the architecture of the network constructed using the symbolic API. -* ctx: the devices on which this model should do computation. It could be a single :class:`Context` - or a list of :class:`Context` objects. In the latter case, data parallelization will be used - for training. If no context is provided, the default context ``cpu()`` will be used. +* ctx: the devices on which this model should do computation. It could be a single `Context` + or a list of `Context` objects. In the latter case, data parallelization will be used + for training. If no context is provided, the default context `cpu()` will be used. """ function FeedForward(arch :: SymbolicNode; context :: Union{Context, Vector{Context}, Void} = nothing) if isa(context, Void) @@ -74,7 +74,7 @@ end * AbstractInitializer initializer: an initializer describing how the weights should be initialized. * Bool overwrite: keyword argument, force initialization even when weights already exists. * input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. 
- For example, ``data=(28,28,1,100), label=(100,)``. + For example, `data=(28,28,1,100), label=(100,)`. """ function init_model(self :: FeedForward, initializer :: AbstractInitializer; overwrite::Bool=false, input_shapes...) # all arg names, including data, label, and parameters @@ -177,12 +177,12 @@ end * FeedForward self: the model. * AbstractDataProvider data: the data to perform prediction on. -* Bool overwrite: an :class:`Executor` is initialized the first time predict is called. The memory - allocation of the :class:`Executor` depends on the mini-batch size of the test +* Bool overwrite: an `Executor` is initialized the first time predict is called. The memory + allocation of the `Executor` depends on the mini-batch size of the test data provider. If you call predict twice with data provider of the same batch-size, - then the executor can be potentially be re-used. So, if ``overwrite`` is false, - we will try to re-use, and raise an error if batch-size changed. If ``overwrite`` - is true (the default), a new :class:`Executor` will be created to replace the old one. + then the executor can be potentially be re-used. So, if `overwrite` is false, + we will try to re-use, and raise an error if batch-size changed. If `overwrite` + is true (the default), a new `Executor` will be created to replace the old one. .. note:: @@ -196,9 +196,9 @@ end .. note:: - If you perform further after prediction. The weights are not automatically synchronized if ``overwrite`` + If you perform further after prediction. The weights are not automatically synchronized if `overwrite` is set to false and the old predictor is re-used. In this case - setting ``overwrite`` to true (the default) will re-initialize the predictor the next time you call + setting `overwrite` to true (the default) will re-initialize the predictor the next time you call predict and synchronize the weights again. 
:seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` @@ -319,28 +319,28 @@ end """ fit(model :: FeedForward, optimizer, data; kwargs...) -Train the ``model`` on ``data`` with the ``optimizer``. +Train the `model` on `data` with the `optimizer`. * FeedForward model: the model to be trained. * AbstractOptimizer optimizer: the optimization algorithm to use. * AbstractDataProvider data: the training data provider. * Int n_epoch: default 10, the number of full data-passes to run. -* AbstractDataProvider eval_data: keyword argument, default ``nothing``. The data provider for +* AbstractDataProvider eval_data: keyword argument, default `nothing`. The data provider for the validation set. -* AbstractEvalMetric eval_metric: keyword argument, default ``Accuracy()``. The metric used - to evaluate the training performance. If ``eval_data`` is provided, the same metric is also +* AbstractEvalMetric eval_metric: keyword argument, default `Accuracy()`. The metric used + to evaluate the training performance. If `eval_data` is provided, the same metric is also calculated on the validation set. -* kvstore: keyword argument, default ``:local``. The key-value store used to synchronize gradients +* kvstore: keyword argument, default `:local`. The key-value store used to synchronize gradients and parameters when multiple devices are used for training. - :type kvstore: :class:`KVStore` or ``Base.Symbol`` -* AbstractInitializer initializer: keyword argument, default ``UniformInitializer(0.01)``. + :type kvstore: `KVStore` or `Base.Symbol` +* AbstractInitializer initializer: keyword argument, default `UniformInitializer(0.01)`. * Bool force_init: keyword argument, default false. 
By default, the random initialization using the - provided ``initializer`` will be skipped if the model weights already exists, maybe from a previous + provided `initializer` will be skipped if the model weights already exists, maybe from a previous call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When this option is set, it will always do random initialization at the begining of training. -* callbacks: keyword argument, default ``[]``. Callbacks to be invoked at each epoch or mini-batch, - see :class:`AbstractCallback`. - :type callbacks: ``Vector{AbstractCallback}`` +* callbacks: keyword argument, default `[]`. Callbacks to be invoked at each epoch or mini-batch, + see `AbstractCallback`. + :type callbacks: `Vector{AbstractCallback}` """ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) opts = TrainingOptions(; kwargs...) diff --git a/src/optimizer.jl b/src/optimizer.jl index e2fc44338a2f..c5d4b29aa308 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -85,7 +85,7 @@ get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rat LearningRate.Exp :math:`\eta_t = \eta_0\gamma^t`. Here :math:`t` is the epoch count, or the iteration - count if ``decay_on_iteration`` is set to true. + count if `decay_on_iteration` is set to true. """ type Exp <: AbstractLearningRateScheduler learning_rate :: Float64 @@ -102,7 +102,7 @@ get_learning_rate(self :: Exp, state :: OptimizationState) = LearningRate.Inv :math:`\eta_t = \eta_0 * (1 + \gamma * t)^(-power)`. - Here :math:`t` is the epoch count, or the iteration count if ``decay_on_iteration`` + Here :math:`t` is the epoch count, or the iteration count if `decay_on_iteration` is set to true. 
""" type Inv <: AbstractLearningRateScheduler @@ -207,7 +207,7 @@ abstract AbstractOptimizerOptions normalized_gradient(opts, state, grad) * AbstractOptimizerOptions opts: options for the optimizer, should contain the field - ``grad_scale``, ``grad_clip`` and ``weight_decay``. + `grad_scale`, `grad_clip` and `weight_decay`. * OptimizationState state: the current optimization state. * NDArray weight: the trainable weights. * NDArray grad: the original gradient of the weights. diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 600bc75b3aeb..b71733ace71b 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -37,7 +37,7 @@ end call(self :: SymbolicNode, args :: SymbolicNode...) call(self :: SymbolicNode; kwargs...) -Make a new node by composing ``self`` with ``args``. Or the arguments +Make a new node by composing `self` with `args`. Or the arguments can be specified using keyword arguments. """ @compat function (self::SymbolicNode)(args :: SymbolicNode...) @@ -66,11 +66,11 @@ end list_arguments(self :: SymbolicNode) List all the arguments of this node. The argument for a node contains both -the inputs and parameters. For example, a :class:`FullyConnected` node will +the inputs and parameters. For example, a `FullyConnected` node will have both data and weights in its arguments. A composed node (e.g. a MLP) will list all the arguments for intermediate nodes. - :return: A list of symbols indicating the names of the arguments. +Returns a list of symbols indicating the names of the arguments. """ function list_arguments(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListArguments) @@ -81,7 +81,7 @@ end List all the outputs of this node. - :return: A list of symbols indicating the names of the outputs. +Returns a list of symbols indicating the names of the outputs. """ function list_outputs(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListOutputs) @@ -99,7 +99,7 @@ and do not have gradient. 
But still be useful for the specific operations. A common example of auxiliary state is the moving_mean and moving_variance in BatchNorm. Most operators do not have Auxiliary states. - :return: A list of symbols indicating the names of the auxiliary states. +Returns a list of symbols indicating the names of the auxiliary states. """ function list_auxiliary_states(self :: SymbolicNode) @_list_symbol_info(self, :MXSymbolListAuxiliaryStates) @@ -108,8 +108,8 @@ end """ get_internals(self :: SymbolicNode) -Get a new grouped :class:`SymbolicNode` whose output contains all the internal outputs of -this :class:`SymbolicNode`. +Get a new grouped `SymbolicNode` whose output contains all the internal outputs of +this `SymbolicNode`. """ function get_internals(self :: SymbolicNode) ref_hdr = Ref{MX_handle}(0) @@ -120,8 +120,9 @@ end """ get_attr(self :: SymbolicNode, key :: Symbol) -Get attribute attached to this :class:`SymbolicNode` belonging to key. -:return: The value belonging to key as a :class:`Nullable`. +Get attribute attached to this `SymbolicNode` belonging to key. + +Returns the value belonging to key as a `Nullable`. """ function get_attr(self :: SymbolicNode, key :: Symbol) key_s = string(key) @@ -140,7 +141,8 @@ end list_attr(self :: SymbolicNode) Get all attributes from a symbol. -:return: Dictionary of attributes. + +Returns a dictionary of attributes. """ function list_attr(self :: SymbolicNode) ref_sz = Ref{MX_uint}(0) @@ -162,7 +164,8 @@ end list_all_attr(self :: SymbolicNode) Get all attributes from the symbol graph. -:return: Dictionary of attributes. + +Returns a dictionary of attributes. """ function list_all_attr(self :: SymbolicNode) ref_sz = Ref{MX_uint}(0) @@ -183,12 +186,12 @@ end """ set_attr(self:: SymbolicNode, key :: Symbol, value :: AbstractString) -Set the attribute key to value for this :class:`SymbolicNode`. +Set the attribute key to value for this `SymbolicNode`. 
# Warning It is encouraged not to call this function directly, unless you know exactly what you are doing. The -recommended way of setting attributes is when creating the :class:`SymbolicNode`. Changing -the attributes of a :class:`SymbolicNode` that is already been used somewhere else might +recommended way of setting attributes is when creating the `SymbolicNode`. Changing +the attributes of a `SymbolicNode` that is already been used somewhere else might cause unexpected behavior and inconsistency. """ function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) @@ -205,7 +208,7 @@ Create a symbolic variable with the given name. This is typically used as a plac For example, the data node, acting as the starting point of a network architecture. # Arguments -* Dict{Symbol, AbstractString} attrs: The attributes associated with this :class:`Variable`. +* Dict{Symbol, AbstractString} attrs: The attributes associated with this `Variable`. """ function Variable(name :: Union{Symbol, AbstractString}; attrs = Dict()) attrs = convert(Dict{Symbol, AbstractString}, attrs) @@ -221,7 +224,7 @@ end """ Group(nodes :: SymbolicNode...) -Create a :class:`SymbolicNode` by grouping nodes together. +Create a `SymbolicNode` by grouping nodes together. """ function Group(nodes :: SymbolicNode...) handles = MX_handle[nodes...] @@ -283,9 +286,9 @@ as a list of shapes, which should specify the shapes of inputs in the same order the arguments returned by :func:`list_arguments`. Alternatively, the shape information could be specified via keyword arguments. -:return: A 3-tuple containing shapes of all the arguments, shapes of all the outputs and - shapes of all the auxiliary variables. If shape inference failed due to incomplete - or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. +Returns a 3-tuple containing shapes of all the arguments, shapes of all the outputs and +shapes of all the auxiliary variables. 
If shape inference failed due to incomplete +or incompatible inputs, the return value will be `(nothing, nothing, nothing)`. """ function infer_shape(self :: SymbolicNode; kwargs...) sdata = MX_uint[] @@ -351,9 +354,9 @@ as a list of types, which should specify the types of inputs in the same order a the arguments returned by :func:`list_arguments`. Alternatively, the type information could be specified via keyword arguments. -:return: A 3-tuple containing types of all the arguments, types of all the outputs and - types of all the auxiliary variables. If type inference failed due to incomplete - or incompatible inputs, the return value will be ``(nothing, nothing, nothing)``. +Returns a 3-tuple containing types of all the arguments, types of all the outputs and +types of all the auxiliary variables. If type inference failed due to incomplete +or incompatible inputs, the return value will be `(nothing, nothing, nothing)`. """ function infer_type(self :: SymbolicNode; kwargs...) types = Cint[toTypeFlag(x[2]) for x in kwargs] @@ -524,7 +527,7 @@ end """ to_json(self :: SymbolicNode) -Convert a :class:`SymbolicNode` into a JSON string. +Convert a `SymbolicNode` into a JSON string. """ function to_json(self :: SymbolicNode) ref_json = Ref{char_p}(0) @@ -535,7 +538,7 @@ end """ from_json(repr :: AbstractString, ::Type{SymbolicNode}) -Load a :class:`SymbolicNode` from a JSON string representation. +Load a `SymbolicNode` from a JSON string representation. """ function from_json(repr :: AbstractString, ::Type{SymbolicNode}) ref_hdr = Ref{MX_handle}(0) @@ -546,7 +549,7 @@ end """ load(filename :: AbstractString, ::Type{SymbolicNode}) -Load a :class:`SymbolicNode` from a JSON file. +Load a `SymbolicNode` from a JSON file. """ function load(filename :: AbstractString, ::Type{SymbolicNode}) ref_hdr = Ref{MX_handle}(0) @@ -557,7 +560,7 @@ end """ save(filename :: AbstractString, node :: SymbolicNode) -Save a :class:`SymbolicNode` to a JSON file. 
+Save a `SymbolicNode` to a JSON file. """ function save(filename :: AbstractString, node :: SymbolicNode) @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), node, filename) diff --git a/src/visualize.jl b/src/visualize.jl index 15f23c6bfffc..c60868430a9c 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -6,10 +6,10 @@ import JSON * SymbolicNode network: the network to visualize. * AbstractString title: keyword argument, default "Network Visualization", the title of the GraphViz graph. -* input_shapes: keyword argument, default ``nothing``. If provided, +* input_shapes: keyword argument, default `nothing`. If provided, will run shape inference and plot with the shape information. Should be either a dictionary of name-shape mapping or an array of shapes. - :return: the graph description in GraphViz ``dot`` language. + :return: the graph description in GraphViz `dot` language. """ function to_graphviz(network :: SymbolicNode; title="Network Visualization", input_shapes=nothing) if !isa(input_shapes, Void) From 221611ae19cbf5a4bec4c1832853a02b4cc62176 Mon Sep 17 00:00:00 2001 From: Ranjan Anantharaman Date: Sun, 21 Aug 2016 18:10:11 +0530 Subject: [PATCH 375/630] Get rid of sub depwarn --- src/metric.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index aea8a0af628e..dc00bdafb267 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -69,7 +69,7 @@ function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDA for j in 1:size(labels, 2) for i in 1:size(labels, 1) label = labels[i, j, 1, sample] - klasses = sub(pred, i, j, :, sample) + klasses = view(pred, i, j, :, sample) klass = indmax(klasses) - 1 # Classes start at 0...k-1 metric.acc_sum += klass == label @@ -79,7 +79,7 @@ function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDA end elseif ndims(pred) == 2 # 1-dimensional case for sample in 1:size(label, 1) - klass = indmax(sub(pred, :, sample)) - 1 + klass = 
indmax(view(pred, :, sample)) - 1 metric.acc_sum += klass == label[sample] metric.n_sample += 1 end From e672e427b6a696b594cf17fafa280e60d56f6aee Mon Sep 17 00:00:00 2001 From: Ranjan Anantharaman Date: Sun, 21 Aug 2016 18:11:06 +0530 Subject: [PATCH 376/630] import Compat.view --- src/MXNet.jl | 1 + 1 file changed, 1 insertion(+) diff --git a/src/MXNet.jl b/src/MXNet.jl index c447617e7fbf..b9de52a58bf8 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -9,6 +9,7 @@ module mx using Compat import Compat.String +import Compat.view using Formatting From 08ba2d13d6cd45bb77be9149c6fb730a4a3a19b4 Mon Sep 17 00:00:00 2001 From: Ranjan Anantharaman Date: Sun, 21 Aug 2016 18:11:48 +0530 Subject: [PATCH 377/630] Update REQUIRE with min version of Compat --- REQUIRE | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/REQUIRE b/REQUIRE index d97c567e15db..6fbfb73bd328 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,5 +1,5 @@ julia 0.4+ -Compat +Compat 0.8.4 Formatting BinDeps JSON From e3b793544d1d48486aa9a3d67d4c1d6c76335894 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 23 Aug 2016 04:32:37 +0900 Subject: [PATCH 378/630] reorder docs for io.jl and bring them into the markdown age --- docs/src/api/io.md | 111 ++++++++++++ src/base.jl | 2 +- src/io.jl | 413 ++++++++++++++++++++++----------------------- src/ndarray.jl | 2 +- 4 files changed, 312 insertions(+), 216 deletions(-) diff --git a/docs/src/api/io.md b/docs/src/api/io.md index 32a7d14f9144..fe5fd2f46e2b 100644 --- a/docs/src/api/io.md +++ b/docs/src/api/io.md @@ -3,6 +3,117 @@ Data providers are wrappers that load external data, be it images, text, or general tensors, and split it into mini-batches so that the model can consume the data in a uniformed way. 
+## AbstractDataProvider interface + +```@docs +mx.AbstractDataProvider +``` + +The difference between *data* and *label* is that during training stage, +both *data* and *label* will be fed into the model, while during +prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and +of any shapes. The provided data and label names here should match the input names in a target +`SymbolicNode`. + +A data provider should also implement the Julia iteration interface, in order to allow iterating +through the data set. The provider will be called in the following way: + +```julia +for batch in eachbatch(provider) + data = get_data(provider, batch) +end +``` + +which will be translated by the Julia compiler into + +```julia +state = Base.start(eachbatch(provider)) +while !Base.done(provider, state) + (batch, state) = Base.next(provider, state) + data = get_data(provider, batch) +end +``` + +By default, `eachbatch` simply returns the provider itself, so the iterator interface +is implemented on the provider type itself. But the extra layer of abstraction allows us to +implement a data provider easily via a Julia `Task` coroutine. See the +data provider defined in [the char-lstm example](tutorial/char-lstm) for an example of using coroutine to define data +providers. + +The detailed interface functions for the iterator API are listed below: + + Base.eltype(provider) -> AbstractDataBatch + +Returns the specific subtype representing a data batch. See `AbstractDataBatch`. +* `provider::AbstractDataProvider`: the data provider. + + Base.start(provider) -> AbstractDataProviderState + +This function is always called before iterating into the dataset. It should initialize +the iterator, reset the index, and do data shuffling if needed. +* `provider::AbstractDataProvider`: the data provider. + + Base.done(provider, state) -> Bool + +True if there is no more data to iterate in this dataset. +* `provider::AbstractDataProvider`: the data provider. 
+* `state::AbstractDataProviderState`: the state returned by `Base.start` and `Base.next`. + + Base.next(provider, state) -> (AbstractDataBatch, AbstractDataProviderState) + +Returns the current data batch, and the state for the next iteration. +* `provider::AbstractDataProvider`: the data provider. + +Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that +is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this +case, you can safely assume that + +* `Base.start` will always be called, and called only once before the iteration starts. +* `Base.done` will always be called at the beginning of every iteration and always be called once. +* If `Base.done` returns true, the iteration will stop, until the next round, again, starting with + a call to `Base.start`. +* `Base.next` will always be called only once in each iteration. It will always be called after + one and only one call to `Base.done`; but if `Base.done` returns true, `Base.next` will + not be called. + +With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation +of the built-in `MXDataProvider` for example. + +### Note: +Please do not use the same data provider simultaneously in two different places, either in parallel, +or in a nested loop. For example, the behavior for the following code is undefined + +```julia +for batch in data + # updating the parameters + + # now let's test the performance on the training set + for b2 in data + # ... + end +end +``` + +```@docs +mx.get_batch_size +mx.provide_data +mx.provide_label +``` + +## AbstractDataBatch interface + +```@docs +mx.AbstractDataProviderState +mx.count_samples +mx.get_data +mx.get_label +mx.get +mx.load_data! +mx.load_label! 
+``` + +## Implemented providers and other methods + ```@autodocs Modules = [MXNet.mx] Pages = ["io.jl"] diff --git a/src/base.jl b/src/base.jl index d35a1bec3818..cca45c273b96 100644 --- a/src/base.jl +++ b/src/base.jl @@ -30,7 +30,7 @@ end function __init__() _populate_symbol_creator_cache!() - _import_io_iterators() + _populate_iter_creator_cache!() atexit() do # notify libmxnet we are shutting down diff --git a/src/io.jl b/src/io.jl index 56b463a1a6c3..1878125f15fd 100644 --- a/src/io.jl +++ b/src/io.jl @@ -3,113 +3,50 @@ The root type for all data provider. A data provider should implement the following interfaces: - get_batch_size(provider) -> Int +* [`get_batch_size`](@ref) +* [`provide_data`](@ref) +* [`provide_label`](@ref) - :param AbstractDataProvider provider: the data provider. - :return: the mini-batch size of the provided data. All the provided data should have the - same mini-batch size (i.e. the last dimension). +As well as the Julia iterator interface (see [the Julia manual](http://docs.julialang.org/en/stable/manual/interfaces/)). +Normally this involves defining: - provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} - - :param AbstractDataProvider provider: the data provider. - :return: a vector of (name, shape) pairs describing the names of the data it provides, and - the corresponding shapes. - - provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} - - :param AbstractDataProvider provider: the data provider. - :return: a vector of (name, shape) pairs describing the names of the labels it provides, and - the corresponding shapes. - - The difference between *data* and *label* is that during - training stage, both *data* and *label* will be feeded into the model, while during - prediction stage, only *data* is loaded. Otherwise, they could be anything, with any names, and - of any shapes. The provided data and label names here should match the input names in a target - `SymbolicNode`. 
- - A data provider should also implement the Julia iteration interface, in order to allow iterating - through the data set. The provider will be called in the following way: - - .. code-block:: julia - - for batch in eachbatch(provider) - data = get_data(provider, batch) - end - - which will be translated by Julia compiler into - - .. code-block:: julia - - state = Base.start(eachbatch(provider)) - while !Base.done(provider, state) - (batch, state) = Base.next(provider, state) - data = get_data(provider, batch) - end - - By default, :func:`eachbatch` simply returns the provider itself, so the iterator interface - is implemented on the provider type itself. But the extra layer of abstraction allows us to - implement a data provider easily via a Julia `Task` coroutine. See the - data provider defined in :doc:`the char-lstm example - ` for an example of using coroutine to define data - providers. - -The detailed interface functions for the iterator API is listed below: - - Base.eltype(provider) -> AbstractDataBatch - - :param AbstractDataProvider provider: the data provider. - :return: the specific subtype representing a data batch. See `AbstractDataBatch`. - - Base.start(provider) -> AbstractDataProviderState - - :param AbstractDataProvider provider: the data provider. - - This function is always called before iterating into the dataset. It should initialize - the iterator, reset the index, and do data shuffling if needed. - - Base.done(provider, state) -> Bool - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataProviderState state: the state returned by :func:`Base.start` :func:`Base.next`. - :return: true if there is no more data to iterate in this dataset. 
+* `Base.eltype(provider) -> AbstractDataBatch` +* `Base.start(provider) -> AbstractDataProviderState` +* `Base.done(provider, state) -> Bool` +* `Base.next(provider, state) -> (AbstractDataBatch, AbstractDataProviderState)` +""" +abstract AbstractDataProvider - Base.next(provider) -> (AbstractDataBatch, AbstractDataProviderState) +""" + get_batch_size(provider) -> Int - :param AbstractDataProvider provider: the data provider. - :return: the current data batch, and the state for the next iteration. +# Arguments: +* `provider::AbstractDataProvider`: the data provider. -Note sometimes you are wrapping an existing data iterator (e.g. the built-in libmxnet data iterator) that -is built with a different convention. It might be difficult to adapt to the interfaces stated here. In this -case, you can safely assume that +Returns the mini-batch size of the provided data. All the provided data should have the same mini-batch size (i.e. the last dimension). +""" +function get_batch_size end -* :func:`Base.start` will always be called, and called only once before the iteration starts. -* :func:`Base.done` will always be called at the beginning of every iteration and always be called once. -* If :func:`Base.done` return true, the iteration will stop, until the next round, again, starting with - a call to :func:`Base.start`. -* :func:`Base.next` will always be called only once in each iteration. It will always be called after - one and only one call to :func:`Base.done`; but if :func:`Base.done` returns true, :func:`Base.next` will - not be called. +""" + provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} -With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation -of the built-in `MXDataProvider` for example. +# Arguments: +* `provider::AbstractDataProvider`: the data provider. -.. caution:: +Returns a vector of (name, shape) pairs describing the names of the data it provides, and the corresponding shapes. 
- Please do not use the one data provider simultaneously in two different places, either in parallel, - or in a nested loop. For example, the behavior for the following code is undefined +""" +function provide_data end - .. code-block:: julia +""" + provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} - for batch in data - # updating the parameters +# Arguments: +* `provider::AbstractDataProvider`: the data provider. - # now let's test the performance on the training set - for b2 in data - # ... - end - end +Returns a vector of (name, shape) pairs describing the names of the labels it provides, and the corresponding shapes. """ -abstract AbstractDataProvider +function provide_label end """ AbstractDataProviderState @@ -123,74 +60,58 @@ abstract AbstractDataProviderState Base type for a data mini-batch. It should implement the following interfaces: - count_samples(provider, batch) -> Int +* [`count_samples`](@ref) +* [`get_data`](@ref) +* [`get_label`](@ref) - :param AbstractDataBatch batch: the data batch object. - :return: the number of samples in this batch. This number should be greater than 0, but - less than or equal to the batch size. This is used to indicate at the end of - the data set, there might not be enough samples for a whole mini-batch. +The following utility functions will be automatically defined: - get_data(provider, batch) -> Vector{NDArray} - - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :return: a vector of data in this batch, should be in the same order as declared in - :func:`provide_data() `. - - The last dimension of each `NDArray` should always match the batch_size, even when - :func:`count_samples` returns a value less than the batch size. In this case, - the data provider is free to pad the remaining contents with any value. - - get_label(provider, batch) -> Vector{NDArray} - - :param AbstractDataProvider provider: the data provider. 
- :param AbstractDataBatch batch: the data batch object. - :return: a vector of labels in this batch. Similar to :func:`get_data`. +* [`get`](@ref) +* [`load_data!`](@ref) +* [`load_label!`](@ref) +""" +abstract AbstractDataBatch +""" + count_samples(provider, batch) -> Int - The following utility functions will be automatically defined. +# Arguments: +* `batch::AbstractDataBatch`: the data batch object. - get(provider, batch, name) -> NDArray +Returns the number of samples in this batch. This number should be greater than 0, but less than or equal to the batch size. This is used to indicate at the end of the data set, there might not be enough samples for a whole mini-batch. - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :param Base.Symbol name: the name of the data to get, should be one of the names - provided in either :func:`provide_data() ` - or :func:`provide_label() `. - :return: the corresponding data array corresponding to that name. +""" +function count_samples end - load_data!(provider, batch, targets) +""" + get_data(provider, batch) -> Vector{NDArray} - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :param targets: the targets to load data into. - :type targets: Vector{Vector{SlicedNDArray}} +# Arguments: +* `provider::AbstractDataProvider`: the data provider. +* `batch::AbstractDataBatch`: the data batch object. - The targets is a list of the same length as number of data provided by this provider. - Each element in the list is a list of `SlicedNDArray`. This list described a - spliting scheme of this data batch into different slices, each slice is specified by - a slice-ndarray pair, where *slice* specify the range of samples in the mini-batch - that should be loaded into the corresponding *ndarray*. +Returns a vector of data in this batch, should be in the same order as declared in `provide_data() `. 
- This utility function is used in data parallelization, where a mini-batch is splited - and computed on several different devices. +The last dimension of each `NDArray` should always match the batch_size, even when `count_samples` returns a value less than the batch size. In this case, the data provider is free to pad the remaining contents with any value. +""" +function get_data end - load_label!(provider, batch, targets) +""" + get_label(provider, batch) -> Vector{NDArray} - :param AbstractDataProvider provider: the data provider. - :param AbstractDataBatch batch: the data batch object. - :param targets: the targets to load label into. - :type targets: Vector{Vector{SlicedNDArray}} +# Arguments: +* `provider::AbstractDataProvider`: the data provider. +* `batch::AbstractDataBatch`: the data batch object. - The same as :func:`load_data!`, except that this is for loading labels. +Returns a vector of labels in this batch. Similar to [`get_data`](@ref). """ -abstract AbstractDataBatch +function get_label end """ DataBatch - A basic subclass of `AbstractDataBatch`, that implement the interface by - accessing member fields. +A basic subclass of `AbstractDataBatch`, that implement the interface by +accessing member fields. """ type DataBatch <: AbstractDataBatch data :: Vector{NDArray} @@ -204,7 +125,7 @@ get_label{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batc """ SlicedNDArray - A alias type of `Tuple{UnitRange{Int},NDArray}`. +A alias type of `Tuple{UnitRange{Int},NDArray}`. """ typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} @@ -217,10 +138,38 @@ function _load_general!(provider :: AbstractDataProvider, batch :: AbstractDataB end end end + +""" + load_data!(provider, batch, targets) + +# Arguments: +* `provider::AbstractDataProvider`: the data provider. +* `batch::AbstractDataBatch`: the data batch object. +* `targets::Vector{Vector{SlicedNDArray}}`: the targets to load data into. 
+ +The targets is a list of the same length as number of data provided by this provider. +Each element in the list is a list of `SlicedNDArray`. This list describes a +splitting scheme of this data batch into different slices, each slice is specified by +a slice-ndarray pair, where *slice* specifies the range of samples in the mini-batch +that should be loaded into the corresponding *ndarray*. + +This utility function is used in data parallelization, where a mini-batch is split +and computed on several different devices. +""" function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) _load_general!(provider, batch, targets, get_data) end + +""" + load_label!(provider, batch, targets) + +* `provider::AbstractDataProvider`: the data provider. +* `batch::AbstractDataBatch`: the data batch object. +* `targets::Vector{Vector{SlicedNDArray}}`: the targets to load label into. + +The same as [`load_data!`](@ref), except that this is for loading labels. +""" function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}) _load_general!(provider, batch, targets, get_label) @@ -238,6 +187,17 @@ function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatc end import Base.get +""" + get(provider, batch, name) -> NDArray + +* `provider::AbstractDataProvider`: the data provider. +* `batch::AbstractDataBatch`: the data batch object. +* `name::Symbol`: the name of the data to get, should be one of the names + provided in either `provide_data() ` + or `provide_label() `. + +Returns the data array corresponding to that name. 
+""" function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name :: Base.Symbol) for (idx, (k, s)) in enumerate(provide_data(provider)) if name == k @@ -257,7 +217,29 @@ eachbatch(provider :: AbstractDataProvider) = provider """ ArrayDataProvider - A convenient tool to iterate `NDArray` or Julia `Array`. +A convenient tool to iterate `NDArray` or Julia `Array`. + + ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) + +Construct a data provider from `NDArray` or Julia Arrays. + +# Arguments: +* `data`: the data, could be + * a `NDArray`, or a Julia Array. This is equivalent to `:data => data`. + * a name-data pair, like `:mydata => array`, where `:mydata` is the name of the data + * and `array` is an `NDArray` or a Julia Array. + * a list of name-data pairs. + +* `label`: the same as the `data` parameter. When this argument is omitted, the constructed provider will provide no labels. +* `batch_size::Int`: the batch size, default is 0, which means treating the whole array as a single mini-batch. +* `shuffle::Bool`: turn on if the data should be shuffled at every epoch. +* `data_padding::Real`: when the mini-batch goes beyond the dataset boundary, there might + be less samples to include than a mini-batch. This value specify a scalar to pad the + contents of all the missing data points. +* `label_padding::Real`: the same as `data_padding`, except for the labels. + +TODO: remove `data_padding` and `label_padding`, and implement rollover that copies +the last or first several training samples to feed the padding. """ type ArrayDataProvider <: AbstractDataProvider data_arrays :: Vector{Array{MX_float}} @@ -274,31 +256,6 @@ type ArrayDataProvider <: AbstractDataProvider label_batch :: Vector{NDArray} end -""" - ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) - - Construct a data provider from `NDArray` or Julia Arrays. 
- - :param data: the data, could be - - - a `NDArray`, or a Julia Array. This is equivalent to `:data => data`. - - a name-data pair, like `:mydata => array`, where `:mydata` is the name of the data - and `array` is an `NDArray` or a Julia Array. - - a list of name-data pairs. - - :param label: the same as the `data` parameter. When this argument is omitted, the constructed - provider will provide no labels. - :param Int batch_size: the batch size, default is 0, which means treating the whole array as a - single mini-batch. - :param Bool shuffle: turn on if the data should be shuffled at every epoch. - :param Real data_padding: when the mini-batch goes beyond the dataset boundary, there might - be less samples to include than a mini-batch. This value specify a scalar to pad the - contents of all the missing data points. - :param Real label_padding: the same as `data_padding`, except for the labels. - - TODO: remove `data_padding` and `label_padding`, and implement rollover that copies - the last or first several training samples to feed the padding. -""" # Julia's type system is sometimes very frustrating. 
You cannot specify a function # with argument Vector{Pair} to expect to be matched when calling with the parameter # [:foo => zeros(2,3), :bar => zeros(3)] because the type inference gives very specific @@ -387,9 +344,11 @@ end function provide_data(provider::ArrayDataProvider) return collect(zip(provider.data_names, map(size, provider.data_batch))) end + function provide_label(provider::ArrayDataProvider) return collect(zip(provider.label_names, map(size, provider.label_batch))) end + get_batch_size(provider::ArrayDataProvider) = provider.batch_size immutable ArrayDataProviderState <: AbstractDataProviderState @@ -547,7 +506,42 @@ function count_samples(provider :: MXDataProvider, batch :: MXDataBatch) return provider.batch_size - Int(ref_pad[]) end -function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) +function _get_iter_creators() + n_ref = Ref{MX_uint}(0) + h_ref = Ref{Ptr{MX_handle}}(0) + @mxcall(:MXListDataIters, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) + + return unsafe_wrap(Array, h_ref[], n_ref[]) +end + +function _get_iter_name(hdr :: MX_handle) + ref_name = Ref{char_p}(0) + ref_desc = Ref{char_p}(0) + ref_narg = Ref{MX_uint}(0) + ref_arg_names = Ref{char_pp}(0) + ref_arg_types = Ref{char_pp}(0) + ref_arg_descs = Ref{char_pp}(0) + + @mxcall(:MXDataIterGetIterInfo, + (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), + hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) + + return Symbol(unsafe_wrap(String, ref_name[])) +end + +const _iter_creator_cache = Dict{Symbol, MX_handle}() +function _populate_iter_creator_cache!() + empty!(_iter_creator_cache) + h_creators = _get_iter_creators() + for handle in h_creators + name = _get_iter_name(handle) + _iter_creator_cache[name] = handle + end +end + +_get_iter_creator(name :: Symbol) = _iter_creator_cache[name] + +function _define_data_iter_creator(hdr :: MX_handle) ref_name = Ref{char_p}(0) ref_desc = 
Ref{char_p}(0) ref_narg = Ref{MX_uint}(0) @@ -561,19 +555,24 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) iter_name = Symbol(unsafe_wrap(String, ref_name[])) - if gen_docs - if endswith(string(iter_name), "Iter") - f_desc = "Can also be called with the alias `$(string(iter_name)[1:end-4] * "Provider")`.\n" - else - f_desc = "" - end - f_desc *= unsafe_string(ref_desc[]) * "\n\n" - f_desc *= ":param Base.Symbol data_name: keyword argument, default `:data`. The name of the data.\n" - f_desc *= ":param Base.Symbol label_name: keyword argument, default `:softmax_label`. " * - "The name of the label. Could be `nothing` if no label is presented in this dataset.\n\n" - f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) - f_desc *= ":return: the constructed `MXDataProvider`." - return (iter_name, f_desc) + isprovider = endswith(string(iter_name), "Iter") + signature = _format_signature(Int(ref_narg[]), ref_arg_names) + f_desc = " " * string(iter_name) * "(" *signature * ")\n\n" + if isprovider + f_desc *= "Can also be called with the alias `$(string(iter_name)[1:end-4] * "Provider")`.\n" + end + f_desc *= unsafe_string(ref_desc[]) * "\n\n" + f_desc *= "# Arguments:\n" + f_desc *= "* `data_name::Symbol`: keyword argument, default `:data`. The name of the data.\n" + f_desc *= "* `label_name::Symbol`: keyword argument, default `:softmax_label`. " * + "The name of the label. Could be `nothing` if no label is presented in this dataset.\n\n" + f_desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) * "\n" + f_desc *= "Returns the constructed `MXDataProvider`." 
+ + if isprovider + alias_name = Symbol(string(iter_name)[1:end-4] * "Provider") + else + alias_name = nothing end defun = quote @@ -582,42 +581,28 @@ function _define_data_iter_creator(hdr :: MX_handle; gen_docs::Bool=false) arg_vals = String[dump_mx_param(v) for (k,v) in kwargs] ref_hdr = Ref{MX_handle}(0) + local hdr = _get_iter_creator($(QuoteNode(iter_name))) @mxcall(:MXDataIterCreateIter, (MX_handle, MX_uint, char_pp, char_pp, Ref{MX_handle}), - $hdr, length(arg_keys), arg_keys, arg_vals, ref_hdr) + hdr, length(arg_keys), arg_keys, arg_vals, ref_hdr) return MXDataProvider(MX_DataIterHandle(ref_hdr[]); kwargs...) end - end - eval(defun) + $(isprovider ? :(const $alias_name = $iter_name) : :()) - # add an alias XXXProvider => XXXIter - if endswith(string(iter_name), "Iter") - alias_name = Symbol(string(iter_name)[1:end-4] * "Provider") - eval(:($alias_name = $iter_name)) + @doc $f_desc $iter_name end + defun end -function _import_io_iterators(;gen_docs::Bool=false) - n_ref = Ref{MX_uint}(0) - h_ref = Ref{Ptr{MX_handle}}(0) - @mxcall(:MXListDataIters, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) - - n_creators = n_ref[] - h_creators = unsafe_wrap(Array, h_ref[], n_creators) - - if gen_docs - docs = Dict{Base.Symbol, AbstractString}() - end - - for i = 1:n_creators - creator_hdr = h_creators[i] - ret = _define_data_iter_creator(creator_hdr; gen_docs=gen_docs) - if gen_docs - docs[ret[1]] = ret[2] - end - end - - if gen_docs - return docs +macro _import_io_iterators() + creators = _get_iter_creators() + defs = Expr[] + for handle in creators + push!(defs, _define_data_iter_creator(handle)) end + esc(quote + $(defs...) + end) end + +@_import_io_iterators() diff --git a/src/ndarray.jl b/src/ndarray.jl index 14fdee01564f..65f1a15bd7b1 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -241,7 +241,7 @@ import Base: size, length, ndims, eltype size(arr :: NDArray, dim :: Int) Get the shape of an `NDArray`. The shape is in Julia's column-major convention. 
See -also the notes on NDArray shapes [`NDArrat`](@ref). +also the notes on NDArray shapes [`NDArray`](@ref). """ function size(arr :: NDArray) ref_ndim = Ref{MX_uint}(0) From c1268953bf95d45e314b790251b20a442f387cf7 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 23 Aug 2016 05:16:38 +0900 Subject: [PATCH 379/630] use `!!! note` syntax (this breaks documentation creation on v0.4) --- .travis.yml | 1 + docs/src/api/io.md | 26 +++++++++++++------------- 2 files changed, 14 insertions(+), 13 deletions(-) diff --git a/.travis.yml b/.travis.yml index 08c7db10e0ab..284ca4b422ae 100644 --- a/.travis.yml +++ b/.travis.yml @@ -38,6 +38,7 @@ script: after_success: - source $TRAVIS/run_coverage.sh + - echo $TRAVIS_JULIA_VERSION - julia -e 'Pkg.add("Documenter")' - julia -e 'cd(Pkg.dir("MXNet")); include(joinpath("docs", "make.jl"))' diff --git a/docs/src/api/io.md b/docs/src/api/io.md index fe5fd2f46e2b..7312259dbf3c 100644 --- a/docs/src/api/io.md +++ b/docs/src/api/io.md @@ -79,20 +79,20 @@ case, you can safely assume that With those assumptions, it will be relatively easy to adapt any existing iterator. See the implementation of the built-in `MXDataProvider` for example. -### Note: -Please do not use the one data provider simultaneously in two different places, either in parallel, -or in a nested loop. For example, the behavior for the following code is undefined - -```julia -for batch in data - # updating the parameters - - # now let's test the performance on the training set - for b2 in data - # ... +!!! note + Please do not use the one data provider simultaneously in two different places, either in parallel, + or in a nested loop. For example, the behavior for the following code is undefined + + ```julia + for batch in data + # updating the parameters + + # now let's test the performance on the training set + for b2 in data + # ... 
+ end end -end -``` + ``` ```@docs mx.get_batch_size From 3bbd8663fb34f6f400cdaef73a539c6504eded4b Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 23 Aug 2016 06:19:00 +0900 Subject: [PATCH 380/630] build documentation on 0.5 --- docs/make.jl | 1 + 1 file changed, 1 insertion(+) diff --git a/docs/make.jl b/docs/make.jl index 06bbef0466cd..a84f680711a5 100644 --- a/docs/make.jl +++ b/docs/make.jl @@ -8,4 +8,5 @@ makedocs( deploydocs( deps = Deps.pip("pygments", "mkdocs", "mkdocs-material", "python-markdown-math"), repo = "github.com/dmlc/MXNet.jl.git", + julia = "0.5", ) From 84866f46890b61213e0326c06415fed890291d3b Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 23 Aug 2016 07:24:00 +0900 Subject: [PATCH 381/630] fix documentation being attached to the wrong binding: --- src/symbolic-node.jl | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index b71733ace71b..40fc84b3cb42 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -33,13 +33,14 @@ function Base.copy(self :: SymbolicNode) end # TODO(vchuravy) How to add documentation to the v0.5 style call overloading -""" +@doc """ call(self :: SymbolicNode, args :: SymbolicNode...) call(self :: SymbolicNode; kwargs...) Make a new node by composing `self` with `args`. Or the arguments can be specified using keyword arguments. -""" +""" SymbolicNode + @compat function (self::SymbolicNode)(args :: SymbolicNode...) s = deepcopy(self) _compose!(s, args...) 
From 053ab4258456251f6989bb9902a48fb7071c5f8b Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 24 Aug 2016 06:58:04 +0900 Subject: [PATCH 382/630] fix overseen typo --- src/model.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/model.jl b/src/model.jl index d6752e24ebd3..580896e051e6 100644 --- a/src/model.jl +++ b/src/model.jl @@ -113,7 +113,7 @@ function init_model(self :: FeedForward, initializer :: AbstractInitializer; ove for (name, shape) in zip(aux_names, aux_shapes) if haskey(self.aux_params, name) - if shape == size(self.auxg_params[name]) + if shape == size(self.aux_params[name]) aux_params[name] = self.aux_params[name] continue else From e6979600f8781567a20a29241db7f1c29d8cddec Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 27 Aug 2016 16:57:52 +0900 Subject: [PATCH 383/630] add grad function to do autodiff --- src/symbolic-node.jl | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 40fc84b3cb42..498de4ba42bc 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -202,6 +202,26 @@ function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) @mxcall(:MXSymbolSetAttr, (MX_handle, Cstring, Cstring), self, key_s, value_s) end +""" + grad(self :: SymbolicNode, wrt :: Vector{Symbol}) + +Get the autodiff gradient of the current `SymbolicNode`. This function can +only be used if the current symbol is a loss function. + +# Arguments: +* `self::SymbolicNode`: current node. +* `wrt::Vector{Symbol}`: the names of the arguments to the gradient. + +Returns a gradient symbol of the corresponding gradient. 
+""" +function grad(self :: SymbolicNode, wrt :: Vector{Symbol}) + hdr_ref = Ref{MX_handle}(0) + keys = String[string(key) for key in wrt] + + @mxcall(:MXSymbolGrad, (MX_handle, MX_uint, char_pp, Ptr{MX_handle}), self, length(keys), keys, hdr_ref) + return SymbolicNode(MX_SymbolHandle(hdr_ref[])) +end + """ Variable(name :: Union{Symbol, AbstractString}) From 4403ef3c810e960d6b619de01354b66bfdf2315e Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 25 Aug 2016 05:03:17 +0900 Subject: [PATCH 384/630] add MultiMetric and reorder metric docs --- src/metric.jl | 88 ++++++++++++++++++++++++++++++++++++++------------- 1 file changed, 66 insertions(+), 22 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index dc00bdafb267..1e11098321ff 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -2,32 +2,24 @@ AbstractEvalMetric The base class for all evaluation metrics. The sub-types should implement the following -interfaces. +interfaces: - .. function:: update!(metric, labels, preds) - - Update and accumulate metrics. - - :param AbstractEvalMetric metric: the metric object. - :param labels: the labels from the data provider. - :type labels: Vector{NDArray} - :param preds: the outputs (predictions) of the network. - :type preds: Vector{NDArray} - - .. function:: reset!(metric) - - Reset the accumulation counter. +* [`update!`](@ref) +* [`reset!`](@ref) +* [`get`](@ref) +""" +abstract AbstractEvalMetric - .. function:: get(metric) +""" + update!(metric, labels, preds) - Get the accumulated metrics. +Update and accumulate metrics. - :return: `Vector{Tuple{Base.Symbol, Real}}`, a list of name-value pairs. For - example, `[(:accuracy, 0.9)]`. +# Arguments: +* `metric::AbstractEvalMetric`: the metric object. +* `labels::Vector{NDArray}`: the labels from the data provider. +* `preds::Vector{NDArray}`: the outputs (predictions) of the network. """ -abstract AbstractEvalMetric - -# Generic update! 
version function update!{T <: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}) if length(labels) != length(preds) Base.warn_once( @@ -39,6 +31,59 @@ function update!{T <: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray} end end +""" + reset!(metric) + +Reset the accumulation counter. +""" +function reset!(metric :: AbstractEvalMetric) + throw(MethodError(reset!, (typeof(metric),))) +end + + +import Base: get +""" + get(metric) + +Get the accumulated metrics. + +Returns `Vector{Tuple{Base.Symbol, Real}}`, a list of name-value pairs. +For example, `[(:accuracy, 0.9)]`. +""" +function get(metric :: AbstractEvalMetric) + throw(MethodError(get, (typeof(metric),))) +end + +""" + MultiMetric(metrics::Vector{AbstractEvalMetric}) + +Combine multiple metrics in one and get a result for all of them. + +# Usage +To calculate both accuracy [`Accuracy`](@ref) and log-loss [`ACE`](@ref): +```julia + mx.fit(..., eval_metric = mx.MultiMetric([mx.Accuracy(), mx.ACE()])) +``` +""" +type MultiMetric <: mx.AbstractEvalMetric + metrics :: Vector{mx.AbstractEvalMetric} +end + +function update!(metric :: MultiMetric, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + for m in metric.metrics + update!(m, labels, preds) + end + return nothing +end + +function reset!(metric :: MultiMetric) + map(reset!, metric.metrics) + return nothing +end + +function get(metric :: MultiMetric) + mapreduce(get, append!, metric.metrics) +end """ Accuracy @@ -89,7 +134,6 @@ function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDA end end -import Base: get function get(metric :: Accuracy) return [(:accuracy, metric.acc_sum / metric.n_sample)] end From 12a87e540f2c97b1bb5ef0870c043f440d93788c Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 24 Aug 2016 21:33:39 +0900 Subject: [PATCH 385/630] add one-dimensional ACE --- src/metric.jl | 69 +++++++++++++++++++++++++++++++-------------------- 1 file changed, 42 
insertions(+), 27 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 1e11098321ff..14f56697c4cf 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -206,23 +206,30 @@ function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) @nd_as_jl ro=(label,pred) begin # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) - @assert ndims(pred) == 4 - - labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) - for sample in 1:size(labels, 4) - for j in 1:size(labels, 2) - for i in 1:size(labels, 1) - label = labels[i, j, 1, sample] - - # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification - # Since we can only target labels right now this is the only thing we can do. - target = Int(label) + 1 # klasses are 0...k-1 => julia indexing - p_k = pred[i, j, target, sample] + if ndims(pred) == 4 + labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) + for sample in 1:size(labels, 4) + for j in 1:size(labels, 2) + for i in 1:size(labels, 1) + # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification + # Since we can only target labels right now this is the only thing we can do. 
+ target = Int(labels[i, j, 1, sample]) + 1 # klasses are 0...k-1 => julia indexing + p_k = pred[i, j, target, sample] - metric.ace_sum += log(p_k) - metric.n_sample += 1 + metric.ace_sum += log(p_k) + metric.n_sample += 1 + end end end + elseif ndims(pred) == 2 # 1-dimensional case: index `label` directly (`labels` only exists in the 4-D branch) + for sample in 1:size(label, 1) + target = Int(label[sample]) + 1 + p_k = pred[target, sample] + metric.ace_sum += log(p_k) + metric.n_sample += 1 + end + else + error("Can't handle prediction with dimensions $(ndims(pred)).") end end end @@ -257,23 +264,31 @@ function _update_single_output(metric :: MultiACE, label :: NDArray, pred :: NDA @nd_as_jl ro=(label,pred) begin # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) - @assert ndims(pred) == 4 - - labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) - for sample in 1:size(labels, 4) - for j in 1:size(labels, 2) - for i in 1:size(labels, 1) - label = labels[i, j, 1, sample] - # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification - # Since we can only target labels right now this is the only thing we can do. - target = Int(label) + 1 # klasses are 0...k-1 => julia indexing - p_k = pred[i, j, target, sample] + if ndims(pred) == 4 + labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) + for sample in 1:size(labels, 4) + for j in 1:size(labels, 2) + for i in 1:size(labels, 1) + # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification + # Since we can only target labels right now this is the only thing we can do. 
+ target = Int(labels[i, j, 1, sample]) + 1 # klasses are 0...k-1 => julia indexing + p_k = pred[i, j, target, sample] - metric.aces[target] += log(p_k) - metric.counts[target] += 1 + metric.aces[target] += log(p_k) + metric.counts[target] += 1 + end end end + elseif ndims(pred) == 2 + for sample in 1:size(label, 1) + target = Int(label[sample]) + 1 + p_k = pred[target, sample] + metric.aces[target] += log(p_k) + metric.counts[target] += 1 + end + else + error("Can't handle prediction with dimensions $(ndims(pred)).") end end end From ab19db8b76084fc678a95aaba141b0a9c1b833f4 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Mon, 29 Aug 2016 03:22:14 +0900 Subject: [PATCH 386/630] update docs for ACE --- src/metric.jl | 10 +++------- 1 file changed, 3 insertions(+), 7 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 14f56697c4cf..4ae66acf25b7 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -182,9 +182,7 @@ end """ ACE -Averaged cross-entropy for classification. This also know als logloss. - -Calculated the averaged cross entropy for multi-dimentions output. +Calculates the averaged cross-entropy (logloss) for classification. """ type ACE <: AbstractEvalMetric ace_sum :: Float64 @@ -237,10 +235,8 @@ end """ MultiACE -Averaged cross-entropy for classification. This also know als logloss. -This variant keeps track of the different losses per class. - -Calculated the averaged cross entropy for multi-dimentions output. +Calculates the averaged cross-entropy per class and overall (see [`ACE`](@ref)). +This can be used to quantify the influence of different classes on the overall loss. 
""" type MultiACE <: AbstractEvalMetric aces :: Vector{Float64} From 637e3785d97b76daf4ba9d9ba7b46a26fd148a39 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 1 Sep 2016 02:08:10 +0900 Subject: [PATCH 387/630] cleanup docs a bit more --- docs/src/api/optimizer.md | 15 +++- docs/src/api/optimizers/adam.md | 6 -- docs/src/api/optimizers/sgd.md | 6 -- src/callback.jl | 36 ++++----- src/executor.jl | 6 +- src/model.jl | 131 ++++++++++++++++---------------- src/ndarray.jl | 49 +++++------- src/nn-factory.jl | 2 +- src/optimizer.jl | 84 ++++++++++---------- src/optimizers/adam.jl | 34 ++++----- src/optimizers/sgd.jl | 35 ++++----- src/symbolic-node.jl | 16 ++-- src/util.jl | 1 - src/visualize.jl | 9 ++- 14 files changed, 207 insertions(+), 223 deletions(-) delete mode 100644 docs/src/api/optimizers/adam.md delete mode 100644 docs/src/api/optimizers/sgd.md diff --git a/docs/src/api/optimizer.md b/docs/src/api/optimizer.md index 043529a670c1..81fad7cb827e 100644 --- a/docs/src/api/optimizer.md +++ b/docs/src/api/optimizer.md @@ -1,12 +1,21 @@ # Optimizers ```@autodocs -Modules = [MXNet.mx] +Modules = [MXNet.mx, MXNet.mx.LearningRate, MXNet.mx.Momentum] Pages = ["optimizer.jl"] ``` ## Built-in optimizers -```@contents -Pages = ["optimizers/adam.md", "optimizers/sgd.md"] +### Stochastic Gradient Descent +```@autodocs +Modules = [MXNet.mx] +Pages = ["optimizers/sgd.jl"] +``` + +### ADAM +```@autodocs +Modules = [MXNet.mx] +Pages = ["optimizers/adam.jl"] ``` + diff --git a/docs/src/api/optimizers/adam.md b/docs/src/api/optimizers/adam.md deleted file mode 100644 index 269d82a9c80e..000000000000 --- a/docs/src/api/optimizers/adam.md +++ /dev/null @@ -1,6 +0,0 @@ -# ADAM - -```@autodocs -Modules = [MXNet.mx] -Pages = ["adam.jl"] -``` diff --git a/docs/src/api/optimizers/sgd.md b/docs/src/api/optimizers/sgd.md deleted file mode 100644 index 506c7b5c266d..000000000000 --- a/docs/src/api/optimizers/sgd.md +++ /dev/null @@ -1,6 +0,0 @@ -# Stochastic Gradient Descent - 
-```@autodocs -Modules = [MXNet.mx] -Pages = ["sgd.jl"] -``` diff --git a/src/callback.jl b/src/callback.jl index 6203f9f51f87..7736bbf08a44 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -32,21 +32,21 @@ A convenient function to construct a callback that runs every `n` mini-batches. # Arguments * `call_on_0::Bool`: keyword argument, default false. Unless set, the callback - will **not** be run on batch 0. + will *not* be run on batch 0. -For example, the :func:`speedometer` callback is defined as +For example, the [`speedometer`](@ref) callback is defined as - .. code-block:: julia - - every_n_iter(frequency, call_on_0=true) do state :: OptimizationState - if state.curr_batch == 0 - # reset timer - else - # compute and print speed - end - end +```julia +every_n_batch(frequency, call_on_0=true) do state :: OptimizationState + if state.curr_batch == 0 + # reset timer + else + # compute and print speed + end +end +``` - :seealso: :func:`every_n_epoch`, :func:`speedometer`. +See also [`every_n_epoch`](@ref) and [`speedometer`](@ref). """ function every_n_batch(callback :: Function, n :: Int; call_on_0 :: Bool = false) BatchCallback(n, call_on_0, callback) @@ -68,7 +68,7 @@ Create an `AbstractBatchCallback` that measure the training speed (number of samples processed per second) every k mini-batches. # Arguments -* Int frequency: keyword argument, default 50. The frequency (number of +* `frequency::Int`: keyword argument, default 50. The frequency (number of min-batches) to measure and report the speed. """ function speedometer(;frequency::Int=50) @@ -97,12 +97,12 @@ end A convenient function to construct a callback that runs every `n` full data-passes. -* Int call_on_0: keyword argument, default false. Unless set, the callback - will **not** be run on epoch 0. Epoch 0 means no training has been performed +* `call_on_0::Bool`: keyword argument, default false. Unless set, the callback + will *not* be run on epoch 0. Epoch 0 means no training has been performed yet. 
This is useful if you want to inspect the randomly initialized model that has not seen any data yet. - :seealso: :func:`every_n_iter`. +See also [`every_n_iter`](@ref). """ function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) @@ -127,9 +127,9 @@ The checkpoints can be loaded back later on. * `prefix::AbstractString`: the prefix of the filenames to save the model. The model architecture will be saved to prefix-symbol.json, while the weights will be saved to prefix-0012.params, for example, for the 12-th epoch. -* Int frequency: keyword argument, default 1. The frequency (measured in epochs) to +* `frequency::Int`: keyword argument, default 1. The frequency (measured in epochs) to save checkpoints. -* Bool save_epoch_0: keyword argument, default false. Whether we should save a +* `save_epoch_0::Bool`: keyword argument, default false. Whether we should save a checkpoint for epoch 0 (model initialized but not seen any data yet). """ function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) diff --git a/src/executor.jl b/src/executor.jl index 8e8bdd3bec93..3ae5301a6c92 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -75,8 +75,8 @@ Create an `Executor` by binding a `SymbolicNode` to concrete `NDArray`. * `ctx::Context`: the context on which the computation should run. * `args`: either a list of `NDArray` or a dictionary of name-array pairs. Concrete arrays for all the inputs in the network architecture. The inputs typically include - network parameters (weights, bias, filters, etc.), data and labels. See :func:`list_arguments` - and :func:`infer_shape`. + network parameters (weights, bias, filters, etc.), data and labels. See [`list_arguments`](@ref) + and [`infer_shape`](@ref). * `args_grad`: * `aux_states`: * `grad_req`: @@ -211,7 +211,7 @@ Can be used to get an estimated about the memory cost. dProvider = ... 
# DataProvider exec = mx.simple_bind(net, mx.cpu(), data=size(dProvider.data_batch[1])) dbg_str = mx.debug_str(exec) - println(split(ref, ['\n'])[end-2]) + println(split(ref, ['\\n'])[end-2]) ``` """ function debug_str(self :: Executor) diff --git a/src/model.jl b/src/model.jl index 580896e051e6..a892dc886ca3 100644 --- a/src/model.jl +++ b/src/model.jl @@ -11,8 +11,8 @@ abstract AbstractModel The feedforward model provides convenient interface to train and predict on feedforward architectures like multi-layer MLP, ConvNets, etc. There is no explicitly handling of *time index*, but it is relatively easy to implement -unrolled RNN / LSTM under this framework (**TODO**: add example). For models -that handles sequential data explicitly, please use **TODO**... +unrolled RNN / LSTM under this framework (*TODO*: add example). For models +that handles sequential data explicitly, please use *TODO*... """ type FeedForward <: AbstractModel arch :: SymbolicNode @@ -47,10 +47,11 @@ end """ FeedForward(arch :: SymbolicNode, ctx) -* arch: the architecture of the network constructed using the symbolic API. -* ctx: the devices on which this model should do computation. It could be a single `Context` - or a list of `Context` objects. In the latter case, data parallelization will be used - for training. If no context is provided, the default context `cpu()` will be used. +# Arguments: +* `arch`: the architecture of the network constructed using the symbolic API. +* `ctx`: the devices on which this model should do computation. It could be a single `Context` + or a list of `Context` objects. In the latter case, data parallelization will be used + for training. If no context is provided, the default context `cpu()` will be used. """ function FeedForward(arch :: SymbolicNode; context :: Union{Context, Vector{Context}, Void} = nothing) if isa(context, Void) @@ -64,17 +65,18 @@ end """ init_model(self, initializer; overwrite=false, input_shapes...) - Initialize the weights in the model. 
+Initialize the weights in the model. - This method will be called automatically when training a model. So there is usually no - need to call this method unless one needs to inspect a model with only randomly initialized - weights. +This method will be called automatically when training a model. So there is usually no +need to call this method unless one needs to inspect a model with only randomly initialized +weights. -* FeedForward self: the model to be initialized. -* AbstractInitializer initializer: an initializer describing how the weights should be initialized. -* Bool overwrite: keyword argument, force initialization even when weights already exists. -* input_shapes: the shape of all data and label inputs to this model, given as keyword arguments. - For example, `data=(28,28,1,100), label=(100,)`. +# Arguments: +* `self::FeedForward`: the model to be initialized. +* `initializer::AbstractInitializer`: an initializer describing how the weights should be initialized. +* `overwrite::Bool`: keyword argument, force initialization even when weights already exists. +* `input_shapes`: the shape of all data and label inputs to this model, given as keyword arguments. + For example, `data=(28,28,1,100), label=(100,)`. """ function init_model(self :: FeedForward, initializer :: AbstractInitializer; overwrite::Bool=false, input_shapes...) # all arg names, including data, label, and parameters @@ -162,46 +164,44 @@ function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_sha end """ -.. function:: - predict(self, data; overwrite=false, callback=nothing) + predict(self, data; overwrite=false, callback=nothing) - Predict using an existing model. The model should be already initialized, or trained or loaded from - a checkpoint. There is an overloaded function that allows to pass the callback as the first argument, - so it is possible to do +Predict using an existing model. The model should be already initialized, or trained or loaded from +a checkpoint. 
There is an overloaded function that allows to pass the callback as the first argument, +so it is possible to do - .. code-block:: julia - - predict(model, data) do batch_output - # consume or write batch_output to file - end - -* FeedForward self: the model. -* AbstractDataProvider data: the data to perform prediction on. -* Bool overwrite: an `Executor` is initialized the first time predict is called. The memory - allocation of the `Executor` depends on the mini-batch size of the test - data provider. If you call predict twice with data provider of the same batch-size, - then the executor can be potentially be re-used. So, if `overwrite` is false, - we will try to re-use, and raise an error if batch-size changed. If `overwrite` - is true (the default), a new `Executor` will be created to replace the old one. - - .. note:: - - Prediction is computationally much less costly than training, so the bottleneck sometimes becomes the IO - for copying mini-batches of data. Since there is no concern about convergence in prediction, it is better - to set the mini-batch size as large as possible (limited by your device memory) if prediction speed is a - concern. - - For the same reason, currently prediction will only use the first device even if multiple devices are - provided to construct the model. - - .. note:: - - If you perform further after prediction. The weights are not automatically synchronized if `overwrite` - is set to false and the old predictor is re-used. In this case - setting `overwrite` to true (the default) will re-initialize the predictor the next time you call - predict and synchronize the weights again. - - :seealso: :func:`train`, :func:`fit`, :func:`init_model`, :func:`load_checkpoint` +```julia +predict(model, data) do batch_output + # consume or write batch_output to file +end +``` + +# Arguments: +* `self::FeedForward`: the model. +* `data::AbstractDataProvider`: the data to perform prediction on. 
+* `overwrite::Bool`: an `Executor` is initialized the first time predict is called. The memory + allocation of the `Executor` depends on the mini-batch size of the test + data provider. If you call predict twice with data provider of the same batch-size, + then the executor can potentially be re-used. So, if `overwrite` is false, + we will try to re-use, and raise an error if batch-size changed. If `overwrite` + is true (the default), a new `Executor` will be created to replace the old one. + +!!! note + Prediction is computationally much less costly than training, so the bottleneck sometimes becomes the IO + for copying mini-batches of data. Since there is no concern about convergence in prediction, it is better + to set the mini-batch size as large as possible (limited by your device memory) if prediction speed is a + concern. + + For the same reason, currently prediction will only use the first device even if multiple devices are + provided to construct the model. + +!!! note + If you perform further training after prediction, the weights are not automatically synchronized if `overwrite` + is set to false and the old predictor is re-used. In this case + setting `overwrite` to true (the default) will re-initialize the predictor the next time you call + predict and synchronize the weights again. + +See also [`train`](@ref), [`fit`](@ref), [`init_model`](@ref), and [`load_checkpoint`](@ref) """ function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = true) predict(self, data; overwrite = overwrite, callback=callback) @@ -310,7 +310,7 @@ end """ train(model :: FeedForward, ...) -Alias to :func:`fit`. +Alias to [`fit`](@ref). """ function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) fit(self, optimizer, data; kwargs...) @@ -321,26 +321,25 @@ end Train the `model` on `data` with the `optimizer`. -* FeedForward model: the model to be trained.
-* AbstractOptimizer optimizer: the optimization algorithm to use. -* AbstractDataProvider data: the training data provider. -* Int n_epoch: default 10, the number of full data-passes to run. -* AbstractDataProvider eval_data: keyword argument, default `nothing`. The data provider for +* `model::FeedForward`: the model to be trained. +* `optimizer::AbstractOptimizer`: the optimization algorithm to use. +* `data::AbstractDataProvider`: the training data provider. +* `n_epoch::Int`: default 10, the number of full data-passes to run. +* `eval_data::AbstractDataProvider`: keyword argument, default `nothing`. The data provider for the validation set. -* AbstractEvalMetric eval_metric: keyword argument, default `Accuracy()`. The metric used +* `eval_metric::AbstractEvalMetric`: keyword argument, default [`Accuracy()`](@ref). The metric used to evaluate the training performance. If `eval_data` is provided, the same metric is also calculated on the validation set. -* kvstore: keyword argument, default `:local`. The key-value store used to synchronize gradients +* `kvstore`: keyword argument, default `:local`. The key-value store used to synchronize gradients and parameters when multiple devices are used for training. :type kvstore: `KVStore` or `Base.Symbol` -* AbstractInitializer initializer: keyword argument, default `UniformInitializer(0.01)`. -* Bool force_init: keyword argument, default false. By default, the random initialization using the +* `initializer::AbstractInitializer`: keyword argument, default `UniformInitializer(0.01)`. +* `force_init::Bool`: keyword argument, default false. By default, the random initialization using the provided `initializer` will be skipped if the model weights already exists, maybe from a previous - call to :func:`train` or an explicit call to :func:`init_model` or :func:`load_checkpoint`. When + call to [`train`](@ref) or an explicit call to [`init_model`](@ref) or [`load_checkpoint`](@ref). 
When this option is set, it will always do random initialization at the begining of training. -* callbacks: keyword argument, default `[]`. Callbacks to be invoked at each epoch or mini-batch, +* `callbacks::Vector{AbstractCallback}`: keyword argument, default `[]`. Callbacks to be invoked at each epoch or mini-batch, see `AbstractCallback`. - :type callbacks: `Vector{AbstractCallback}` """ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) opts = TrainingOptions(; kwargs...) diff --git a/src/ndarray.jl b/src/ndarray.jl index 65f1a15bd7b1..fb06ca2a9573 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -122,10 +122,9 @@ end """ -.. function:: - empty(DType, shape :: Tuple, ctx :: Context) - empty(DType, shape :: Tuple) - empty(DType, dim1, dim2, ...) + empty(DType, shape :: Tuple, ctx :: Context) + empty(DType, shape :: Tuple) + empty(DType, dim1, dim2, ...) Allocate memory for an uninitialized `NDArray` with a specified type. """ @@ -140,10 +139,9 @@ function empty{T<:DType}(:: Type{T}, shape :: Int...) end """ -.. function:: - empty(shape :: Tuple, ctx :: Context) - empty(shape :: Tuple) - empty(dim1, dim2, ...) + empty(shape :: Tuple, ctx :: Context) + empty(shape :: Tuple) + empty(dim1, dim2, ...) Allocate memory for an uninitialized `NDArray` with specific shape of type Float32. """ @@ -236,9 +234,8 @@ end import Base: size, length, ndims, eltype """ -.. function:: - size(arr :: NDArray) - size(arr :: NDArray, dim :: Int) + size(arr :: NDArray) + size(arr :: NDArray, dim :: Int) Get the shape of an `NDArray`. The shape is in Julia's column-major convention. See also the notes on NDArray shapes [`NDArray`](@ref). @@ -390,8 +387,7 @@ end import Base: copy!, copy, convert """ -.. function:: - copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) + copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) Copy contents of `src` into `dst`. 
""" @@ -467,7 +463,6 @@ end Convert an `NDArray` into a Julia `Array` of specific type. Data will be copied. """ -# Convert copy: NDArray -> Julia Array function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) convert(t, copy(arr)) end @@ -811,10 +806,9 @@ Try to create a Julia array by sharing the data with the underlying `NDArray`. # Arguments: * `arr::NDArray`: the array to be shared. - .. warning:: - - The returned array does not guarantee to share data with the underlying `NDArray`. - In particular, data sharing is possible only when the `NDArray` lives on CPU. +!!! note + The returned array does not guarantee to share data with the underlying `NDArray`. + In particular, data sharing is possible only when the `NDArray` lives on CPU. """ function try_get_shared(arr :: NDArray) if context(arr).device_type == CPU @@ -930,22 +924,21 @@ The libxmnet APIs are automatically imported from `libmxnet.so`. The functions l here operate on `NDArray` objects. The arguments to the functions are typically ordered as -.. code-block:: julia - - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) +```julia + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ..., arg_out1, arg_out2, ...) +``` unless `NDARRAY_ARG_BEFORE_SCALAR` is not set. In this case, the scalars are put before the input arguments: -.. code-block:: julia - - func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) - +```julia + func_name(scalar1, scalar2, ..., arg_in1, arg_in2, ..., arg_out1, arg_out2, ...) +``` If `ACCEPT_EMPTY_MUTATE_TARGET` is set. An overloaded function without the output arguments will also be defined: -.. code-block:: julia - - func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) +```julia + func_name(arg_in1, arg_in2, ..., scalar1, scalar2, ...) +``` Upon calling, the output arguments will be automatically initialized with empty NDArrays. 
diff --git a/src/nn-factory.jl b/src/nn-factory.jl index a60a4716bfef..76babffbe035 100644 --- a/src/nn-factory.jl +++ b/src/nn-factory.jl @@ -14,7 +14,7 @@ fully connected layers. * `hidden_activation::Symbol`: keyword argument, default `:relu`, indicating the default activation for hidden layers. The specification here could be overwritten by layer-wise specification in the `spec` argument. Also activation is not - applied to the last, i.e. the prediction layer. See :func:`Activation` for a + applied to the last, i.e. the prediction layer. See [`Activation`](@ref) for a list of supported activation types. * `prefix`: keyword argument, default `gensym()`, used as the prefix to name the constructed layers. diff --git a/src/optimizer.jl b/src/optimizer.jl index c5d4b29aa308..c672c2fe998a 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -24,27 +24,20 @@ abstract AbstractMomentumScheduler """ OptimizationState - .. attribute:: batch_size - - The size of the mini-batch used in stochastic training. - - .. attribute:: curr_epoch - - The current epoch count. Epoch 0 means no training yet, during the first - pass through the data, the epoch will be 1; during the second pass, the - epoch count will be 1, and so on. - - .. attribute:: curr_batch - - The current mini-batch count. The batch count is reset during every epoch. - The batch count 0 means the beginning of each epoch, with no mini-batch - seen yet. During the first mini-batch, the mini-batch count will be 1. - - .. attribute:: curr_iter - - The current iteration count. One iteration corresponds to one mini-batch, - but unlike the mini-batch count, the iteration count does **not** reset - in each epoch. So it track the *total* number of mini-batches seen so far. +# Attributes: +* `batch_size`: The size of the mini-batch used in stochastic training. +* `curr_epoch`: + The current epoch count. 
Epoch 0 means no training yet, during the first + pass through the data, the epoch will be 1; during the second pass, the + epoch count will be 2, and so on. +* `curr_batch`: + The current mini-batch count. The batch count is reset during every epoch. + The batch count 0 means the beginning of each epoch, with no mini-batch + seen yet. During the first mini-batch, the mini-batch count will be 1. +* `curr_iter`: + The current iteration count. One iteration corresponds to one mini-batch, + but unlike the mini-batch count, the iteration count does **not** reset + in each epoch. So it tracks the *total* number of mini-batches seen so far. """ type OptimizationState batch_size :: Int @@ -59,12 +52,12 @@ OptimizationState(batch_size::Int) = OptimizationState(batch_size, 0, 0, 0) get_learning_rate(scheduler, state) # Arguments -* AbstractLearningRateScheduler scheduler: a learning rate scheduler. -* OptimizationState state: the current state about epoch, mini-batch and iteration count. - :return: the current learning rate. +* `scheduler::AbstractLearningRateScheduler`: a learning rate scheduler. +* `state::OptimizationState`: the current state about epoch, mini-batch and iteration count. + +Returns the current learning rate. """ -function get_learning_rate -end +function get_learning_rate end ################################################################################ # The learning rate module @@ -74,7 +67,7 @@ import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate """ LearningRate.Fixed - Fixed learning rate scheduler always return the same learning rate. +Fixed learning rate scheduler always returns the same learning rate. """ type Fixed <: AbstractLearningRateScheduler learning_rate :: Float64 @@ -84,8 +77,8 @@ get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rat """ LearningRate.Exp - :math:`\eta_t = \eta_0\gamma^t`.
Here :math:`t` is the epoch count, or the iteration - count if `decay_on_iteration` is set to true. +``\eta_t = \eta_0\gamma^t``. Here ``t`` is the epoch count, or the iteration +count if `decay_on_iteration` is set to true. """ type Exp <: AbstractLearningRateScheduler learning_rate :: Float64 @@ -101,9 +94,9 @@ get_learning_rate(self :: Exp, state :: OptimizationState) = """ LearningRate.Inv - :math:`\eta_t = \eta_0 * (1 + \gamma * t)^(-power)`. - Here :math:`t` is the epoch count, or the iteration count if `decay_on_iteration` - is set to true. +``\eta_t = \eta_0 * (1 + \gamma * t)^(-power)``. +Here ``t`` is the epoch count, or the iteration count if `decay_on_iteration` +is set to true. """ type Inv <: AbstractLearningRateScheduler learning_rate :: Float64 @@ -132,9 +125,10 @@ end """ get_momentum(scheduler, state) -* AbstractMomentumScheduler scheduler: the momentum scheduler. -* OptimizationState state: the state about current epoch, mini-batch and iteration count. - :return: the current momentum. +* `scheduler::AbstractMomentumScheduler`: the momentum scheduler. +* `state::OptimizationState`: the state about current epoch, mini-batch and iteration count. + +Returns the current momentum. """ function get_momentum end @@ -148,8 +142,8 @@ import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum """ Momentum.Null - The null momentum scheduler always returns 0 for momentum. It is also used to - explicitly indicate momentum should not be used. +The null momentum scheduler always returns 0 for momentum. It is also used to +explicitly indicate momentum should not be used. """ type Null <: AbstractMomentumScheduler end @@ -158,7 +152,7 @@ get_momentum(self :: Null, state :: OptimizationState) = 0.0 """ Momentum.Fixed - Fixed momentum scheduler always returns the same value. +Fixed momentum scheduler always returns the same value. 
""" type Fixed <: AbstractMomentumScheduler momentum :: Float64 @@ -180,10 +174,10 @@ end """ get_updater(optimizer) -* AbstractOptimizer optimizer: the underlying optimizer. +A utility function to create an updater function, that uses its closure to +store all the states needed for each weights. - A utility function to create an updater function, that uses its closure to - store all the states needed for each weights. +* `optimizer::AbstractOptimizer`: the underlying optimizer. """ function get_updater(optimizer :: AbstractOptimizer) states = Dict{Int,Any}() @@ -206,11 +200,11 @@ abstract AbstractOptimizerOptions """ normalized_gradient(opts, state, grad) -* AbstractOptimizerOptions opts: options for the optimizer, should contain the field +* `opts::AbstractOptimizerOptions`: options for the optimizer, should contain the field `grad_scale`, `grad_clip` and `weight_decay`. -* OptimizationState state: the current optimization state. -* NDArray weight: the trainable weights. -* NDArray grad: the original gradient of the weights. +* `state::OptimizationState`: the current optimization state. +* `weight::NDArray`: the trainable weights. +* `grad::NDArray`: the original gradient of the weights. Get the properly normalized gradient (re-scaled and clipped if necessary). """ diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index 6b17f1b3e152..665cc52694b0 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -8,26 +8,26 @@ lr_scheduler :: Any = nothing ) -#=doc -.. class:: ADAM +""" + ADAM - The solver described in Diederik Kingma, Jimmy Ba: *Adam: A Method for - Stochastic Optimization*. arXiv:1412.6980 [cs.LG]. +The solver described in Diederik Kingma, Jimmy Ba: *Adam: A Method for +Stochastic Optimization*. arXiv:1412.6980 [cs.LG]. - .. function:: ADAM(; kwargs...) + ADAM(; kwargs...) - :param Real lr: default `0.001`, learning rate. - :param AbstractLearningRateScheduler lr_scheduler: default `nothing`, a - dynamic learning rate scheduler. 
If set, will overwrite the `lr` - parameter. - :param Real beta1: default `0.9`. - :param Real beta2: default `0.999`. - :param Real epsilon: default `1e-8`. - :param Real grad_clip: default `0`, if positive, will clip the gradient - into the range `[-grad_clip, grad_clip]`. - :param Real weight_decay: default `0.00001`, weight decay is equivalent - to adding a global l2 regularizer for all the parameters. -=# +* `lr::Real`: default `0.001`, learning rate. +* `lr_scheduler::AbstractLearningRateScheduler`: default `nothing`, a + dynamic learning rate scheduler. If set, will overwrite the `lr` + parameter. +* `beta1::Real`: default `0.9`. +* `beta2::Real`: default `0.999`. +* `epsilon::Real`: default `1e-8`. +* `grad_clip::Real`: default `0`, if positive, will clip the gradient + into the range `[-grad_clip, grad_clip]`. +* `weight_decay::Real`: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. +""" type ADAM <: AbstractOptimizer opts :: ADAMOptions state :: OptimizationState diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index fb6bf195fdb5..2eda1d0bf67c 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -7,26 +7,27 @@ momentum_scheduler :: Any = nothing ) -#=doc -.. class:: SGD +""" + SGD - Stochastic gradient descent optimizer. +Stochastic gradient descent optimizer. - .. function:: SGD(; kwargs...) + SGD(; kwargs...) - :param Real lr: default `0.01`, learning rate. - :param AbstractLearningRateScheduler lr_scheduler: default `nothing`, a - dynamic learning rate scheduler. If set, will overwrite the `lr` - parameter. - :param Real momentum: default `0.0`, the momentum. - :param AbstractMomentumScheduler momentum_scheduler: default `nothing`, - a dynamic momentum scheduler. If set, will overwrite the `momentum` - parameter. - :param Real grad_clip: default `0`, if positive, will clip the gradient - into the bounded range `[-grad_clip, grad_clip]`. 
- :param Real weight_decay: default `0.0001`, weight decay is equivalent to - adding a global l2 regularizer to the parameters. -=# +# Arguments: +* `lr::Real`: default `0.01`, learning rate. +* `lr_scheduler::AbstractLearningRateScheduler`: default `nothing`, a + dynamic learning rate scheduler. If set, will overwrite the `lr` + parameter. +* `momentum::Real`: default `0.0`, the momentum. +* `momentum_scheduler::AbstractMomentumScheduler`: default `nothing`, + a dynamic momentum scheduler. If set, will overwrite the `momentum` + parameter. +* `grad_clip::Real`: default `0`, if positive, will clip the gradient + into the bounded range `[-grad_clip, grad_clip]`. +* `weight_decay::Real`: default `0.0001`, weight decay is equivalent to + adding a global l2 regularizer to the parameters. +""" type SGD <: AbstractOptimizer opts :: SGDOptions state :: OptimizationState diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 498de4ba42bc..48ec27833ad6 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -189,11 +189,11 @@ end Set the attribute key to value for this `SymbolicNode`. -# Warning -It is encouraged not to call this function directly, unless you know exactly what you are doing. The -recommended way of setting attributes is when creating the `SymbolicNode`. Changing -the attributes of a `SymbolicNode` that is already been used somewhere else might -cause unexpected behavior and inconsistency. +!!! note + It is encouraged not to call this function directly, unless you know exactly what you are doing. The + recommended way of setting attributes is when creating the `SymbolicNode`. Changing + the attributes of a `SymbolicNode` that is already been used somewhere else might + cause unexpected behavior and inconsistency. """ function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) key_s = string(key) @@ -304,7 +304,7 @@ end Do shape inference according to the input shapes. 
The input shapes could be provided as a list of shapes, which should specify the shapes of inputs in the same order as -the arguments returned by :func:`list_arguments`. Alternatively, the shape information +the arguments returned by [`list_arguments`](@ref). Alternatively, the shape information could be specified via keyword arguments. Returns a 3-tuple containing shapes of all the arguments, shapes of all the outputs and @@ -372,7 +372,7 @@ end Do type inference according to the input types. The input types could be provided as a list of types, which should specify the types of inputs in the same order as -the arguments returned by :func:`list_arguments`. Alternatively, the type information +the arguments returned by [`list_arguments`](@ref). Alternatively, the type information could be specified via keyword arguments. Returns a 3-tuple containing types of all the arguments, types of all the outputs and @@ -401,7 +401,7 @@ end Get a node representing the specified output of this node. The index could be a symbol or string indicating the name of the output, or a 1-based integer -indicating the index, as in the list of :func:`list_outputs`. +indicating the index, as in the list of [`list_outputs`](@ref). 
""" function Base.getindex(self :: SymbolicNode, idx :: Union{Base.Symbol, AbstractString}) idx = Symbol(idx) diff --git a/src/util.jl b/src/util.jl index 5c50d20357e7..544962e4f161 100644 --- a/src/util.jl +++ b/src/util.jl @@ -62,7 +62,6 @@ end ################################################################################ # Internal Utilities ################################################################################ -const DOC_EMBED_ANCHOR = "**autogen:EMBED:{1}:EMBED:autogen**" function _format_typestring(typestr :: String) replace(typestr, r"\bSymbol\b", "SymbolicNode") end diff --git a/src/visualize.jl b/src/visualize.jl index c60868430a9c..f0dd74efdc67 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -3,13 +3,14 @@ import JSON """ to_graphviz(network) -* SymbolicNode network: the network to visualize. -* AbstractString title: keyword argument, default "Network Visualization", +* `network::SymbolicNode`: the network to visualize. +* `title::AbstractString:` keyword argument, default "Network Visualization", the title of the GraphViz graph. -* input_shapes: keyword argument, default `nothing`. If provided, +* `input_shapes`: keyword argument, default `nothing`. If provided, will run shape inference and plot with the shape information. Should be either a dictionary of name-shape mapping or an array of shapes. - :return: the graph description in GraphViz `dot` language. + +Returns the graph description in GraphViz `dot` language. 
""" function to_graphviz(network :: SymbolicNode; title="Network Visualization", input_shapes=nothing) if !isa(input_shapes, Void) From 3fac768636662e7befc95764fe32996c8e477494 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 2 Sep 2016 02:54:54 +0900 Subject: [PATCH 388/630] associate docs with method and not binding --- src/io.jl | 2 +- src/ndarray.jl | 24 +++++++++--------------- src/symbolic-node.jl | 11 +++-------- 3 files changed, 13 insertions(+), 24 deletions(-) diff --git a/src/io.jl b/src/io.jl index 1878125f15fd..0c5de69e53f8 100644 --- a/src/io.jl +++ b/src/io.jl @@ -576,6 +576,7 @@ function _define_data_iter_creator(hdr :: MX_handle) end defun = quote + @doc $f_desc -> function $iter_name(; kwargs...) arg_keys = String[string(k) for (k,v) in kwargs] arg_vals = String[dump_mx_param(v) for (k,v) in kwargs] @@ -589,7 +590,6 @@ function _define_data_iter_creator(hdr :: MX_handle) end $(isprovider ? :(const $alias_name = $iter_name) : :()) - @doc $f_desc $iter_name end defun end diff --git a/src/ndarray.jl b/src/ndarray.jl index fb06ca2a9573..6cccacd35bd8 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1047,7 +1047,6 @@ function _get_function_expressions(handle :: MX_handle, name) func_head = Expr(:call, name, args...) func_def = Expr(:function, func_head, func_body) - exprs = Expr[func_def] if accept_empty_mutate args0 = args[1:n_used_vars+n_scalars] @@ -1058,9 +1057,10 @@ function _get_function_expressions(handle :: MX_handle, name) func_head0 = Expr(:call, name, args0...) 
func_def0 = Expr(:function, func_head0, func_body0) - push!(exprs, func_def0) + return func_def, func_def0 + else + return func_def, :() end - return exprs end macro _import_ndarray_functions() @@ -1071,19 +1071,13 @@ macro _import_ndarray_functions() handle = funcs[i] name, desc = _get_function_description(handle) - exprs = _get_function_expressions(handle, name) + func_def, func_def0 = _get_function_expressions(handle, name) - # TODO(vchuravy): Fix this in a more elegant way once we only support - # v0.5 - if isdefined(Base, name) || isdefined(name) - expr = quote - $(exprs...) - end - else - expr = quote - $(exprs...) - @doc $desc $name - end + expr = quote + $(isdefined(Base, name) ? :(import Base.$name) : :()) + @doc $desc -> + $func_def + $func_def0 end push!(func_exprs, expr) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 48ec27833ad6..5c1b123b0b7e 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -703,14 +703,9 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) end func_def = Expr(:function, func_head, Expr(:block, func_body)) - # TODO(vchuravy) find a more elegant solution fro v0.5 - if isdefined(Base, func_name) || isdefined(func_name) - return func_def - else - return quote - $func_def - @doc $f_desc $func_name - end + return quote + @doc $f_desc -> + $func_def end end From f0b758b62cadf48e6d7d836b765960c6e03a8899 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 2 Sep 2016 02:57:51 +0900 Subject: [PATCH 389/630] move call docs into type docs --- src/symbolic-node.jl | 15 ++++++--------- 1 file changed, 6 insertions(+), 9 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 5c1b123b0b7e..13675450232a 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -2,6 +2,12 @@ SymbolicNode SymbolicNode is the basic building block of the symbolic graph in MXNet.jl. + + (self :: SymbolicNode)(args :: SymbolicNode...) + (self :: SymbolicNode)(; kwargs...) 
+ +Make a new node by composing `self` with `args`. Or the arguments +can be specified using keyword arguments. """ type SymbolicNode handle :: MX_SymbolHandle @@ -32,15 +38,6 @@ function Base.copy(self :: SymbolicNode) Base.deepcopy(self) end -# TODO(vchuravy) How to add documentation to the v0.5 style call overloading -@doc """ - call(self :: SymbolicNode, args :: SymbolicNode...) - call(self :: SymbolicNode; kwargs...) - -Make a new node by composing `self` with `args`. Or the arguments -can be specified using keyword arguments. -""" SymbolicNode - @compat function (self::SymbolicNode)(args :: SymbolicNode...) s = deepcopy(self) _compose!(s, args...) From 1ba38965f2780dad6659dcac74a7654bdf77cf3a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 1 Sep 2016 11:50:48 -0700 Subject: [PATCH 390/630] update default dataset URL (fix test failing of #123) --- src/util.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/util.jl b/src/util.jl index 544962e4f161..10d42b25a37c 100644 --- a/src/util.jl +++ b/src/util.jl @@ -18,7 +18,7 @@ function get_mnist_ubyte() filenames = Dict([k => joinpath(mnist_dir, v) for (k,v) in filenames]) if !all(isfile, values(filenames)) cd(mnist_dir) do - mnist_dir = download("http://webdocs.cs.ualberta.ca/~bx3/data/mnist.zip", "mnist.zip") + mnist_dir = download("http://data.dmlc.ml/mxnet/data/mnist.zip", "mnist.zip") try run(`unzip -u $mnist_dir`) catch @@ -41,7 +41,7 @@ function get_cifar10() filenames = Dict([k => joinpath(cifar10_dir, v) for (k,v) in filenames]) if !all(isfile, values(filenames)) cd(cifar10_dir) do - run(`wget http://webdocs.cs.ualberta.ca/~bx3/data/cifar10.zip`) + run(`http://data.dmlc.ml/mxnet/data/cifar10.zip`) try run(`unzip -u cifar10.zip`) catch From 6840119fb6440c4e6ab3bfbecc131795c8a82557 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 25 Aug 2016 04:28:49 +0900 Subject: [PATCH 391/630] handle kwargs for ndarray functions --- src/ndarray.jl | 40 
++++++++++++++++++++++------------------ test/unittest/ndarray.jl | 11 +++++++++++ 2 files changed, 33 insertions(+), 18 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 6cccacd35bd8..fb203cd91635 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -885,17 +885,17 @@ with corresponding support (see `load`). * `filename::String`: path to the binary file to write to. * `data`: data to save to file. Data can be a`NDArray`, a `Vector{NDArray}`, or a `Dict{Base.Symbol, NDArray}`. """ -function save(filename::AbstractString, data::NDArray) +function save(filename::String, data::NDArray) save(filename, [data]) end -function save(filename::AbstractString, data::Vector{NDArray}) +function save(filename::String, data::Vector{NDArray}) @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), filename, length(data), MX_handle[data...], char_pp(0)) end -function save(filename::AbstractString, data::Dict{Base.Symbol,NDArray}) +function save(filename::String, data::Dict{Base.Symbol,NDArray}) names = [k for k in keys(data)] arrays = MX_handle[data[k] for k in names] - names = AbstractString[string(k) for k in names] + names = String[string(k) for k in names] @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), filename, length(names), arrays, names) @@ -904,10 +904,12 @@ end ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ -function _invoke_mxfunction(func_handle::MX_handle, use_vars, scalars, mut_vars) - @mxcall(:MXFuncInvoke, - (MX_handle, Ptr{MX_handle}, Ptr{MX_float}, Ptr{MX_handle}), - func_handle, use_vars, scalars, mut_vars) +function _invoke_mxfunction(func_handle::MX_handle, use_vars, scalars, mut_vars; kwargs...) 
+ names = String[string(entry[1]) for entry in kwargs] + args = String[string(entry[2]) for entry in kwargs] + @mxcall(:MXFuncInvokeEx, + (MX_handle, Ptr{MX_handle}, Ptr{MX_float}, Ptr{MX_handle}, Cint, char_pp, char_pp), + func_handle, use_vars, scalars, mut_vars, length(names), names, args) end @enum(LIBMX_FUNC_TYPE_MASK, @@ -1035,7 +1037,7 @@ function _get_function_expressions(handle :: MX_handle, name) end stmt_call = quote local handle = _get_function($(QuoteNode(name))) - _invoke_mxfunction(handle, $_use_vars, $_scalars, $_mut_vars) + _invoke_mxfunction(handle, $_use_vars, $_scalars, $_mut_vars; kwargs...) end if n_mutate_vars == 1 stmt_ret = :(return out1) @@ -1043,20 +1045,22 @@ function _get_function_expressions(handle :: MX_handle, name) stmt_ret = Expr(:return, Expr(:tuple, [Symbol("out$i") for i=1:n_mutate_vars]...)) end - func_body = Expr(:block, stmt_call, stmt_ret) - func_head = Expr(:call, name, args...) - - func_def = Expr(:function, func_head, func_body) + func_def = quote + function $name($(args...); kwargs...) + $stmt_call + $stmt_ret + end + end if accept_empty_mutate args0 = args[1:n_used_vars+n_scalars] - func_head0 = Expr(:call, name, args0...) _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] - stmt_call0 = Expr(:call, name, args0..., _mut_vars0...) - func_body0 = Expr(:block, stmt_call0) - func_head0 = Expr(:call, name, args0...) - func_def0 = Expr(:function, func_head0, func_body0) + func_def0 = quote + function $name($(args0...); kwargs...) + $name($(args0...), $(_mut_vars0...); kwargs...) 
+ end + end return func_def, func_def0 else return func_def, :() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index f76d8cd95b59..83b0578bb91f 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -298,6 +298,16 @@ function test_eltype() end end +function test_kwargs() + info("NDArray::kwargs") + dims1 = (2,3,4) + + x = mx.empty(dims1) + tx = mx.transpose(x, axes=(1,0,2)) + # @test size(tx) == (3,2,4) + @test size(tx) == (2,4,3) +end + ################################################################################ # Run tests ################################################################################ @@ -315,5 +325,6 @@ test_sqrt() test_eltype() test_nd_as_jl() test_dot() +test_kwargs() end From e0b76682a9f5a676935d905c50bfcec75fcda9d8 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 2 Sep 2016 02:28:04 +0900 Subject: [PATCH 392/630] special case transpose --- src/ndarray.jl | 10 ++++++++++ test/unittest/ndarray.jl | 10 ++++++---- 2 files changed, 16 insertions(+), 4 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index fb203cd91635..c3288dc323eb 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1035,6 +1035,15 @@ function _get_function_expressions(handle :: MX_handle, name) if name == :dot _use_vars.args[2:end] = flipdim(_use_vars.args[2:end], 1) end + + if name == :transpose + transform = quote + kwargs = Any[key != :axes ? (key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] + end + else + transform = :() + end + stmt_call = quote local handle = _get_function($(QuoteNode(name))) _invoke_mxfunction(handle, $_use_vars, $_scalars, $_mut_vars; kwargs...) @@ -1047,6 +1056,7 @@ function _get_function_expressions(handle :: MX_handle, name) func_def = quote function $name($(args...); kwargs...) 
+ $transform $stmt_call $stmt_ret end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 83b0578bb91f..8d5a1b0d57a9 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -302,10 +302,12 @@ function test_kwargs() info("NDArray::kwargs") dims1 = (2,3,4) - x = mx.empty(dims1) - tx = mx.transpose(x, axes=(1,0,2)) - # @test size(tx) == (3,2,4) - @test size(tx) == (2,4,3) + A = rand(Float32, dims1) + x = mx.NDArray(A) + tx = mx.transpose(x, axes=(2,1,3)) + tA = permutedims(A, [2,1,3]) + @test size(tx) == size(tA) + @test all(copy(tx) .== tA) end ################################################################################ From f5e80af08039bb410b69fbbe1899586e70810510 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 2 Sep 2016 05:34:43 +0900 Subject: [PATCH 393/630] add special casing of transpose to the symbolic layer --- src/symbolic-node.jl | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 13675450232a..bbaf16c47001 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -630,6 +630,11 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) name = "" end + if $func_name == :transpose + kwargs = Any[key != :axes ? 
(key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] + end + + param_keys = String[] param_vals = String[] symbol_kws = Dict{Symbol, SymbolicNode}() From ae1d45b4566114c1f271c07fdc36e5f3bd4824eb Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 6 Sep 2016 11:47:36 -0400 Subject: [PATCH 394/630] preparing for v0.0.9 --- NEWS.md | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/NEWS.md b/NEWS.md index f11136c8cd46..03ede8371798 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,10 @@ +# v0.0.9 (2016.09.06) + +* Migrated documentation system to `Documenter.jl` (@vchuravy) +* Simplified building by using Julia's OpenBlas (@staticfloat) +* Freezing parameters (@vchuravy) +* Support `DType` for `NDArray` (@vchuravy) + # v0.0.8 (2016.02.08) * Fix compatability with Julia v0.5. From 9e3a60a56120fa75ad0291ea0cbf81af146c7fc4 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 6 Sep 2016 19:55:05 +0200 Subject: [PATCH 395/630] Positional arguments in symbolic API need type restriction. 
(#134) * fix positional arguments can only be SymbolicNodes * fix missing signature of Symbolic function in docs --- src/symbolic-node.jl | 18 +++++++----------- test/unittest/symbolic-node.jl | 7 +++++++ 2 files changed, 14 insertions(+), 11 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index bbaf16c47001..15ae1d7d0e2d 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -610,7 +610,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) signature = _format_signature(Int(ref_nargs[]), ref_arg_names) f_desc = " " * func_name_s * "(" * signature * ")\n\n" - f_desc = unsafe_wrap(String, ref_desc[]) * "\n\n" + f_desc *= unsafe_wrap(String, ref_desc[]) * "\n\n" if !isempty(kv_nargs_s) f_desc *= "This function support variable length positional `SymbolicNode` inputs.\n\n" end @@ -620,9 +620,9 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) f_desc *= "* `attrs::Dict{Symbol, AbstractString}`: The attributes associated with this `SymbolicNode`.\n\n" f_desc *= "Returns `$(_format_typestring(unsafe_wrap(String, ref_ret_type[])))`." - # function $func_name(args...; kwargs...) - func_head = Expr(:call, func_name, Expr(:parameters, Expr(:..., :kwargs)), Expr(:..., :args)) - func_body = quote + func_def = quote + @doc $f_desc -> + function $func_name(args::SymbolicNode...; kwargs...) 
idx = findfirst(x -> x[1] == :name, kwargs) if idx > 0 name = kwargs[idx][2] @@ -702,13 +702,9 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) end return node - end - - func_def = Expr(:function, func_head, Expr(:block, func_body)) - return quote - @doc $f_desc -> - $func_def - end + end # function + end # quote + return func_def end function _get_atomic_symbol_creators() diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 825602723151..388a74fe644b 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -106,6 +106,12 @@ function test_attrs() @test_throws MethodError mx.Convolution(data=data2, kernel = (1,1), num_filter = 1, attrs = Dict(:test => "1.0", :test2 => 1.0)) end +function test_functions() + info("SymbolicNode::Functions") + data = mx.Variable(:data) + typeof(mx.sum(data)) == mx.SymbolicNode +end + ################################################################################ # Run tests ################################################################################ @@ -116,5 +122,6 @@ test_infer_shape() test_infer_shape_error() test_saveload() test_attrs() +test_functions() end From 8949dbb5f63fcbc2b97ffcfc6460c270db49c3f6 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 6 Sep 2016 19:59:18 +0200 Subject: [PATCH 396/630] remove mistaken + in REQUIRE (#135) --- REQUIRE | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/REQUIRE b/REQUIRE index 6fbfb73bd328..38ef82563fc3 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,4 +1,4 @@ -julia 0.4+ +julia 0.4 Compat 0.8.4 Formatting BinDeps From f06d9943f51fdb77b8c2841aa70258eb4dbf7f30 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 6 Sep 2016 23:22:48 -0400 Subject: [PATCH 397/630] fix special handling of dot for SymbolicNode (#123) --- src/ndarray.jl | 3 +++ src/symbolic-node.jl | 12 ++++++++++-- test/unittest/symbolic-node.jl | 17 ++++++++++++++++- 3 files changed, 29 insertions(+), 3 deletions(-) diff --git 
a/src/ndarray.jl b/src/ndarray.jl index c3288dc323eb..2e2c806552f7 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1036,6 +1036,9 @@ function _get_function_expressions(handle :: MX_handle, name) _use_vars.args[2:end] = flipdim(_use_vars.args[2:end], 1) end + # XXX: hacky way of solving the semantic difference of the axes parameter in Julia + # and in libmxnet. + # See https://github.com/dmlc/MXNet.jl/pull/123 if name == :transpose transform = quote kwargs = Any[key != :axes ? (key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 15ae1d7d0e2d..dfc54c3c3b1c 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -629,12 +629,20 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) else name = "" end + + # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped + # See https://github.com/dmlc/MXNet.jl/issues/55 + if $func_name_s == "dot" + args = reverse(args) + end - if $func_name == :transpose + # XXX: hacky way of solving the semantic difference of the axes parameter in Julia + # and in libmxnet. + # See https://github.com/dmlc/MXNet.jl/pull/123 + if $func_name_s == "transpose" kwargs = Any[key != :axes ? 
(key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] end - param_keys = String[] param_vals = String[] symbol_kws = Dict{Symbol, SymbolicNode}() diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 388a74fe644b..d78b0775a983 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -2,7 +2,7 @@ module TestSymbolicNode using MXNet using Base.Test -using ..Main: mlp2 +using ..Main: mlp2, reldiff ################################################################################ # Test Implementations @@ -112,6 +112,20 @@ function test_functions() typeof(mx.sum(data)) == mx.SymbolicNode end +function test_dot() + info("SymbolicNode::dot") + x = mx.Variable(:x) + y = mx.Variable(:y) + z = mx.dot(x, y) + z_exec = mx.bind(z, context=mx.cpu(), + args=Dict(:x=>mx.ones((100, 2)), :y=>mx.ones((2, 200)))) + mx.forward(z_exec) + + ret = copy(z_exec.outputs[1]) + @test size(ret) == (100, 200) + @test reldiff(ret, 2*ones(100, 200)) < 1e-6 +end + ################################################################################ # Run tests ################################################################################ @@ -123,5 +137,6 @@ test_infer_shape_error() test_saveload() test_attrs() test_functions() +test_dot() end From 6e2c1aecf098ee00c9a1cfe495650c1f0d9674b2 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 6 Sep 2016 23:44:05 -0400 Subject: [PATCH 398/630] add readme for developers --- README-DEV.md | 10 ++++++++++ deps/build.jl | 2 ++ 2 files changed, 12 insertions(+) create mode 100644 README-DEV.md diff --git a/README-DEV.md b/README-DEV.md new file mode 100644 index 000000000000..e4dc3fd45c29 --- /dev/null +++ b/README-DEV.md @@ -0,0 +1,10 @@ +# Workflow for making a release + +1. Update `NEWS.md` to list important changes +2. Check out the `stable` branch, rebase with `master`. +3. Update `libmxnet_curr_ver` in `deps/build.jl` to the latest commit SHA (or any proper reference). 
Using `master` here is not good because future changes in libmxnet might break existing Julia packages. +4. Run tests. +5. Commit changes and push. +6. Run `Pkg.tag("MXNet")` in Julia. +7. Run `Pkg.publish()`, which will open a browser for making a pull request to METADATA.jl. +8. Edit the [releases page](https://github.com/dmlc/MXNet.jl/releases) to copy the release notes from `NEWS.md` to the newly created release tag. diff --git a/deps/build.jl b/deps/build.jl index 1736bf9eb0a2..22f06e7acf36 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -3,6 +3,7 @@ using Compat # First try to detect and load existing libmxnet ################################################################################ libmxnet_detected = false +libmxnet_curr_ver = "master" if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") @@ -58,6 +59,7 @@ if !libmxnet_detected ChangeDirectory(_srcdir) `rm -rf mxnet` `git clone --recursive https://github.com/dmlc/mxnet` + `git checkout $libmxnet_curr_ver` FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin ChangeDirectory("$_mxdir") `cp make/config.mk config.mk` From ebdafe814bfe7f277b256470aafdeed3044f64a5 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 6 Sep 2016 23:44:57 -0400 Subject: [PATCH 399/630] update libmxnet SHA --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 22f06e7acf36..cc7fb6e563c3 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -3,7 +3,7 @@ using Compat # First try to detect and load existing libmxnet ################################################################################ libmxnet_detected = false -libmxnet_curr_ver = "master" +libmxnet_curr_ver = "7a90e598623314b5f7adc1184e4012f6c6160ff6" if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") From 545332d3c66545653c525e3982b0f80f34a6409f Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 6 Sep 2016 
23:45:38 -0400 Subject: [PATCH 400/630] keep the master branch to track libmxnet master --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index cc7fb6e563c3..22f06e7acf36 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -3,7 +3,7 @@ using Compat # First try to detect and load existing libmxnet ################################################################################ libmxnet_detected = false -libmxnet_curr_ver = "7a90e598623314b5f7adc1184e4012f6c6160ff6" +libmxnet_curr_ver = "master" if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") From 39bc643ee5c54e243c45a5837b408f8ed4f9aa84 Mon Sep 17 00:00:00 2001 From: pluskid Date: Wed, 7 Sep 2016 00:11:48 -0400 Subject: [PATCH 401/630] make is_windows compatible with Julia v0.4 --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 22f06e7acf36..ebce44a22ec7 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -23,7 +23,7 @@ if !libmxnet_detected ################################################################################ # If not found, try to build automatically using BinDeps ################################################################################ - if is_windows() + if @compat(is_windows()) info("Please follow the libmxnet documentation on how to build manually") info("or to install pre-build packages:") info("http://mxnet.readthedocs.io/en/latest/how_to/build.html#building-on-windows") From ba2c9995c87c752fd8ebe495fff7dbeb9488a889 Mon Sep 17 00:00:00 2001 From: pluskid Date: Wed, 7 Sep 2016 00:20:29 -0400 Subject: [PATCH 402/630] fix build script --- deps/build.jl | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index ebce44a22ec7..c073bdf6b1c8 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -59,9 +59,12 @@ if !libmxnet_detected ChangeDirectory(_srcdir) `rm -rf mxnet` `git clone 
--recursive https://github.com/dmlc/mxnet` - `git checkout $libmxnet_curr_ver` + @build_steps begin + ChangeDirectory(joinpath(_srcdir, "mxnet")) + `git checkout $libmxnet_curr_ver` + end FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin - ChangeDirectory("$_mxdir") + ChangeDirectory(_mxdir) `cp make/config.mk config.mk` if is_apple() `cp make/osx.mk config.mk` From 8f4396116ac8e245f4773d50e3323fdd234c1249 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Sep 2016 00:24:32 -0400 Subject: [PATCH 403/630] prepare for v0.1.0 --- NEWS.md | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/NEWS.md b/NEWS.md index 03ede8371798..4423c42d6724 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,7 @@ +# v0.1.0 (2016.09.07) + +* Track specific libmxnet version for each release. + # v0.0.9 (2016.09.06) * Migrated documentation system to `Documenter.jl` (@vchuravy) From 86362f353ebebe38452dd96853816f7b0b8af79c Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Sep 2016 00:25:37 -0400 Subject: [PATCH 404/630] update workflow for creating release --- README-DEV.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README-DEV.md b/README-DEV.md index e4dc3fd45c29..b148fde3d5c7 100644 --- a/README-DEV.md +++ b/README-DEV.md @@ -1,7 +1,7 @@ # Workflow for making a release 1. Update `NEWS.md` to list important changes -2. Check out the `stable` branch, rebase with `master`. +2. Check out the `stable` branch, merge with `master`. 3. Update `libmxnet_curr_ver` in `deps/build.jl` to the latest commit SHA (or any proper reference). Using `master` here is not good because future changes in libmxnet might break existing Julia packages. 4. Run tests. 5. Commit changes and push. 
From 1a0b440bef9fe791ffa35abb6bbfe58cccba85c8 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 7 Sep 2016 18:56:11 +0200 Subject: [PATCH 405/630] Make build.jl aware of other blas vendors besides OpenBLAS (#137) * be a bit more lenient about which blas versions we support * also set dependencies to the correct version * Fail if blas_vendor == :unknown --- deps/build.jl | 13 +++++++++++-- 1 file changed, 11 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index c073bdf6b1c8..3efddefa8061 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -30,7 +30,7 @@ if !libmxnet_detected error("Automatic building libxmnet on Windows is currently not supported yet.") end - openblas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) + blas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) if VERSION >= v"0.5.0-dev+4338" blas_vendor = Base.BLAS.vendor() @@ -43,6 +43,14 @@ if !libmxnet_detected ilp64 = "-DINTERFACE64" end + if blas_vendor == :unknown + error("Julia is build with an unkown blas library ($blas_path).\n Automatic building of libmxnet is not yet supported.") + elseif blas_vendor != :openblas64 || blas_vendor != :openblas + warn("Unsure if we can build against $blas_vendor.") + end + + blas_name = blas_vendor == :openblas64 ? 
"openblas" : string(blas_vendor) + #-------------------------------------------------------------------------------- # Build libmxnet mxnet = library_dependency("mxnet", aliases=["libmxnet", "libmxnet.so"]) @@ -62,6 +70,7 @@ if !libmxnet_detected @build_steps begin ChangeDirectory(joinpath(_srcdir, "mxnet")) `git checkout $libmxnet_curr_ver` + `git submodule update` end FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin ChangeDirectory(_mxdir) @@ -72,7 +81,7 @@ if !libmxnet_detected `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` `cp ../../cblas.h include/cblas.h` - `make USE_BLAS=openblas MSHADOW_LDFLAGS="$openblas_path"` + `make USE_BLAS=$blas_name MSHADOW_LDFLAGS="$blas_path"` `cp lib/libmxnet.so $_libdir` end) end From d4278ca5515c6c89d27fc40350c6adf683caf08d Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Sep 2016 13:13:03 -0400 Subject: [PATCH 406/630] remove unnecessary @compat call --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 3efddefa8061..66b08165cfa4 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -23,7 +23,7 @@ if !libmxnet_detected ################################################################################ # If not found, try to build automatically using BinDeps ################################################################################ - if @compat(is_windows()) + if is_windows() info("Please follow the libmxnet documentation on how to build manually") info("or to install pre-build packages:") info("http://mxnet.readthedocs.io/en/latest/how_to/build.html#building-on-windows") From 1ff097550557e8e560a5be58f2e36920d2f68e56 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Sep 2016 13:33:53 -0400 Subject: [PATCH 407/630] replace pipe with pipeline --- src/util.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/util.jl 
b/src/util.jl index 10d42b25a37c..a53647790c06 100644 --- a/src/util.jl +++ b/src/util.jl @@ -46,7 +46,7 @@ function get_cifar10() run(`unzip -u cifar10.zip`) catch try - run(pipe(`7z x cifar10.zip`,stdout=DevNull)) + run(pipeline(`7z x cifar10.zip`, stdout=DevNull)) catch error("Extraction Failed:No extraction program found in path") end From 37e715ab14bd0a3a919277843bd8e8d33d4bb9f5 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 7 Sep 2016 14:12:49 -0400 Subject: [PATCH 408/630] fix build script --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 66b08165cfa4..b65c3d89632b 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -45,7 +45,7 @@ if !libmxnet_detected if blas_vendor == :unknown error("Julia is build with an unkown blas library ($blas_path).\n Automatic building of libmxnet is not yet supported.") - elseif blas_vendor != :openblas64 || blas_vendor != :openblas + elseif blas_vendor != :openblas64 && blas_vendor != :openblas warn("Unsure if we can build against $blas_vendor.") end From 9798c974b3365e543a4184a0b8f71174410121e4 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 8 Sep 2016 07:36:46 +0900 Subject: [PATCH 409/630] improve buildscript --- deps/build.jl | 51 ++++++++++++++++++++++++++++++++++++--------------- 1 file changed, 36 insertions(+), 15 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index b65c3d89632b..d69ac93a2c3b 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -44,19 +44,25 @@ if !libmxnet_detected end if blas_vendor == :unknown - error("Julia is build with an unkown blas library ($blas_path).\n Automatic building of libmxnet is not yet supported.") - elseif blas_vendor != :openblas64 && blas_vendor != :openblas - warn("Unsure if we can build against $blas_vendor.") + info("Julia is build with an unkown blas library ($blas_path).") + info("Attempting build without reusing the blas library") + USE_JULIA_BLAS = false + elseif !(blas_vendor in 
(:openblas, :openblas64)) + info("Unsure if we can build against $blas_vendor.") + info("Attempting build anyway.") + USE_JULIA_BLAS = true + else + USE_JULIA_BLAS = true end blas_name = blas_vendor == :openblas64 ? "openblas" : string(blas_vendor) #-------------------------------------------------------------------------------- # Build libmxnet - mxnet = library_dependency("mxnet", aliases=["libmxnet", "libmxnet.so"]) + mxnet = library_dependency("mxnet", aliases=["mxnet", "libmxnet", "libmxnet.so"]) _prefix = joinpath(BinDeps.depsdir(mxnet), "usr") - _srcdir = joinpath(BinDeps.depsdir(mxnet),"src") + _srcdir = joinpath(BinDeps.depsdir(mxnet), "src") _mxdir = joinpath(_srcdir, "mxnet") _libdir = joinpath(_prefix, "lib") provides(BuildProcess, @@ -64,28 +70,43 @@ if !libmxnet_detected CreateDirectory(_srcdir) CreateDirectory(_libdir) @build_steps begin - ChangeDirectory(_srcdir) - `rm -rf mxnet` - `git clone --recursive https://github.com/dmlc/mxnet` + BinDeps.DirectoryRule(_mxdir, @build_steps begin + ChangeDirectory(_srcdir) + `git clone --recursive https://github.com/dmlc/mxnet` + end) @build_steps begin - ChangeDirectory(joinpath(_srcdir, "mxnet")) + ChangeDirectory(_mxdir) + `git fetch` `git checkout $libmxnet_curr_ver` `git submodule update` end - FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin + FileRule(joinpath(_mxdir, "config.mk"), @build_steps begin ChangeDirectory(_mxdir) - `cp make/config.mk config.mk` if is_apple() `cp make/osx.mk config.mk` + else + `cp make/config.mk config.mk` end `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` - `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` + end) + @build_steps begin + ChangeDirectory(_mxdir) `cp ../../cblas.h include/cblas.h` - `make USE_BLAS=$blas_name MSHADOW_LDFLAGS="$blas_path"` - `cp lib/libmxnet.so $_libdir` + if USE_JULIA_BLAS + MakeTargets("USE_BLAS=$blas_name -j$(nprocs())", env=Dict( + "MSHADOW_LDFLAGS" => blas_path, + 
"MSHADOW_CFLAGS" => ilp64, + )) + else + `make -j$(nprocs())` + end + `rm $_libdir/libmxnet.so` + end + FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin + `cp $_mxdir/lib/libmxnet.so $_libdir/` end) end - end), mxnet) + end), mxnet, installed_libpath=_libdir) @BinDeps.install Dict(:mxnet => :mxnet) end From eb4a3fd72ff743ca43e8478baa0b1b28eef52ae8 Mon Sep 17 00:00:00 2001 From: pluskid Date: Thu, 8 Sep 2016 11:21:32 -0400 Subject: [PATCH 410/630] fix build script. --- deps/build.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index d69ac93a2c3b..d6d6f2386c48 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -44,7 +44,7 @@ if !libmxnet_detected end if blas_vendor == :unknown - info("Julia is build with an unkown blas library ($blas_path).") + info("Julia is built with an unkown blas library ($blas_path).") info("Attempting build without reusing the blas library") USE_JULIA_BLAS = false elseif !(blas_vendor in (:openblas, :openblas64)) @@ -100,7 +100,7 @@ if !libmxnet_detected else `make -j$(nprocs())` end - `rm $_libdir/libmxnet.so` + `rm -f $_libdir/libmxnet.so` end FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin `cp $_mxdir/lib/libmxnet.so $_libdir/` From 44d659ab661baccd6c3eaafa15528026ab67fab4 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 9 Sep 2016 02:00:24 +0200 Subject: [PATCH 411/630] Fixes deps/build.jl on Travis (#142) The problem is that we need to specify `MSHADOW_LDFLAGS` and `MSHADOW_CFLAGS`. The way MXNet is currently set up we can't change these from the terminal. This solves the problem by using `sed` to change `mshadow/make/mshadow.mk`. But if mshadow would change git could throw an error on updating. So we remove the changes before an update and add them afterwards again. This has the drawback that users can't modify that file. (But those users should maintain their own build and use `MXNET_HOME`.) 
This also eagerly deletes `usr/lib/libmxnet.so` so that we actually trigger a rebuild on an update of the pkg. --- deps/build.jl | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index d6d6f2386c48..b79940e8c1eb 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -56,6 +56,7 @@ if !libmxnet_detected end blas_name = blas_vendor == :openblas64 ? "openblas" : string(blas_vendor) + MSHADOW_LDFLAGS = "MSHADOW_LDFLAGS=-lm $blas_path" #-------------------------------------------------------------------------------- # Build libmxnet @@ -65,6 +66,9 @@ if !libmxnet_detected _srcdir = joinpath(BinDeps.depsdir(mxnet), "src") _mxdir = joinpath(_srcdir, "mxnet") _libdir = joinpath(_prefix, "lib") + # We have do eagerly delete the installed libmxnet.so + # Otherwise we won't rebuild on an update. + run(`rm -f $_libdir/libmxnet.so`) provides(BuildProcess, (@build_steps begin CreateDirectory(_srcdir) @@ -76,9 +80,12 @@ if !libmxnet_detected end) @build_steps begin ChangeDirectory(_mxdir) + # TODO(vchuravy). 
We have to reset mshadow/make/mshadow.mk + `git -C mshadow checkout -- make/mshadow.mk` `git fetch` `git checkout $libmxnet_curr_ver` `git submodule update` + `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` end FileRule(joinpath(_mxdir, "config.mk"), @build_steps begin ChangeDirectory(_mxdir) @@ -93,14 +100,10 @@ if !libmxnet_detected ChangeDirectory(_mxdir) `cp ../../cblas.h include/cblas.h` if USE_JULIA_BLAS - MakeTargets("USE_BLAS=$blas_name -j$(nprocs())", env=Dict( - "MSHADOW_LDFLAGS" => blas_path, - "MSHADOW_CFLAGS" => ilp64, - )) + `make -j$(nprocs()) USE_BLAS=$blas_name $MSHADOW_LDFLAGS` else `make -j$(nprocs())` end - `rm -f $_libdir/libmxnet.so` end FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin `cp $_mxdir/lib/libmxnet.so $_libdir/` From e218d85baa630ee44eeb2b047aa8d7c24870b5d7 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 8 Sep 2016 21:42:14 -0400 Subject: [PATCH 412/630] fix NEWS.md for skipped v0.0.9 --- NEWS.md | 5 +---- REQUIRE | 2 +- 2 files changed, 2 insertions(+), 5 deletions(-) diff --git a/NEWS.md b/NEWS.md index 4423c42d6724..2d0ec817ce39 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,9 +1,6 @@ -# v0.1.0 (2016.09.07) +# v0.1.0 (2016.09.08) * Track specific libmxnet version for each release. 
- -# v0.0.9 (2016.09.06) - * Migrated documentation system to `Documenter.jl` (@vchuravy) * Simplified building by using Julia's OpenBlas (@staticfloat) * Freezing parameters (@vchuravy) diff --git a/REQUIRE b/REQUIRE index 38ef82563fc3..d37f975fe665 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,5 +1,5 @@ julia 0.4 -Compat 0.8.4 +Compat 0.9.1 Formatting BinDeps JSON From 6bd3951d93999d1d58681ca56b2269bb4a7558a4 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 16 Sep 2016 03:42:17 +0900 Subject: [PATCH 413/630] try to automatically find CUDA --- deps/build.jl | 17 ++++++++++++++++- 1 file changed, 16 insertions(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index b79940e8c1eb..4a13b19c105c 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -32,6 +32,16 @@ if !libmxnet_detected blas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) + # Try to find cuda + hascuda = false + if haskey(ENV, "CUDA_HOME") + hascuda = Libdl.dlopen_e(joinpath(ENV["CUDA_HOME"], "lib64", "libcuda.so")) != C_NULL + else + cudapaths = String["/opt/cuda/lib64", "/usr/local/cuda/lib64"] + cudalib = Libdl.find_library(["libcuda", "libcuda.so"], cudapaths) + hascuda = Libdl.dlopen_e(cudalib) != C_NULL + end + if VERSION >= v"0.5.0-dev+4338" blas_vendor = Base.BLAS.vendor() else @@ -80,7 +90,6 @@ if !libmxnet_detected end) @build_steps begin ChangeDirectory(_mxdir) - # TODO(vchuravy). 
We have to reset mshadow/make/mshadow.mk `git -C mshadow checkout -- make/mshadow.mk` `git fetch` `git checkout $libmxnet_curr_ver` @@ -95,6 +104,12 @@ if !libmxnet_detected `cp make/config.mk config.mk` end `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` + if hascuda + `sed -i -s 's/USE_CUDA = 0/USE_CUDA = 1/' config.mk` + if haskey(ENV, "CUDA_HOME") + `sed -i -s 's/USE_CUDA_PATH = NULL/USE_CUDA_PATH = $(ENV["CUDA_HOME"])/' config.mk` + end + end end) @build_steps begin ChangeDirectory(_mxdir) From 7a2432c0b4851189108689caf02ac43014285ad5 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Sep 2016 13:15:13 -0400 Subject: [PATCH 414/630] ignore vscode project files --- .gitignore | 1 + 1 file changed, 1 insertion(+) diff --git a/.gitignore b/.gitignore index 3325a370ecaf..d6791c8491bf 100644 --- a/.gitignore +++ b/.gitignore @@ -10,3 +10,4 @@ deps/deps.jl docs/_build docs/build/ docs/site/ +.vscode From e6b050805ea81535232c52c4847b8478e54f318a Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Sep 2016 17:58:08 -0400 Subject: [PATCH 415/630] ndarray ops --- src/base.jl | 2 +- src/ndarray.jl | 197 ++++++++++++++----------------------------- src/symbolic-node.jl | 4 +- src/util.jl | 70 +++++++++++++++ 4 files changed, 135 insertions(+), 138 deletions(-) diff --git a/src/base.jl b/src/base.jl index cca45c273b96..a864125757cd 100644 --- a/src/base.jl +++ b/src/base.jl @@ -102,7 +102,7 @@ macro mx_define_handle_t(name, destructor) end @mx_define_handle_t(MX_NDArrayHandle, MXNDArrayFree) -@mx_define_handle_t(MX_FunctionHandle, nop) +@mx_define_handle_t(MX_OpHandle, nop) @mx_define_handle_t(MX_SymbolHandle, MXSymbolFree) @mx_define_handle_t(MX_ExecutorHandle, MXExecutorFree) @mx_define_handle_t(MX_DataIterHandle, MXDataIterFree) diff --git a/src/ndarray.jl b/src/ndarray.jl index 2e2c806552f7..c1cd7ccf16b2 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -333,7 +333,7 @@ scenarios are supported """ function setindex!(arr :: NDArray, val :: Real, 
::Colon) @assert(arr.writable) - _set_value(convert(eltype(arr), val), arr) + _set_value(out=arr, src=convert(eltype(arr), val)) return arr end function setindex!{T<:Real}(arr :: NDArray, val :: Array{T}, ::Colon) @@ -948,156 +948,83 @@ Those functions always return the output arguments. If there is only one output object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. """ -function _get_ndarray_functions() - n = Ref{MX_uint}(0) - handles = Ref{Ptr{MX_handle}}(0) - - @mxcall(:MXListFunctions, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n, handles) - - funcs = unsafe_wrap(Array, handles[], n[]) - return funcs -end - -const _function_cache = Dict{Symbol, MX_handle}() -function _get_function(name :: Symbol) - if !haskey(_function_cache, name) - handle = Ref{MX_handle}(0) - - @mxcall(:MXGetFunction, (Cstring, Ref{MX_handle}), name, handle) - _function_cache[name] = handle[] - return handle[] - else - return _function_cache[name] - end -end - -function _get_function_description(handle :: MX_handle) - # get function information (human readable) - ref_name = Ref{char_p}(0) - ref_desc = Ref{char_p}(0) - ref_narg = Ref{MX_uint}(0) - - ref_arg_names = Ref{char_pp}(0) - ref_arg_types = Ref{char_pp}(0) - ref_arg_descs = Ref{char_pp}(0) - - ref_ret_type = Ref{char_p}(0) - - @mxcall(:MXFuncGetInfo, - (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, - Ref{char_pp}, Ref{char_pp}, Ref{char_p}), - handle, ref_name, ref_desc, ref_narg, ref_arg_names, - ref_arg_types, ref_arg_descs, ref_ret_type) - - name = Symbol(unsafe_wrap(String, ref_name[])) - signature = _format_signature(Int(ref_narg[]), ref_arg_names) - desc = " " * string(name) * "(" * signature * ")\n\n" - desc *= unsafe_wrap(String, ref_desc[]) * "\n\n" - desc *= "# Arguments\n" - desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) - return name, desc -end - -function _get_function_expressions(handle :: MX_handle, name) - # get function 
specification - ref_n_use_vars = Ref{MX_uint}(0) - ref_n_scalars = Ref{MX_uint}(0) - ref_n_mut_vars = Ref{MX_uint}(0) - ref_type_mask = Ref{Cint}(0) - @mxcall(:MXFuncDescribe, - (MX_handle, Ref{MX_uint}, Ref{MX_uint}, Ref{MX_uint}, Ref{Cint}), - handle, ref_n_use_vars, ref_n_scalars, ref_n_mut_vars, ref_type_mask) - - n_used_vars = ref_n_use_vars[] - n_scalars = ref_n_scalars[] - n_mutate_vars = ref_n_mut_vars[] - type_mask = ref_type_mask[] - accept_empty_mutate = (type_mask & convert(Cint,ACCEPT_EMPTY_MUTATE_TARGET)) != 0 - arg_before_scalar = (type_mask & convert(Cint,NDARRAY_ARG_BEFORE_SCALAR)) != 0 - - # general ndarray function - if arg_before_scalar - args = vcat([Expr(:(::), Symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), Symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), Symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - else - args = vcat([Expr(:(::), Symbol("sca$i"), Real) for i=1:n_scalars], - [Expr(:(::), Symbol("in$i"), NDArray) for i=1:n_used_vars], - [Expr(:(::), Symbol("out$i"), NDArray) for i=1:n_mutate_vars]) - end - - _use_vars = Expr(:ref, :MX_handle, [Symbol("in$i") for i=1:n_used_vars]...) - _scalars = Expr(:ref, :MX_float, [Symbol("sca$i") for i=1:n_scalars]...) - _mut_vars = Expr(:ref, :MX_handle, [Symbol("out$i") for i=1:n_mutate_vars]...) - - # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped - # See https://github.com/dmlc/MXNet.jl/issues/55 - if name == :dot - _use_vars.args[2:end] = flipdim(_use_vars.args[2:end], 1) - end - - # XXX: hacky way of solving the semantic difference of the axes parameter in Julia - # and in libmxnet. - # See https://github.com/dmlc/MXNet.jl/pull/123 - if name == :transpose - transform = quote - kwargs = Any[key != :axes ? 
(key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] - end - else - transform = :() - end - - stmt_call = quote - local handle = _get_function($(QuoteNode(name))) - _invoke_mxfunction(handle, $_use_vars, $_scalars, $_mut_vars; kwargs...) - end - if n_mutate_vars == 1 - stmt_ret = :(return out1) - else - stmt_ret = Expr(:return, Expr(:tuple, [Symbol("out$i") for i=1:n_mutate_vars]...)) - end +function _get_ndarray_function_def(name :: String) + func_name = Symbol(name) func_def = quote - function $name($(args...); kwargs...) - $transform - $stmt_call - $stmt_ret - end - end + function $func_name(args::NDArray...; out=nothing, kwargs...) + if out != nothing + output_vars = out + if isa(output_vars, NDArray) + output_vars = NDArray[output_vars] + end + num_outputs = length(output_vars) + else + output_vars = NDArray[] + num_outputs = 0 + end + + # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped + # See https://github.com/dmlc/MXNet.jl/issues/55 + if $name == "dot" + args = flipdim(args, 1) + end - if accept_empty_mutate - args0 = args[1:n_used_vars+n_scalars] - _mut_vars0 = [:(NDArray(_ndarray_alloc())) for i=1:n_mutate_vars] + # XXX: hacky way of solving the semantic difference of the axes parameter in Julia + # and in libmxnet. + # See https://github.com/dmlc/MXNet.jl/pull/123 + if $name == "transpose" + kwargs = Any[key != :axes ? (key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] + end - func_def0 = quote - function $name($(args0...); kwargs...) - $name($(args0...), $(_mut_vars0...); kwargs...) 
+ output_handles = [Base.cconvert(MX_handle, x) for x in output_vars] + output_handles_pp = [Base.cconvert(Ptr{MX_handle}, output_handles)] + num_outputs_p = [convert(Cint, num_outputs)] + + kw_keys_str = String[string(x[1]) for x in kwargs] + kw_vals_str = String[string(x[2]) for x in kwargs] + + args = collect(args) # tuple to list + op_handle = _get_cached_libmx_op_handle($(QuoteNode(name))) + @mxcall(:MXImperativeInvoke, + (MX_handle, Cint, Ptr{MX_handle}, + Ptr{Cint}, Ptr{Ptr{MX_handle}}, + Cint, char_pp, char_pp), + op_handle, length(args), args, + num_outputs_p, output_handles_pp, + length(kwargs), kw_keys_str, kw_vals_str) + + if out == nothing + handle_array = unsafe_wrap(Array, output_handles_pp[], num_outputs_p[]) + arrays = [NDArray(hdr) for hdr in handle_array] + if mx_num_outputs == 1 + return arrays[1] + else + return arrays + end + else + return out end end - return func_def, func_def0 - else - return func_def, :() end + + return func_def end macro _import_ndarray_functions() - funcs = _get_ndarray_functions() - func_exprs = Expr[] + names = _get_libmx_op_names() + func_exprs = map(names) do name + op_handle = _get_libmx_op_handle(name) - for i = 1:length(funcs) - handle = funcs[i] - - name, desc = _get_function_description(handle) - func_def, func_def0 = _get_function_expressions(handle, name) + desc, key_narg = _get_libmx_op_description(name, op_handle) + func_def = _get_ndarray_function_def(name) + func_name = Symbol(name) expr = quote - $(isdefined(Base, name) ? :(import Base.$name) : :()) + $(isdefined(Base, func_name) ? 
:(import Base.$func_name) : :()) @doc $desc -> $func_def - $func_def0 end - - push!(func_exprs, expr) end esc(quote diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index dfc54c3c3b1c..c1e6f7d8e8c6 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -629,7 +629,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) else name = "" end - + # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped # See https://github.com/dmlc/MXNet.jl/issues/55 if $func_name_s == "dot" @@ -755,7 +755,7 @@ macro _import_atomic_symbol_creators() end) end -@_import_atomic_symbol_creators() +#@_import_atomic_symbol_creators() ################################################################################ # Utility macros to chain up symbols diff --git a/src/util.jl b/src/util.jl index a53647790c06..11d12e7f9dd2 100644 --- a/src/util.jl +++ b/src/util.jl @@ -62,6 +62,76 @@ end ################################################################################ # Internal Utilities ################################################################################ +function _get_libmx_op_names() + n = Ref{MX_uint}(0) + names = Ref{char_pp}(0) + + @mxcall(:MXListAllOpNames, (Ref{MX_uint}, Ref{char_pp}), n, names) + + names = unsafe_wrap(Array, names[], n[]) + return [unsafe_string(x) for x in names] +end +function _get_libmx_op_handle(name :: String) + handle = Ref{MX_handle}(0) + @mxcall(:NNGetOpHandle, (char_p, Ref{MX_handle}), name, handle) + return MX_OpHandle(handle[]) +end + +# We keep a cache and retrieve the address everytime +# we run Julia, instead of pre-compiling with macro, +# because the actual handle might change in different +# runs +const _libmx_op_cache = Dict{String, MX_OpHandle}() +function _get_cached_libmx_op_handle(name :: String) + if !haskey(_libmx_op_cache, name) + handle = _get_libmx_op_handle(name) + _libmx_op_cache[name] = handle + return handle + else + return _libmx_op_cache[name] + end +end + +function 
_get_libmx_op_description(name :: String, handle :: MX_OpHandle) + # get operator information (human readable) + ref_real_name = Ref{char_p}(0) + ref_desc = Ref{char_p}(0) + ref_narg = Ref{MX_uint}(0) + + ref_arg_names = Ref{char_pp}(0) + ref_arg_types = Ref{char_pp}(0) + ref_arg_descs = Ref{char_pp}(0) + + ref_key_narg = Ref{char_p}(0) + ref_ret_type = Ref{char_p}(0) + + @mxcall(:MXSymbolGetAtomicSymbolInfo, + (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, + Ref{char_pp}, Ref{char_pp}, Ref{char_p}, Ref{char_p}), + handle, ref_real_name, ref_desc, ref_narg, ref_arg_names, + ref_arg_types, ref_arg_descs, ref_key_narg, ref_ret_type) + + real_name = unsafe_string(ref_real_name[]) + signature = _format_signature(Int(ref_narg[]), ref_arg_names) + desc = " " * name * "(" * signature * ")\n\n" + if real_name != name + desc *= name * " is an alias of " * real_name * ".\n\n" + end + + key_narg = unsafe_string(ref_key_narg[]) + if key_narg != "" + desc *= "**Note**: " * name * " takes variable number of positional inputs. 
" + desc *= "So instead of calling as $name([x, y, z], $key_narg=3), " + desc *= "one should call via $name(x, y, z), and $key_narg will be " + desc *= "determined automatically.\n\n" + end + + desc *= unsafe_string(ref_desc[]) * "\n\n" + desc *= "# Arguments\n" + desc *= _format_docstring(Int(ref_narg[]), ref_arg_names, ref_arg_types, ref_arg_descs) + return desc, key_narg +end + function _format_typestring(typestr :: String) replace(typestr, r"\bSymbol\b", "SymbolicNode") end From d16b654b8dc350355bdc794383beac43de35de66 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Sep 2016 20:16:51 -0400 Subject: [PATCH 416/630] ndarray op test --- src/ndarray.jl | 43 ++++++++++++++++++++++++++++------------ test/unittest/ndarray.jl | 19 +++++++++--------- 2 files changed, 40 insertions(+), 22 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index c1cd7ccf16b2..6cd6762488d4 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -155,6 +155,17 @@ function empty(shape :: Int...) empty(shape) end +import Base.similar + +""" + similar(arr :: NDArray) + +Create an `NDArray` with similar shape, data type, and context with the given one. +""" +function similar(arr :: NDArray) + empty(eltype(arr), size(arr), context(arr)) +end + """ zeros(DType, shape :: Tuple, ctx :: Context) zeros(DType, shape :: Tuple) @@ -398,7 +409,7 @@ function copy!(dst :: NDArray, src :: NDArray) return end - _copyto(src, dst) + _copyto(src, out=dst) return dst end @@ -513,9 +524,9 @@ function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) @assert dst.writable for arg in args if isa(arg, Real) - _plus_scalar(dst, convert(eltype(dst), arg), dst) + _plus_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) else - _plus(dst, arg, dst) + _plus(dst, arg, out=dst) end end return dst @@ -553,9 +564,9 @@ Subtract a bunch of arguments from `dst`. Inplace updating. 
function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) - _minus_scalar(dst, convert(eltype(dst), arg), dst) + _minus_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) else - _minus(dst, arg, dst) + _minus(dst, arg, out=dst) end end @@ -586,7 +597,7 @@ function .-(arg0 :: Real, arg1 :: NDArray) end function -(arg0 :: NDArray) - _mul_scalar(arg0, -one(eltype(arg0))) + _mul_scalar(arg0, scalar=-one(eltype(arg0))) end """ @@ -598,9 +609,9 @@ Inplace updating. function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) - _mul_scalar(dst, convert(eltype(dst), arg), dst) + _mul_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) else - _mul(dst, arg, dst) + _mul(dst, arg, out=dst) end return dst end @@ -642,9 +653,9 @@ Elementwise divide a scalar or an `NDArray` of the same shape from `dst`. Inplac function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) @assert dst.writable if isa(arg, Real) - _div_scalar(dst, convert(eltype(dst), arg), dst) + _div_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) else - _div(dst, arg, dst) + _div(dst, arg, out=dst) end end @@ -964,6 +975,8 @@ function _get_ndarray_function_def(name :: String) num_outputs = 0 end + args = collect(args) # tuple to list + # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped # See https://github.com/dmlc/MXNet.jl/issues/55 if $name == "dot" @@ -978,13 +991,16 @@ function _get_ndarray_function_def(name :: String) end output_handles = [Base.cconvert(MX_handle, x) for x in output_vars] - output_handles_pp = [Base.cconvert(Ptr{MX_handle}, output_handles)] + if length(output_handles) > 0 + output_handles_pp = [Base.cconvert(Ptr{MX_handle}, output_handles)] + else + output_handles_pp = [Base.convert(Ptr{MX_handle}, 0)] + end num_outputs_p = [convert(Cint, num_outputs)] kw_keys_str = String[string(x[1]) for x in kwargs] kw_vals_str = String[string(x[2]) for x in kwargs] - 
args = collect(args) # tuple to list op_handle = _get_cached_libmx_op_handle($(QuoteNode(name))) @mxcall(:MXImperativeInvoke, (MX_handle, Cint, Ptr{MX_handle}, @@ -996,8 +1012,9 @@ function _get_ndarray_function_def(name :: String) if out == nothing handle_array = unsafe_wrap(Array, output_handles_pp[], num_outputs_p[]) + handle_array = [MX_NDArrayHandle(x) for x in handle_array] arrays = [NDArray(hdr) for hdr in handle_array] - if mx_num_outputs == 1 + if length(arrays) == 1 return arrays[1] else return arrays diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 8d5a1b0d57a9..6257a150af19 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -33,38 +33,39 @@ end function test_assign() dims = rand_dims() tensor = rand(mx.MX_float, dims) + thresh = 1e-3 info("NDArray::assign::dims = $dims") # Julia Array -> NDArray assignment array = mx.empty(size(tensor)) array[:]= tensor - @test reldiff(tensor, copy(array)) < 1e-6 + @test reldiff(tensor, copy(array)) < thresh array2 = mx.zeros(size(tensor)) - @test reldiff(zeros(size(tensor)), copy(array2)) < 1e-6 + @test reldiff(zeros(size(tensor)), copy(array2)) < thresh array3 = mx.zeros(Float16, size(tensor)) - @test reldiff(zeros(Float16, size(tensor)), copy(array2)) < 1e-6 + @test reldiff(zeros(Float16, size(tensor)), copy(array2)) < thresh # scalar -> NDArray assignment scalar = rand() array2[:] = scalar - @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < 1e-6 + @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < thresh scalar = rand(Float16) array2[:] = scalar - @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < 1e-6 + @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < thresh scalar = rand(Float64) array2[:] = scalar array3[:] = scalar - @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < 1e-6 - @test reldiff(zeros(Float16,size(tensor))+scalar, copy(array3)) < 1e-6 + @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < thresh + @test 
reldiff(zeros(Float16,size(tensor))+scalar, copy(array3)) < thresh # NDArray -> NDArray assignment array[:] = array2 - @test reldiff(zeros(size(tensor))+scalar, copy(array)) < 1e-6 + @test reldiff(zeros(size(tensor))+scalar, copy(array)) < thresh end function test_slice() @@ -235,7 +236,7 @@ function test_clip() j_array, nd_array = rand_tensors(dims) clip_up = maximum(abs(j_array)) / 2 clip_down = 0 - clipped = mx.clip(nd_array, clip_down, clip_up) + clipped = mx.clip(nd_array, a_min=clip_down, a_max=clip_up) # make sure the original array is not modified @test reldiff(copy(nd_array), j_array) < 1e-6 From 03509ae17aa86f01be9c696dd2d1b00cfba44dbd Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Wed, 21 Sep 2016 21:15:16 -0400 Subject: [PATCH 417/630] temp commit, symbolic not passing due to ambiguity --- src/base.jl | 3 +- src/ndarray.jl | 6 ++- src/symbolic-node.jl | 101 +++++++++++---------------------------- test/unittest/ndarray.jl | 2 +- 4 files changed, 34 insertions(+), 78 deletions(-) diff --git a/src/base.jl b/src/base.jl index a864125757cd..588b777177bf 100644 --- a/src/base.jl +++ b/src/base.jl @@ -29,7 +29,8 @@ else end function __init__() - _populate_symbol_creator_cache!() + # TODO: bug in nnvm, if do not call this, call get handle "_copyto" will fail + _get_libmx_op_names() _populate_iter_creator_cache!() atexit() do diff --git a/src/ndarray.jl b/src/ndarray.jl index 6cd6762488d4..e516782da3d2 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -964,6 +964,7 @@ function _get_ndarray_function_def(name :: String) func_def = quote function $func_name(args::NDArray...; out=nothing, kwargs...) 
+ println($name) if out != nothing output_vars = out if isa(output_vars, NDArray) @@ -980,7 +981,7 @@ function _get_ndarray_function_def(name :: String) # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped # See https://github.com/dmlc/MXNet.jl/issues/55 if $name == "dot" - args = flipdim(args, 1) + args = reverse(args) end # XXX: hacky way of solving the semantic difference of the axes parameter in Julia @@ -1001,7 +1002,8 @@ function _get_ndarray_function_def(name :: String) kw_keys_str = String[string(x[1]) for x in kwargs] kw_vals_str = String[string(x[2]) for x in kwargs] - op_handle = _get_cached_libmx_op_handle($(QuoteNode(name))) + #op_handle = _get_cached_libmx_op_handle($(QuoteNode(name))) + op_handle = _get_cached_libmx_op_handle($(name)) @mxcall(:MXImperativeInvoke, (MX_handle, Cint, Ptr{MX_handle}, Ptr{Cint}, Ptr{Ptr{MX_handle}}, diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index c1e6f7d8e8c6..5aedd3f6e439 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -587,39 +587,14 @@ end ################################################################################ # Atomic SymbolicNode functions dynamically imported from libmxnet ################################################################################ -function _define_atomic_symbol_creator(hdr :: MX_handle) - ref_name = Ref{char_p}(0) - ref_desc = Ref{char_p}(0) - ref_kv_nargs = Ref{char_p}(0) - ref_nargs = Ref{MX_uint}(0) - ref_arg_names = Ref{char_pp}(0) - ref_arg_types = Ref{char_pp}(0) - ref_arg_descs = Ref{char_pp}(0) - ref_ret_type = Ref{char_p}(0) - - @mxcall(:MXSymbolGetAtomicSymbolInfo, - (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, - Ref{char_pp}, Ref{char_p}, Ref{char_p}), - hdr, ref_name, ref_desc, ref_nargs, ref_arg_names, ref_arg_types, ref_arg_descs, - ref_kv_nargs, ref_ret_type) - - func_name_s = unsafe_wrap(String, ref_name[]) - func_name = Symbol(func_name_s) - kv_nargs_s = 
unsafe_wrap(String, ref_kv_nargs[]) - kv_nargs = Symbol(kv_nargs_s) - - signature = _format_signature(Int(ref_nargs[]), ref_arg_names) - f_desc = " " * func_name_s * "(" * signature * ")\n\n" - f_desc *= unsafe_wrap(String, ref_desc[]) * "\n\n" - if !isempty(kv_nargs_s) - f_desc *= "This function support variable length positional `SymbolicNode` inputs.\n\n" - end - f_desc *= "# Arguments\n" - f_desc *= _format_docstring(Int(ref_nargs[]), ref_arg_names, ref_arg_types, ref_arg_descs) +function _define_atomic_symbol_creator(name :: String) + handle = _get_libmx_op_handle(name) + f_desc, key_narg = _get_libmx_op_description(name, handle) + f_desc *= "* `name::Symbol`: The name of the `SymbolicNode`. (e.g. `:my_symbol`), optional.\n" f_desc *= "* `attrs::Dict{Symbol, AbstractString}`: The attributes associated with this `SymbolicNode`.\n\n" - f_desc *= "Returns `$(_format_typestring(unsafe_wrap(String, ref_ret_type[])))`." + func_name = Symbol(name) func_def = quote @doc $f_desc -> function $func_name(args::SymbolicNode...; kwargs...) @@ -632,14 +607,14 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped # See https://github.com/dmlc/MXNet.jl/issues/55 - if $func_name_s == "dot" + if $name == "dot" args = reverse(args) end # XXX: hacky way of solving the semantic difference of the axes parameter in Julia # and in libmxnet. # See https://github.com/dmlc/MXNet.jl/pull/123 - if $func_name_s == "transpose" + if $name == "transpose" kwargs = Any[key != :axes ? 
(key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] end @@ -648,10 +623,10 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) symbol_kws = Dict{Symbol, SymbolicNode}() attrs = Dict{Symbol, String}() - $(if kv_nargs != Symbol("") + $(if key_narg != "" quote - if !in($kv_nargs_s, param_keys) - push!(param_keys, $kv_nargs_s) + if !in(Symbol($key_narg), param_keys) + push!(param_keys, Symbol($key_narg)) push!(param_vals, string(length(args))) end end @@ -674,18 +649,18 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) end if length(args) != 0 && length(symbol_kws) != 0 - @assert(false, $func_name_s * " only accepts Symbols either as positional or keyword arguments, not both.") + @assert(false, $name * " only accepts SymbolicNode either as positional or keyword arguments, not both.") end - $(if kv_nargs != Symbol("") + $(if key_narg != "" quote if length(symbol_kws) > 0 - @assert(false, $func_name_s * " takes variable number of SymbolicNode arguments, " * + @assert(false, $name * " takes variable number of SymbolicNode arguments, " * "please pass input Symbols via positional arguments, instead of keyword arguments.") end end end) - local hdr = _get_symbol_creator($(QuoteNode(func_name))) + local hdr = _get_cached_libmx_op_handle($name) # create the SymbolicNode ref_sym_hdr = Ref{MX_handle}() @@ -695,7 +670,7 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) sym_hdr = ref_sym_hdr[] node = SymbolicNode(MX_SymbolHandle(sym_hdr)) - hint = lowercase($func_name_s) + hint = lowercase($name) name = get!(DEFAULT_NAME_MANAGER, name, hint) # set attrs @@ -715,47 +690,25 @@ function _define_atomic_symbol_creator(hdr :: MX_handle) return func_def end -function _get_atomic_symbol_creators() - n_ref = Ref{MX_uint}(0) - h_ref = Ref{Ptr{MX_handle}}(0) - @mxcall(:MXSymbolListAtomicSymbolCreators, (Ref{MX_uint}, Ref{Ptr{MX_handle}}), n_ref, h_ref) - - return unsafe_wrap(Array, h_ref[], n_ref[]) -end - -function 
_get_atomic_symbol_name(handle :: MX_handle) - name_r = Ref{char_p}(0) - @mxcall(:MXSymbolGetAtomicSymbolName, (MX_handle, Ref{char_p}), handle, name_r) - return unsafe_wrap(String, name_r[]) -end - -const _symbol_creator_cache = Dict{Symbol, MX_handle}() -function _populate_symbol_creator_cache!() - empty!(_symbol_creator_cache) - h_creators = _get_atomic_symbol_creators() - for handle in h_creators - name = Symbol(_get_atomic_symbol_name(handle)) - _symbol_creator_cache[name] = handle - end -end - -_get_symbol_creator(name :: Symbol) = _symbol_creator_cache[name] - macro _import_atomic_symbol_creators() - h_creators = _get_atomic_symbol_creators() - - exprs = Expr[] - for creator_hdr in h_creators - expr = _define_atomic_symbol_creator(creator_hdr) - push!(exprs, expr) + # XXX: those are operators defined for NDArray, we exclude them here + # because the calling convention for the type signature is not strong + # enough to disambiguate the method for NDArray and SymbolicNode + const ignored_ops = ["_set_value"] + + names = _get_libmx_op_names() + func_exprs = map(names) do name + if name ∉ ignored_ops + expr = _define_atomic_symbol_creator(name) + end end esc(quote - $(exprs...) + $(func_exprs...) 
end) end -#@_import_atomic_symbol_creators() +@_import_atomic_symbol_creators() ################################################################################ # Utility macros to chain up symbols diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 6257a150af19..abc8d646fc7a 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -314,8 +314,8 @@ end ################################################################################ # Run tests ################################################################################ -test_copy() test_assign() +test_copy() test_slice() test_plus() test_minus() From 623fbaf7e073e9bcb4791df2523715855392f337 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Thu, 22 Sep 2016 16:16:35 -0400 Subject: [PATCH 418/630] disambiguate nd op and sym op --- src/ndarray.jl | 16 +++++++++++----- src/symbolic-node.jl | 20 +++++++++++++++----- test/common.jl | 6 +++--- test/unittest/symbolic-node.jl | 21 ++++++++++----------- 4 files changed, 39 insertions(+), 24 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index e516782da3d2..f32180a95e9c 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -963,8 +963,7 @@ function _get_ndarray_function_def(name :: String) func_name = Symbol(name) func_def = quote - function $func_name(args::NDArray...; out=nothing, kwargs...) - println($name) + function $func_name(::Type{NDArray}, args::NDArray...; out=nothing, kwargs...) if out != nothing output_vars = out if isa(output_vars, NDArray) @@ -1027,7 +1026,13 @@ function _get_ndarray_function_def(name :: String) end end - return func_def + func_def2 = quote + function $func_name(args::NDArray...; out=nothing, kwargs...) + $func_name(NDArray, args...; out=out, kwargs...) 
+ end + end + + return func_def, func_def2 end macro _import_ndarray_functions() @@ -1036,13 +1041,14 @@ macro _import_ndarray_functions() op_handle = _get_libmx_op_handle(name) desc, key_narg = _get_libmx_op_description(name, op_handle) - func_def = _get_ndarray_function_def(name) + func_def, func_def2 = _get_ndarray_function_def(name) func_name = Symbol(name) expr = quote $(isdefined(Base, func_name) ? :(import Base.$func_name) : :()) - @doc $desc -> $func_def + @doc $desc -> + $func_def2 end end diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 5aedd3f6e439..1612f0c57771 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -596,8 +596,7 @@ function _define_atomic_symbol_creator(name :: String) func_name = Symbol(name) func_def = quote - @doc $f_desc -> - function $func_name(args::SymbolicNode...; kwargs...) + function $func_name(::Type{SymbolicNode}, args::SymbolicNode...; kwargs...) idx = findfirst(x -> x[1] == :name, kwargs) if idx > 0 name = kwargs[idx][2] @@ -687,7 +686,18 @@ function _define_atomic_symbol_creator(name :: String) return node end # function end # quote - return func_def + + func_def2 = quote + @doc $f_desc -> + function $func_name(args::SymbolicNode...; kwargs...) + $func_name(SymbolicNode, args...; kwargs...) 
+ end # function + end # quote + + return quote + $func_def + $func_def2 + end end macro _import_atomic_symbol_creators() @@ -696,8 +706,8 @@ macro _import_atomic_symbol_creators() # enough to disambiguate the method for NDArray and SymbolicNode const ignored_ops = ["_set_value"] - names = _get_libmx_op_names() - func_exprs = map(names) do name + op_names = _get_libmx_op_names() + func_exprs = map(op_names) do name if name ∉ ignored_ops expr = _define_atomic_symbol_creator(name) end diff --git a/test/common.jl b/test/common.jl index fc4c4f63649e..a394acf95a93 100644 --- a/test/common.jl +++ b/test/common.jl @@ -13,9 +13,9 @@ end function mlp2() data = mx.Variable(:data) - out = mx.FullyConnected(data=data, name=:fc1, num_hidden=1000) - out = mx.Activation(data=out, act_type=:relu) - out = mx.FullyConnected(data=out, name=:fc2, num_hidden=10) + out = mx.FullyConnected(data, name=:fc1, num_hidden=1000) + out = mx.Activation(out, act_type=:relu) + out = mx.FullyConnected(out, name=:fc2, num_hidden=10) return out end diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index d78b0775a983..ca2986d4a377 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -20,8 +20,8 @@ function test_internal() info("SymbolicNode::internal") data = mx.Variable(:data) - oldfc = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) - net1 = mx.FullyConnected(data=oldfc, name=:fc2, num_hidden=100) + oldfc = mx.FullyConnected(data, name=:fc1, num_hidden=10) + net1 = mx.FullyConnected(oldfc, name=:fc2, num_hidden=100) @test mx.list_arguments(net1) == [:data,:fc1_weight,:fc1_bias,:fc2_weight,:fc2_bias] @@ -34,12 +34,12 @@ function test_compose() info("SymbolicNode::compose") data = mx.Variable(:data) - net1 = mx.FullyConnected(data=data, name=:fc1, num_hidden=10) - net1 = mx.FullyConnected(data=net1, name=:fc2, num_hidden=100) + net1 = mx.FullyConnected(data, name=:fc1, num_hidden=10) + net1 = mx.FullyConnected(net1, name=:fc2, 
num_hidden=100) - net2 = mx.FullyConnected(name=:fc3, num_hidden=10) - net2 = mx.Activation(data=net2, act_type=:relu) - net2 = mx.FullyConnected(data=net2, name=:fc4, num_hidden=20) + net2 = mx.FullyConnected(mx.SymbolicNode, name=:fc3, num_hidden=10) + net2 = mx.Activation(net2, act_type=:relu) + net2 = mx.FullyConnected(net2, name=:fc4, num_hidden=20) composed = net2(fc3_data=net1, name=:composed) multi_out = mx.Group(composed, net1) @@ -96,14 +96,13 @@ function test_attrs() data2 = mx.Variable(:data2, attrs = Dict(:test => "hallo!")) @test get(mx.get_attr(data2, :test)) == "hallo!" - conv = mx.Convolution(data = data2, kernel = (1,1), num_filter = 1, attrs = Dict(:a => "a", :π => "π")) + conv = mx.Convolution(data2, kernel = (1,1), num_filter = 1, attrs = Dict(:a => "a", :π => "π")) @test isnull(mx.get_attr(conv, :b)) @test get(mx.get_attr(conv, :a)) == "a" @test get(mx.get_attr(conv, :π)) == "π" - @test mx.list_attr(conv) == Dict(:a => "a", :π => "π") @test_throws MethodError mx.Variable(:data3, attrs = Dict(:test => "1.0", :test2 => 1.0)) - @test_throws MethodError mx.Convolution(data=data2, kernel = (1,1), num_filter = 1, attrs = Dict(:test => "1.0", :test2 => 1.0)) + @test_throws MethodError mx.Convolution(data2, kernel = (1,1), num_filter = 1, attrs = Dict(:test => "1.0", :test2 => 1.0)) end function test_functions() @@ -117,7 +116,7 @@ function test_dot() x = mx.Variable(:x) y = mx.Variable(:y) z = mx.dot(x, y) - z_exec = mx.bind(z, context=mx.cpu(), + z_exec = mx.bind(z, context=mx.cpu(), args=Dict(:x=>mx.ones((100, 2)), :y=>mx.ones((2, 200)))) mx.forward(z_exec) From d718cfc81b174c69cf06d6bd02d2aa18bcf0a3f6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 23 Sep 2016 10:33:46 -0400 Subject: [PATCH 419/630] fix API changes in random --- src/random.jl | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/src/random.jl b/src/random.jl index 79a8b6e9e20b..b5b53def8f54 100644 --- a/src/random.jl +++ b/src/random.jl @@ -1,5 +1,6 @@ 
function rand!(low::Real, high::Real, out::NDArray) - _random_uniform(low, high, out) + # XXX: note we reverse shape because julia and libmx has different dim order + _sample_uniform(NDArray, low=low, high=high, shape=reverse(size(out)), out=out) end function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}) rand(low, high, shape, cpu()) @@ -10,7 +11,8 @@ function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context) end function randn!(mean::Real, stdvar::Real, out::NDArray) - _random_gaussian(mean, stdvar, out) + # XXX: note we reverse shape because julia and libmx has different dim order + _sample_normal(NDArray, loc=mean, scale=stdvar, shape=reverse(size(out)), out=out) end function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}) randn(mean, stdvar, shape, cpu()) From 590055b3f403e4d875e567594db4c0b75552a6c6 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Mon, 26 Sep 2016 15:11:33 -0400 Subject: [PATCH 420/630] change examples for new symbolic calling conventions (nnvm, #146) --- examples/char-lstm/lstm.jl | 8 ++++---- examples/cifar10/cifar10.jl | 16 ++++++++-------- examples/mnist/lenet.jl | 10 +++++----- examples/mnist/mlp.jl | 12 ++++++------ 4 files changed, 23 insertions(+), 23 deletions(-) diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index e895d8389e74..e98778b65272 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -25,9 +25,9 @@ function lstm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMPara data = mx.Dropout(data, p=dropout) end - i2h = mx.FullyConnected(data=data, weight=param.i2h_W, bias=param.i2h_b, + i2h = mx.FullyConnected(data, weight=param.i2h_W, bias=param.i2h_b, num_hidden=4num_hidden, name=symbol(name, "_i2h")) - h2h = mx.FullyConnected(data=prev_state.h, weight=param.h2h_W, bias=param.h2h_b, + h2h = mx.FullyConnected(prev_state.h, weight=param.h2h_W, bias=param.h2h_b, num_hidden=4num_hidden, name=symbol(name, "_h2h")) gates = mx.SliceChannel(i2h 
+ h2h, num_outputs=4, name=symbol(name, "_gates")) @@ -71,7 +71,7 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla for t = 1:seq_len data = mx.Variable(symbol(name, "_data_$t")) label = mx.Variable(symbol(name, "_label_$t")) - hidden = mx.FullyConnected(data=data, weight=embed_W, num_hidden=dim_embed, + hidden = mx.FullyConnected(data, weight=embed_W, num_hidden=dim_embed, no_bias=true, name=symbol(name, "_embed_$t")) # stack LSTM cells @@ -88,7 +88,7 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla if dropout > 0 hidden = mx.Dropout(hidden, p=dropout) end - pred = mx.FullyConnected(data=hidden, weight=pred_W, bias=pred_b, num_hidden=n_class, + pred = mx.FullyConnected(hidden, weight=pred_W, bias=pred_b, num_hidden=n_class, name=symbol(name, "_pred_$t")) smax = mx.SoftmaxOutput(pred, label, name=symbol(name, "_softmax_$t")) push!(outputs, smax) diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index e5ff751eca7d..165ee1934568 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -5,9 +5,9 @@ using MXNet # basic Conv + BN + ReLU factory function conv_factory(data, num_filter, kernel; stride=(1,1), pad=(0,0), act_type=:relu) - conv = mx.Convolution(data=data, num_filter=num_filter, kernel=kernel, stride=stride, pad=pad) - bn = mx.BatchNorm(data=conv) - act = mx.Activation(data=bn, act_type=act_type) + conv = mx.Convolution(data, num_filter=num_filter, kernel=kernel, stride=stride, pad=pad) + bn = mx.BatchNorm(conv) + act = mx.Activation(bn, act_type=act_type) return act end @@ -16,7 +16,7 @@ function downsample_factory(data, ch_3x3) # conv 3x3 conv = conv_factory(data, ch_3x3, (3,3), stride=(2,2), pad=(1,1)) # pool - pool = mx.Pooling(data=data, kernel=(3,3), stride=(2,2), pool_type=:max) + pool = mx.Pooling(data, kernel=(3,3), stride=(2,2), pool_type=:max) # concat concat = mx.Concat(conv, pool) return concat @@ -48,10 +48,10 @@ in4d = 
simple_factory(in4b, 48, 96) in4e = downsample_factory(in4d, 96) in5a = simple_factory(in4e, 176, 160) in5b = simple_factory(in5a, 176, 160) -pool = mx.Pooling(data=in5b, pool_type=:avg, kernel=(7,7), name=:global_pool) -flatten = mx.Flatten(data=pool, name=:flatten1) -fc = mx.FullyConnected(data=flatten, num_hidden=10, name=:fc1) -softmax = mx.SoftmaxOutput(data=fc, name=:loss) +pool = mx.Pooling(in5b, pool_type=:avg, kernel=(7,7), name=:global_pool) +flatten = mx.Flatten(pool, name=:flatten1) +fc = mx.FullyConnected(flatten, num_hidden=10, name=:fc1) +softmax = mx.SoftmaxOutput(fc, name=:loss) #-------------------------------------------------------------------------------- diff --git a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl index ca48e6693213..af3e8c41dc71 100644 --- a/examples/mnist/lenet.jl +++ b/examples/mnist/lenet.jl @@ -7,25 +7,25 @@ using MXNet data = mx.Variable(:data) # first conv -conv1 = @mx.chain mx.Convolution(data=data, kernel=(5,5), num_filter=20) => +conv1 = @mx.chain mx.Convolution(data, kernel=(5,5), num_filter=20) => mx.Activation(act_type=:tanh) => mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) # second conv -conv2 = @mx.chain mx.Convolution(data=conv1, kernel=(5,5), num_filter=50) => +conv2 = @mx.chain mx.Convolution(conv1, kernel=(5,5), num_filter=50) => mx.Activation(act_type=:tanh) => mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) # first fully-connected -fc1 = @mx.chain mx.Flatten(data=conv2) => +fc1 = @mx.chain mx.Flatten(conv2) => mx.FullyConnected(num_hidden=500) => mx.Activation(act_type=:tanh) # second fully-connected -fc2 = mx.FullyConnected(data=fc1, num_hidden=10) +fc2 = mx.FullyConnected(fc1, num_hidden=10) # softmax loss -lenet = mx.SoftmaxOutput(data=fc2, name=:softmax) +lenet = mx.SoftmaxOutput(fc2, name=:softmax) #-------------------------------------------------------------------------------- diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index cdb0064da8e5..3f713654d5b9 100644 --- 
a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -6,12 +6,12 @@ using MXNet #-- Option 1: explicit composition # data = mx.Variable(:data) -# fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) -# act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) -# fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) -# act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) -# fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) -# mlp = mx.SoftmaxOutput(data = fc3, name=:softmax) +# fc1 = mx.FullyConnected(data, name=:fc1, num_hidden=128) +# act1 = mx.Activation(fc1, name=:relu1, act_type=:relu) +# fc2 = mx.FullyConnected(act1, name=:fc2, num_hidden=64) +# act2 = mx.Activation(fc2, name=:relu2, act_type=:relu) +# fc3 = mx.FullyConnected(act2, name=:fc3, num_hidden=10) +# mlp = mx.SoftmaxOutput(fc3, name=:softmax) #-- Option 2: using the mx.chain macro # mlp = @mx.chain mx.Variable(:data) => From 286d751eb29ccc69c581b5dcf76466a09efd1e61 Mon Sep 17 00:00:00 2001 From: Michael Creel Date: Fri, 30 Sep 2016 12:54:32 +0200 Subject: [PATCH 421/630] Add files via upload simple MLP for regression, illustrates data provision from memory, and how to obtain fits --- examples/regression-example.jl | 62 ++++++++++++++++++++++++++++++++++ 1 file changed, 62 insertions(+) create mode 100644 examples/regression-example.jl diff --git a/examples/regression-example.jl b/examples/regression-example.jl new file mode 100644 index 000000000000..645c6325b066 --- /dev/null +++ b/examples/regression-example.jl @@ -0,0 +1,62 @@ +#= +This script shows how a simple MLP net may be used +for regression. It shows how data in memory may be +used for training and evaluation, and how to obtain +the predictions from the trained net. 
+ +TO DO: + * specify batch size, and allow different sizes + for the training and evaluation sets + * tanh activation does not seem to work properly, + investigate +=# +using MXNet +using Distributions +using PyPlot + +# data generating process for exogenous inputs +generate_inputs(media, var, tam) = rand(MvNormal(media, var), tam) + +# function that maps inputs to outputs +f1(data) = sin(data[1,:]).*sin(data[2,:])./(data[1,:].*data[2,:]) + +# parameters for input d.g.p. +mean=[0.0;0.0] +var=[1.0 0.0;0.0 1.0] + +# create training and evaluation data sets +TrainInput = generate_inputs(mean, var, 5000) +TrainOutput = f1(TrainInput) +ValidationInput = generate_inputs(mean, var, 5000) +ValidationOutput = f1(ValidationInput) + +# how to set up data providers using data in memory +trainprovider = mx.ArrayDataProvider(:data => TrainInput, :label => TrainOutput) +evalprovider = mx.ArrayDataProvider(:data => ValidationInput, :label => ValidationOutput) + +# create a single hidden layer MPL +data = mx.Variable(:data) +label = mx.Variable(:label) +fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=20) +act1 = mx.Activation(data = fc1, name=:relu, act_type=:relu) +fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=1) + +# cost is squared error loss +cost = mx.LinearRegressionOutput(data=fc2, label=label, name = :loss) + +# final model definition +model = mx.FeedForward(cost, context=mx.cpu()) + +# set up the optimizer +optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) + +# train, reporting loss for training and evaluation sets +mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 1000) + +# obtain predictions +fit = mx.predict(model, evalprovider) +plot(ValidationOutput,fit',".") +xlabel("true") +ylabel("predicted") +title("outputs: true versus predicted. 
45º line is what we hope for") + From 8453c0a23681eae0ebdb1fb1bf961372963c9dde Mon Sep 17 00:00:00 2001 From: Michael Creel Date: Tue, 4 Oct 2016 19:53:42 +0200 Subject: [PATCH 422/630] Update regression-example.jl (#148) adds batch size, selection of optimizers, possibility for initialization --- examples/regression-example.jl | 65 +++++++++++++++++----------------- 1 file changed, 33 insertions(+), 32 deletions(-) diff --git a/examples/regression-example.jl b/examples/regression-example.jl index 645c6325b066..8c949f9b2fac 100644 --- a/examples/regression-example.jl +++ b/examples/regression-example.jl @@ -3,60 +3,61 @@ This script shows how a simple MLP net may be used for regression. It shows how data in memory may be used for training and evaluation, and how to obtain the predictions from the trained net. - -TO DO: - * specify batch size, and allow different sizes - for the training and evaluation sets - * tanh activation does not seem to work properly, - investigate =# using MXNet using Distributions using PyPlot -# data generating process for exogenous inputs -generate_inputs(media, var, tam) = rand(MvNormal(media, var), tam) - -# function that maps inputs to outputs -f1(data) = sin(data[1,:]).*sin(data[2,:])./(data[1,:].*data[2,:]) +# data generating process +generate_inputs(mean, var, size) = rand(MvNormal(mean, var), size) +output(data) = sin(data[1,:]).*sin(data[2,:])./(data[1,:].*data[2,:]) -# parameters for input d.g.p. 
+# create training and evaluation data sets mean=[0.0;0.0] var=[1.0 0.0;0.0 1.0] - -# create training and evaluation data sets -TrainInput = generate_inputs(mean, var, 5000) -TrainOutput = f1(TrainInput) -ValidationInput = generate_inputs(mean, var, 5000) -ValidationOutput = f1(ValidationInput) +samplesize = 5000 +TrainInput = generate_inputs(mean, var, samplesize) +TrainOutput = output(TrainInput) +ValidationInput = generate_inputs(mean, var, samplesize) +ValidationOutput = output(ValidationInput) # how to set up data providers using data in memory -trainprovider = mx.ArrayDataProvider(:data => TrainInput, :label => TrainOutput) -evalprovider = mx.ArrayDataProvider(:data => ValidationInput, :label => ValidationOutput) +batchsize = 100 # can adjust this later, but must be defined now for next line +trainprovider = mx.ArrayDataProvider(:data => TrainInput, batch_size=batchsize, shuffle=true, :label => TrainOutput) +evalprovider = mx.ArrayDataProvider(:data => ValidationInput, batch_size=batchsize, shuffle=true, :label => ValidationOutput) -# create a single hidden layer MPL +# create a two hidden layer MLP: try varying num_hidden, and change tanh to relu, +# or add/remove a layer data = mx.Variable(:data) label = mx.Variable(:label) -fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=20) -act1 = mx.Activation(data = fc1, name=:relu, act_type=:relu) -fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=1) +net = @mx.chain mx.FullyConnected(data = data, num_hidden=10) => + mx.Activation(act_type=:tanh) => + mx.FullyConnected(num_hidden=3) => + mx.Activation(act_type=:tanh) => + mx.FullyConnected(num_hidden=1) -# cost is squared error loss -cost = mx.LinearRegressionOutput(data=fc2, label=label, name = :loss) +# squared error loss is appropriate for regression, don't change +cost = mx.LinearRegressionOutput(data = net, label=label) -# final model definition +# final model definition, don't change, except if using gpu model = mx.FeedForward(cost, 
context=mx.cpu()) -# set up the optimizer -optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) +# set up the optimizer: select one, explore parameters, if desired +#optimizer = mx.SGD(lr=0.01, momentum=0.9, weight_decay=0.00001) +optimizer = mx.ADAM() # train, reporting loss for training and evaluation sets -mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 1000) +# initial training with small batch size, to get to a good neighborhood +batchsize = 100 +mx.fit(model, optimizer, initializer=mx.NormalInitializer(0.0,0.1), eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 500) +# more training with the full sample +batchsize = samplesize +mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 500) # obtain predictions -fit = mx.predict(model, evalprovider) +plotprovider = mx.ArrayDataProvider(:data => ValidationInput, :label => ValidationOutput) +fit = mx.predict(model, plotprovider) plot(ValidationOutput,fit',".") xlabel("true") ylabel("predicted") title("outputs: true versus predicted. 45º line is what we hope for") - From 4664f3b944f1c298e5e3b182c6d86ac50d22713c Mon Sep 17 00:00:00 2001 From: Ranjan Anantharaman Date: Thu, 6 Oct 2016 20:45:59 +0530 Subject: [PATCH 423/630] Add some docs to `eachbatch` (#149) --- src/io.jl | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/src/io.jl b/src/io.jl index 0c5de69e53f8..da3ba52cecff 100644 --- a/src/io.jl +++ b/src/io.jl @@ -212,6 +212,17 @@ function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name error("$name is not provided by this data provider") end +""" + eachbatch(provider::AbstractDataProvider) + +Allows you to perform operations on data every epoch. This is especially useful +when you need to perform real-time augmentation of the data. + +# Arguments: +* `provider`: an instance of the custom DataProvider type. 
You must return this +instance after modifying its fields. + +""" eachbatch(provider :: AbstractDataProvider) = provider """ From eee5ca73ed1042f058730a2d92ef952e3bf416bf Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Mon, 24 Oct 2016 11:15:52 +0900 Subject: [PATCH 424/630] fix missing wget #150 --- src/util.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/util.jl b/src/util.jl index a53647790c06..89a2e508f993 100644 --- a/src/util.jl +++ b/src/util.jl @@ -41,7 +41,7 @@ function get_cifar10() filenames = Dict([k => joinpath(cifar10_dir, v) for (k,v) in filenames]) if !all(isfile, values(filenames)) cd(cifar10_dir) do - run(`http://data.dmlc.ml/mxnet/data/cifar10.zip`) + download("http://data.dmlc.ml/mxnet/data/cifar10.zip", "cifar10.zip") try run(`unzip -u cifar10.zip`) catch From d1eb31833c3980efb622414c37f5046f54177876 Mon Sep 17 00:00:00 2001 From: jocklawrie Date: Thu, 8 Dec 2016 12:25:14 +1100 Subject: [PATCH 425/630] Bug fix updating the ACE loss function. Included a test case. Also provided an example. --- examples/nondefault-example.jl | 130 +++++++++++++++++++++++++++++++++ src/metric.jl | 5 +- test/unittest/metric.jl | 62 ++++++++++++++++ 3 files changed, 194 insertions(+), 3 deletions(-) create mode 100644 examples/nondefault-example.jl create mode 100644 test/unittest/metric.jl diff --git a/examples/nondefault-example.jl b/examples/nondefault-example.jl new file mode 100644 index 000000000000..b93887850ca3 --- /dev/null +++ b/examples/nondefault-example.jl @@ -0,0 +1,130 @@ +#= + Contents: This file contains code for: + - Setting the initial values of the biases and weights equal to the final values of a previous run. + This is helpful for re-estimating a model on updated training data, where the original and updated training data largely overlap. + - Changing the loss function (in our example from Accuracy to ACE) + + Notes: + 1. The model is a toy example with 4 outcomes (categories). 
+ The model is a poor fit to the data, but this is unimportant. The point of the example is to demonstrate the use of some non-default settings. + 2. For categorical outcomes, use 0-based categories! Some of the loss functions assume this, such as ACE. + 3. Incomplete batches are padded with repeated instances of an artificial observation. + This is bad because the artificial data is over-represented and thus biases the results. + The ideal solution is to distribute the observations from the incomplete batch among the complete batches. + This would result in batches of variable but similar size, and thus the estimate of the gradient would not be significantly affected. + But this doesn't happen. + For simplicity we instead drop these extra observations, so that the number of observations in the data set is a multiple of the batch_size. +=# + + +using RDatasets +using MXNet + + +################################################################################ +### Data: Exam scores discretised into 4 categories (use zero-based categories!). 
+df = dataset("mlmRev", "Gcsemv"); # 1905 x 5 +complete_cases!(df) # 1523 x 5 +n = nrow(df) +df[:written] = zeros(Int, n) +df[:course] = zeros(Int, n) +for i = 1:n + # Categorise :Written + if df[i, :Written] <= 20.0 + df[i, :written] = 0 + elseif df[i, :Written] <= 40.0 + df[i, :written] = 1 + elseif df[i, :Written] <= 60.0 + df[i, :written] = 2 + else + df[i, :written] = 3 + end + + # Categorise :Course + if df[i, :Course] <= 25.0 + df[i, :course] = 0 + elseif df[i, :Course] <= 50.0 + df[i, :course] = 1 + elseif df[i, :Course] <= 75.0 + df[i, :course] = 2 + else + df[i, :course] = 3 + end +end +df = df[1:1500, :] # Ensure nrows is a multiple of batch_size (100 in our example, see below) + +x = convert(Vector{Float64}, df[:course]) +y = convert(Vector{Float64}, df[:written]) + + +################################################################################ +### Hyperparameters + +# Architecture +mlp = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name = :h1, num_hidden = 10) => + mx.Activation(name = :h1_out, act_type = :sigmoid) => + mx.FullyConnected(name = :out, num_hidden = 4) => + mx.SoftmaxOutput(name = :softmax) + +# Hyperparameters +n_epoch = 100 +batch_size = 100 +learn_rate = 0.1 +mom = 0.9 +wt_decay = 0.00001 + + +# Connect data, network architecture and hyperparameters +train_prov = mx.ArrayDataProvider(x, y; batch_size = batch_size) +eval_prov = mx.ArrayDataProvider(x, y; batch_size = batch_size) +opt = mx.SGD(lr = learn_rate, momentum = mom, weight_decay = wt_decay) # Optimizing algorithm + +################################################################################ +### Run 1: Basic run, storing initial and final state. 
+ +# Learn +mdl1 = mx.FeedForward(mlp, context = mx.cpu()) # Model targets the local CPU +cb = mx.do_checkpoint("first", frequency = n_epoch, save_epoch_0 = true) # Write initial and final states to disk +mx.fit(mdl1, opt, train_prov, n_epoch = n_epoch, eval_data = eval_prov, callbacks = [cb]) # Random initial biases and weights + + +################################################################################ +### Run 2: Load the previously trained model and run it some more, starting where Run 1 finished. + +# Load final state of 1st run from disk +arch, arg_params, aux_params = mx.load_checkpoint("first", 100) # arch is the network structure, arg_params contains the weights and biases +mdl2 = mx.FeedForward(arch, context = mx.cpu()) # Only populates the arch and ctx fields +mdl2.arg_params = arg_params # Populate the arg_params fields +cb = mx.do_checkpoint("second", frequency = n_epoch, save_epoch_0 = true) +mx.fit(mdl2, opt, train_prov, n_epoch = n_epoch, eval_data = eval_prov, callbacks = [cb]) + +# Test whether the final state of 1st run equals the initial state of 2nd run +run(`diff first-0100.params second-0000.params`) # Throws error if not true, does nothing otherwise + + +#= + # Other useful functions + arch = mx.load("first-symbol.json", mx.SymbolicNode) + arg_params = mx.load("first-0100.params", mx.NDArray) +=# + + +################################################################################ +### Run 3: Change the loss function from the default Accuracy to ACE + +mdl3 = mx.FeedForward(mlp, context = mx.cpu()) +mx.fit(mdl3, opt, train_prov, n_epoch = n_epoch, eval_data = eval_prov, eval_metric = mx.ACE()) +#mx.fit(mdl3, opt, train_prov, n_epoch = n_epoch, eval_data = eval_prov, eval_metric = mx.Accuracy()) # Default eval_metric +#mx.fit(mdl3, opt, train_prov, n_epoch = n_epoch, eval_data = eval_prov, eval_metric = mx.MultiACE(4)) + +# Test manually +probs = mx.predict(mdl3, eval_prov) +LL = 0.0 +for i = 1:size(y, 1) + LL += log(probs[Int(y[i]) 
+ 1, i]) +end +-LL / size(y, 1) # Should equal the value of ACE from the final iteration of fit(mdl3, ...) + + +# EOF diff --git a/src/metric.jl b/src/metric.jl index 4ae66acf25b7..dc3c3aef452a 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -213,15 +213,14 @@ function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) # Since we can only target labels right now this is the only thing we can do. target = Int(labels[i, j, 1, sample]) + 1 # klasses are 0...k-1 => julia indexing p_k = pred[i, j, target, sample] - metric.ace_sum += log(p_k) metric.n_sample += 1 end end end elseif ndims(pred) == 2 # 1-dimensional case - for sample in 1:size(labels, 1) - target = Int(labels[sample]) + 1 + for sample in 1:size(label, 1) + target = Int(label[sample]) + 1 # 0-based indexing => 1-based indexing p_k = pred[target, sample] metric.ace_sum += log(p_k) metric.n_sample += 1 diff --git a/test/unittest/metric.jl b/test/unittest/metric.jl new file mode 100644 index 000000000000..f0a79d6ce994 --- /dev/null +++ b/test/unittest/metric.jl @@ -0,0 +1,62 @@ +module TestMetric + +using MXNet +using Base.Test + +################################################################################ +# Supporting functions +################################################################################ + +""" +Returns a random n x m array in which each column defines a discrete probability distribution. +Each column contains numbers between 0 and 1, and each column sums to 1. 
+""" +function generate_probs(n, m) + # Init + result = rand(n, m) + + # Normalize: ensure each column sums to 1 + for j = 1:m + colsum = sum(result[:, j]) + for i = 1:n + result[i, j] /= colsum + end + end + result +end + + +function loglikelihood{T <: AbstractFloat}(labels::Vector{T}, probs::Array{T, 2}) + LL = 0.0 + for i = 1:size(labels, 1) + LL += log(probs[Int(labels[i]) + 1, i]) # labels are zero-based + end + LL / size(labels, 1) +end + + +################################################################################ +# Test Implementations +################################################################################ + +function test_ace() + info("EvalMetric::ACE") + n_categories = 4 + n_observations = 100 + labels = convert(Vector{Float32}, rand(0:(n_categories - 1), n_observations)) # MXNet uses Float32 + probs = convert(Array{Float32}, generate_probs(n_categories, n_observations)) + LL = loglikelihood(labels, probs) + metric = mx.ACE() # For categorical variables, ACE == -LL + mx._update_single_output(metric, mx.NDArray(labels), mx.NDArray(probs)) + LL_v2 = metric.ace_sum / metric.n_sample + @test_approx_eq_eps LL LL_v2 1e-12 +end + + +################################################################################ +# Run tests +################################################################################ +test_ace() + + +end From b81b26ca5a7c69afb0e160e69f15a7296d4f4d44 Mon Sep 17 00:00:00 2001 From: Arkoniak Date: Thu, 29 Dec 2016 23:55:16 +0400 Subject: [PATCH 426/630] New Optimizers (#159) * Added implementation of RMSProp, AdaGrad, AdaDelta * Added AdaMax and Nadam --- docs/src/api/optimizer.md | 29 +++++++++++ examples/mnist/mlp-test.jl | 5 ++ src/optimizer.jl | 58 +++++++++++++++++++-- src/optimizers/adadelta.jl | 91 +++++++++++++++++++++++++++++++++ src/optimizers/adagrad.jl | 66 ++++++++++++++++++++++++ src/optimizers/adam.jl | 6 +-- src/optimizers/adamax.jl | 77 ++++++++++++++++++++++++++++ src/optimizers/nadam.jl | 100 
+++++++++++++++++++++++++++++++++++++ src/optimizers/rmsprop.jl | 71 ++++++++++++++++++++++++++ 9 files changed, 497 insertions(+), 6 deletions(-) create mode 100644 src/optimizers/adadelta.jl create mode 100644 src/optimizers/adagrad.jl create mode 100644 src/optimizers/adamax.jl create mode 100644 src/optimizers/nadam.jl create mode 100644 src/optimizers/rmsprop.jl diff --git a/docs/src/api/optimizer.md b/docs/src/api/optimizer.md index 81fad7cb827e..17974a577913 100644 --- a/docs/src/api/optimizer.md +++ b/docs/src/api/optimizer.md @@ -19,3 +19,32 @@ Modules = [MXNet.mx] Pages = ["optimizers/adam.jl"] ``` +### AdaGrad +```@autodocs +Modules = [MXNet.mx] +Pages = ["optimizers/adagrad.jl"] +``` + +### AdaDelta +```@autodocs +Modules = [MXNet.mx] +Pages = ["optimizers/adadelta.jl"] +``` + +### AdaMax +```@autodocs +Modules = [MXNet.mx] +Pages = ["optimizers/adamax.jl"] +``` + +### RMSProp +```@autodocs +Modules = [MXNet.mx] +Pages = ["optimizers/rmsprop.jl"] +``` + +### Nadam +```@autodocs +Modules = [MXNet.mx] +Pages = ["optimizers/nadam.jl"] +``` diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index 4931944032a9..a88ba3772fb0 100644 --- a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -74,6 +74,11 @@ end function test_mnist_mlp() @test mnist_fit_and_predict(mx.SGD(lr=0.1, momentum=0.9), mx.UniformInitializer(0.01), 2) > 90 @test mnist_fit_and_predict(mx.ADAM(), mx.NormalInitializer(), 2) > 90 + @test mnist_fit_and_predict(mx.AdaGrad(), mx.NormalInitializer(), 2) > 90 + @test mnist_fit_and_predict(mx.AdaDelta(), mx.NormalInitializer(), 2) > 90 + @test mnist_fit_and_predict(mx.AdaMax(), mx.NormalInitializer(), 2) > 90 + @test mnist_fit_and_predict(mx.RMSProp(), mx.NormalInitializer(), 2) > 90 + @test mnist_fit_and_predict(mx.Nadam(), mx.NormalInitializer(), 2) > 90 end test_mnist_mlp() diff --git a/src/optimizer.jl b/src/optimizer.jl index c672c2fe998a..66f7d660847a 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -158,6 
+158,42 @@ type Fixed <: AbstractMomentumScheduler momentum :: Float64 end get_momentum(self :: Fixed, state :: OptimizationState) = self.momentum + +""" + Momentum.NadamScheduler + +Nesterov-accelerated adaptive momentum scheduler. + +Description in "Incorporating Nesterov Momentum into Adam." +[http://cs229.stanford.edu/proj2015/054_report.pdf] +(http://cs229.stanford.edu/proj2015/054_report.pdf) + +``\mu_t = \mu_0 * (1 - \gamma * \alpha^{t * \delta})``. +Here +* ``t`` is the iteration count +* ``\delta``: default `0.004` is scheduler decay, +* ``\gamma``: default `0.5` +* ``\alpha``: default `0.96` +* ``\mu_0``: default `0.99` +""" +type NadamScheduler <: AbstractMomentumScheduler + mu0 :: Float64 + delta :: Float64 + gamma :: Float64 + alpha :: Float64 +end +function NadamScheduler(;mu0::Real=0.99, delta::Real=0.004, + gamma::Real=0.5, alpha::Real=0.96) + @assert(0.0 <= delta) + @assert(0.0 <= alpha <= 1.0) + @assert(0.0 <= mu0 <= 1.0) + @assert(0.0 <= gamma <= 1.0) + NadamScheduler(Float64(mu0), Float64(delta), Float64(gamma), Float64(alpha)) +end +get_momentum(self :: NadamScheduler, state :: OptimizationState) = + self.mu0 * (1.0 - self.gamma*self.alpha^(state.curr_iter * self.delta)), + self.mu0 * (1.0 - self.gamma*self.alpha^((state.curr_iter + 1) * self.delta)) + end # module Momentum ################################################################################ function get_momentum_scheduler(scheduler :: Any, momentum :: Real) @@ -170,6 +206,15 @@ function get_momentum_scheduler(scheduler :: Any, momentum :: Real) end end +function get_momentum_scheduler(scheduler :: Any, + another_scheduler :: AbstractMomentumScheduler) + + if isa(scheduler, AbstractMomentumScheduler) + return scheduler + else + return another_scheduler + end +end """ get_updater(optimizer) @@ -198,10 +243,10 @@ Base class for all optimizer options. 
abstract AbstractOptimizerOptions """ - normalized_gradient(opts, state, grad) + normalized_gradient(opts, state, weight, grad) * `opts::AbstractOptimizerOptions`: options for the optimizer, should contain the field - `grad_scale`, `grad_clip` and `weight_decay`. +`grad_clip` and `weight_decay`. * `state::OptimizationState`: the current optimization state. * `weight::NDArray`: the trainable weights. * `grad::NDArray`: the original gradient of the weights. @@ -216,10 +261,17 @@ function normalized_gradient(opts::AbstractOptimizerOptions, state::Optimization if opts.grad_clip > 0 grad = clip(grad, -opts.grad_clip, opts.grad_clip) end - @inplace grad += opts.weight_decay * weight + if opts.weight_decay > 0 + @inplace grad += opts.weight_decay * weight + end return grad end include("optimizers/sgd.jl") include("optimizers/adam.jl") +include("optimizers/adagrad.jl") +include("optimizers/adadelta.jl") +include("optimizers/adamax.jl") +include("optimizers/rmsprop.jl") +include("optimizers/nadam.jl") diff --git a/src/optimizers/adadelta.jl b/src/optimizers/adadelta.jl new file mode 100644 index 000000000000..e00cc9a42abd --- /dev/null +++ b/src/optimizers/adadelta.jl @@ -0,0 +1,91 @@ +@defstruct AdaDeltaOptions <: AbstractOptimizerOptions ( + (lr :: Real = 1.0, lr > 0), + (rho :: Real = 0.95, rho > 0 && rho < 1), + (epsilon :: Real = 1e-6, epsilon > 0), + (grad_clip :: Real = 0, grad_clip >= 0), + (weight_decay :: Real = 0.00001, weight_decay >= 0), + lr_scheduler :: Any = nothing +) + +""" + AdaDelta + +Scale learning rates by the ratio of accumulated gradients to accumulated +updates, see [1] and notes for further description. + + AdaDelta(; kwargs...) 
+ +# Attributes +* `lr::Real`: default `1.0`, the learning rate controlling the + size of update steps +* `rho::Real`: default `0.95`, squared gradient moving average decay factor +* `epsilon::Real`: default `1e-6`, small value added for + numerical stability +* `grad_clip::Real`: default `0`, if positive, will clip the gradient + into the range `[-grad_clip, grad_clip]`. +* `weight_decay::Real`: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. + +# Notes +`rho` should be between 0 and 1. A value of `rho` close to 1 will decay the +moving average slowly and a value close to 0 will decay the moving average +fast. + +`rho` = 0.95 and `epsilon` = 1e-6 are suggested in the paper and reported to +work for multiple datasets (MNIST, speech). In the paper, no learning rate is +considered (so `lr` = 1.0). Probably best to keep it at this value. + +`epsilon` is important for the very first update (so the numerator does +not become 0). + +Using the step size `lr` and a decay factor `rho` the learning rate is +calculated as: +``r_t &= \rho r_{t-1} + (1-\rho)*g^2\\ +\eta_t &= \eta \frac{\sqrt{s_{t-1} + \epsilon}} {\sqrt{r_t + \epsilon}}\\ +s_t &= \rho s_{t-1} + (1-\rho)*(\eta_t*g)^2`` + +# References +* [1]: Zeiler, M. D. (2012): + ADADELTA: An Adaptive Learning Rate Method. arXiv Preprint arXiv:1212.5701. +""" + +type AdaDelta <: AbstractOptimizer + opts :: AdaDeltaOptions + state :: OptimizationState + + function AdaDelta(; kwargs...) + opts = AdaDeltaOptions(;kwargs...) 
+ opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) + + new(opts) + end +end + +type AdaDeltaState + acc :: NDArray + delta_acc :: NDArray +end + +function create_state(self :: AdaDelta, index :: Int, weight :: NDArray) + return AdaDeltaState(zeros(size(weight), context(weight)), + zeros(size(weight), context(weight))) +end + +function update(self :: AdaDelta, index :: Int, weight :: NDArray, + grad :: NDArray, state :: AdaDeltaState) + lr = get_learning_rate(self.opts.lr_scheduler, self.state) + grad = normalized_gradient(self.opts, self.state, weight, grad) + + # Update state.acc as in RMSProp + @inplace state.acc .*= self.opts.rho + @inplace state.acc .+= (1 - self.opts.rho) * grad .* grad + + # Compute update using the "old" state.delta_acc + update = grad .* sqrt(state.delta_acc + self.opts.epsilon) ./ + (sqrt(state.acc + self.opts.epsilon)) + @inplace weight .+= -lr * update + + # update state.delta_acc using update + @inplace state.delta_acc .*= self.opts.rho + @inplace state.delta_acc .+= (1 - self.opts.rho) * update .* update +end diff --git a/src/optimizers/adagrad.jl b/src/optimizers/adagrad.jl new file mode 100644 index 000000000000..196998121cce --- /dev/null +++ b/src/optimizers/adagrad.jl @@ -0,0 +1,66 @@ +@defstruct AdaGradOptions <: AbstractOptimizerOptions ( + (lr :: Real = 0.1, lr > 0), + (epsilon :: Real = 1e-6, epsilon > 0), + (grad_clip :: Real = 0, grad_clip >= 0), + (weight_decay :: Real = 0.00001, weight_decay >= 0), + lr_scheduler :: Any = nothing +) + +""" + AdaGrad + +Scale learning rates by dividing with the square root of accumulated +squared gradients. See [1] for further description. + + AdaGrad(; kwargs...) + +# Attributes +* `lr::Real`: default `0.1`, the learning rate controlling the + size of update steps +* `epsilon::Real`: default `1e-6`, small value added for + numerical stability +* `grad_clip::Real`: default `0`, if positive, will clip the gradient + into the range `[-grad_clip, grad_clip]`. 
+* `weight_decay::Real`: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. + +# Notes +Using step size lr AdaGrad calculates the learning rate for feature i at +time step t as: +``η_{t,i} = \frac{lr}{\sqrt{\sum^t_{t^\prime} g^2_{t^\prime,i} + ϵ}} g_{t,i}`` +as such the learning rate is monotonically decreasing. +Epsilon is not included in the typical formula, see [2]. + +# References +* [1]: Duchi, J., Hazan, E., & Singer, Y. (2011): + Adaptive subgradient methods for online learning and + stochastic optimization. JMLR, 12:2121-2159. +* [2]: Chris Dyer: Notes on AdaGrad. + [http://www.ark.cs.cmu.edu/cdyer/adagrad.pdf] + (http://www.ark.cs.cmu.edu/cdyer/adagrad.pdf) +""" + +type AdaGrad <: AbstractOptimizer + opts :: AdaGradOptions + state :: OptimizationState + + function AdaGrad(; kwargs...) + opts = AdaGradOptions(;kwargs...) + opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) + + new(opts) + end +end + +function create_state(self :: AdaGrad, index :: Int, weight :: NDArray) + return zeros(size(weight), context(weight)) +end + +function update(self :: AdaGrad, index :: Int, weight :: NDArray, + grad :: NDArray, state :: NDArray) + lr = get_learning_rate(self.opts.lr_scheduler, self.state) + grad = normalized_gradient(self.opts, self.state, weight, grad) + + @inplace state .+= grad .* grad + @inplace weight .+= -lr * grad ./ (sqrt(state + self.opts.epsilon)) +end diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index 665cc52694b0..3af5c3579736 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -63,11 +63,11 @@ function update(self :: ADAM, index :: Int, weight :: NDArray, grad :: NDArray, state.mt = self.opts.beta1 * state.mt + (1 - self.opts.beta1) * grad state.vt = self.opts.beta2 * state.vt + (1 - self.opts.beta2) * (grad .* grad) - mt = state.mt / (1 - state.beta1Power) - vt = state.vt / (1 - state.beta2Power) + at = sqrt(1.0 - state.beta2Power)/(1.0 - 
state.beta1Power) state.beta1Power *= self.opts.beta1 state.beta2Power *= self.opts.beta2 - @inplace weight .+= -lr * mt ./ (sqrt(vt) + self.opts.epsilon) + @inplace weight .+= -lr * at * state.mt ./ + (sqrt(state.vt) + self.opts.epsilon) end diff --git a/src/optimizers/adamax.jl b/src/optimizers/adamax.jl new file mode 100644 index 000000000000..838264360e1b --- /dev/null +++ b/src/optimizers/adamax.jl @@ -0,0 +1,77 @@ +@defstruct AdaMaxOptions <: AbstractOptimizerOptions ( + (lr :: Real = 0.002, lr > 0), + (beta1 :: Real = 0.9, beta1 > 0 && beta1 < 1), + (beta2 :: Real = 0.999, beta2 > 0 && beta2 < 1), + (epsilon :: Real = 1e-8, epsilon > 0), + (grad_clip :: Real = 0, grad_clip >= 0), + (weight_decay :: Real = 0.00001, weight_decay >= 0), + lr_scheduler :: Any = nothing +) + +""" + AdaMax + +This is a variant of the Adam algorithm based on the infinity norm. +See [1] for further description. + + AdaMax(; kwargs...) + +# Attributes +* `lr::Real`: default `0.002`, the learning rate controlling the + size of update steps +* `beta1::Real`: default `0.9`, exponential decay rate + for the first moment estimates +* `beta2::Real`: default `0.999`, exponential decay rate for the + weighted infinity norm estimates +* `epsilon::Real`: default `1e-8`, small value added for + numerical stability +* `grad_clip::Real`: default `0`, if positive, will clip the gradient + into the range `[-grad_clip, grad_clip]`. +* `weight_decay::Real`: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. + +# References +* [1]: Kingma, Diederik, and Jimmy Ba (2014): + Adam: A Method for Stochastic Optimization. + [http://arxiv.org/abs/1412.6980v8] + (http://arxiv.org/abs/1412.6980v8). +""" + +type AdaMax <: AbstractOptimizer + opts :: AdaMaxOptions + state :: OptimizationState + + function AdaMax(; kwargs...) + opts = AdaMaxOptions(; kwargs...) 
+ opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) + + new(opts) + end +end + +type AdaMaxState + mt :: NDArray + ut :: NDArray + beta1Power :: Float64 +end + +function create_state(self :: AdaMax, index :: Int, weight :: NDArray) + return AdaMaxState( zeros(size(weight), context(weight)), + zeros(size(weight), context(weight)), + self.opts.beta1 ) +end + +function update(self :: AdaMax, index :: Int, weight :: NDArray, + grad :: NDArray, state :: AdaMaxState) + lr = get_learning_rate(self.opts.lr_scheduler, self.state) + grad = normalized_gradient(self.opts, self.state, weight, grad) + + @inplace state.mt .*= self.opts.beta1 + @inplace state.mt .+= (1 - self.opts.beta1) * grad + state.ut = _maximum(self.opts.beta2 * state.ut, abs(grad)) + + @inplace weight .+= - lr / (1 - state.beta1Power) * + state.mt ./ (state.ut + self.opts.epsilon) + + state.beta1Power *= self.opts.beta1 +end diff --git a/src/optimizers/nadam.jl b/src/optimizers/nadam.jl new file mode 100644 index 000000000000..65a195f674fe --- /dev/null +++ b/src/optimizers/nadam.jl @@ -0,0 +1,100 @@ +@defstruct NadamOptions <: AbstractOptimizerOptions ( + (lr :: Real = 0.001, lr > 0), + (beta1 :: Real = 0.99, beta1 > 0 && beta1 < 1), + (beta2 :: Real = 0.999, beta2 > 0 && beta2 < 1), + (epsilon :: Real = 1e-8, epsilon > 0), + (grad_clip :: Real = 0, grad_clip >= 0), + (weight_decay :: Real = 0.00001, weight_decay >= 0), + lr_scheduler :: Any = nothing, + momentum_scheduler :: Any = nothing +) + +""" + Nadam + +Nesterov Adam optimizer: Adam RMSprop with Nesterov momentum, +see [1] and notes for further description. + + Nadam(; kwargs...) + +# Attributes +* `lr::Real`: default `0.001`, learning rate. +* `beta1::Real`: default `0.99`. +* `beta2::Real`: default `0.999`. +* `epsilon::Real`: default `1e-8`, small value added for + numerical stability +* `grad_clip::Real`: default `0`, if positive, will clip the gradient + into the range `[-grad_clip, grad_clip]`. 
+* `weight_decay::Real`: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. +* `lr_scheduler::AbstractLearningRateScheduler`: default `nothing`, a + dynamic learning rate scheduler. If set, will overwrite the `lr` + parameter. +* `momentum_scheduler::AbstractMomentumScheduler` default + `NadamScheduler` of the form + ``\mu_t = beta1 * (1 - 0.5 * 0.96^{t * 0.004})`` + +# Notes +Default parameters follow those provided in the paper. +It is recommended to leave the parameters of this optimizer +at their default values. + +# References +* [1]: Incorporating Nesterov Momentum into Adam. + [http://cs229.stanford.edu/proj2015/054_report.pdf] + (http://cs229.stanford.edu/proj2015/054_report.pdf) +* [2]: On the importance of initialization and momentum in deep learning + [http://www.cs.toronto.edu/~fritz/absps/momentum.pdf] + (http://www.cs.toronto.edu/~fritz/absps/momentum.pdf) +""" +type Nadam <: AbstractOptimizer + opts :: NadamOptions + state :: OptimizationState + + function Nadam(; kwargs...) + opts = NadamOptions(; kwargs...) 
+ opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) + opts.momentum_scheduler = get_momentum_scheduler(opts.momentum_scheduler, + Momentum.NadamScheduler(mu0=opts.beta1)) + + new(opts) + end +end + +type NadamState + mt :: NDArray + nt :: NDArray + momentum :: Float64 + beta2Power :: Float64 +end + +function create_state(self :: Nadam, index :: Int, weight :: NDArray) + return NadamState( zeros(size(weight), context(weight)), + zeros(size(weight), context(weight)), + 1.0, + self.opts.beta2 ) +end + +function update(self :: Nadam, index :: Int, weight :: NDArray, + grad :: NDArray, state :: NadamState) + lr = get_learning_rate(self.opts.lr_scheduler, self.state) + grad = normalized_gradient(self.opts, self.state, weight, grad) + + mu_t, mu_t1 = + get_momentum(self.opts.momentum_scheduler, self.state) + state.momentum *= mu_t + momentum_next = state.momentum * mu_t1 + + grad_prime = grad / (1.0 - state.momentum) + @inplace state.mt .*= self.opts.beta1 + @inplace state.mt .+= (1.0 - self.opts.beta1) * grad + mt = state.mt / (1.0 - momentum_next) + + @inplace state.nt .*= self.opts.beta2 + @inplace state.nt .+= (1.0 - self.opts.beta2) * grad .* grad + nt = state.nt / (1.0 - state.beta2Power) + state.beta2Power *= self.opts.beta2 + + mt_prime = (1.0 - mu_t) * grad_prime + mu_t1 * mt + @inplace weight .+= -lr * mt_prime ./ (sqrt(nt) + self.opts.epsilon) +end diff --git a/src/optimizers/rmsprop.jl b/src/optimizers/rmsprop.jl new file mode 100644 index 000000000000..01a40651d2f6 --- /dev/null +++ b/src/optimizers/rmsprop.jl @@ -0,0 +1,71 @@ +@defstruct RMSPropOptions <: AbstractOptimizerOptions ( + (lr :: Real = 0.001, lr > 0), + (rho :: Real = 0.9, rho > 0 && rho < 1), + (epsilon :: Real = 1e-6, epsilon > 0), + (grad_clip :: Real = 0, grad_clip >= 0), + (weight_decay :: Real = 0.00001, weight_decay >= 0), + lr_scheduler :: Any = nothing +) + +""" + RMSProp + +Scale learning rates by dividing with the moving average of the root mean +squared (RMS) gradients. 
See [1] for further description. + + RMSProp(; kwargs...) + +# Attributes +* `lr::Real`: default `0.001`, the learning rate controlling the + size of update steps +* `rho::Real`: default `0.9`, gradient moving average decay factor +* `epsilon::Real`: default `1e-6`, small value added for + numerical stability +* `grad_clip::Real`: default `0`, if positive, will clip the gradient + into the range `[-grad_clip, grad_clip]`. +* `weight_decay::Real`: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. + +# Notes +`rho` should be between 0 and 1. A value of `rho` close to 1 will decay the +moving average slowly and a value close to 0 will decay the moving average +fast. + +Using the step size ``lr`` and a decay factor ``\rho`` the +learning rate ``\eta_t`` is calculated as: +``r_t &= ρ r_{t-1} + (1 - ρ)*g^2 \\ + η_t &= \frac{lr}{\sqrt{r_t + ϵ}}`` + +# References +* [1]: Tieleman, T. and Hinton, G. (2012): + Neural Networks for Machine Learning, Lecture 6.5 - rmsprop. + Coursera. [http://www.youtube.com/watch?v=O3sxAc4hxZU] + (http://www.youtube.com/watch?v=O3sxAc4hxZU) (formula @5:20) +""" + +type RMSProp <: AbstractOptimizer + opts :: RMSPropOptions + state :: OptimizationState + + function RMSProp(; kwargs...) + opts = RMSPropOptions(;kwargs...) 
+ opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) + + new(opts) + end +end + +function create_state(self :: RMSProp, index :: Int, weight :: NDArray) + return zeros(size(weight), context(weight)) +end + +function update(self :: RMSProp, index :: Int, weight :: NDArray, + grad :: NDArray, state :: NDArray) + lr = get_learning_rate(self.opts.lr_scheduler, self.state) + grad = normalized_gradient(self.opts, self.state, weight, grad) + + @inplace state .*= self.opts.rho + @inplace state .+= (1 - self.opts.rho) * grad .* grad + + @inplace weight .+= -lr * grad ./ (sqrt(state + self.opts.epsilon)) +end From 1ea44c93e77917165f5b95b0d18ba304757e11d0 Mon Sep 17 00:00:00 2001 From: Arkoniak Date: Sat, 7 Jan 2017 05:15:11 +0400 Subject: [PATCH 427/630] Fix hygiene bug (#164) --- src/symbolic-node.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index dfc54c3c3b1c..55328e5126c7 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -52,7 +52,7 @@ macro _list_symbol_info(self, func_name) ref_sz = Ref{MX_uint}(0) ref_names = Ref{char_pp}(0) @mxcall($func_name, (MX_handle, Ref{MX_uint}, Ref{char_pp}), - $self, ref_sz, ref_names) + $(esc(self)), ref_sz, ref_names) narg = ref_sz[] names = unsafe_wrap(Array, ref_names[], narg) names = [Symbol(unsafe_wrap(String, x)) for x in names] From 4d0aa87d652fddf366b2dfa2c6812ac00b2224d5 Mon Sep 17 00:00:00 2001 From: Arkoniak Date: Sat, 7 Jan 2017 05:15:51 +0400 Subject: [PATCH 428/630] Fixed visualize (#163) --- src/visualize.jl | 24 ++++++++++++++++-------- test/unittest/visualize.jl | 34 ++++++++++++++++++++++++++++++++++ 2 files changed, 50 insertions(+), 8 deletions(-) create mode 100644 test/unittest/visualize.jl diff --git a/src/visualize.jl b/src/visualize.jl index f0dd74efdc67..42d31a22d69e 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -51,6 +51,14 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp attr 
= deepcopy(node_attr) label = op + # Up to 0.8 version of mxnet additional info was stored in + # node["param"]. Starting from pre0.9 `param` was changed to `attr`. + if haskey(node, "param") + node_info = node["param"] + elseif haskey(node, "attr") + node_info = node["attr"] + end + if op == "null" if i ∈ heads # heads are output nodes @@ -62,23 +70,23 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp end elseif op == "Convolution" label = format("Convolution\nkernel={1}\nstride={2}\nn-filter={3}", - _extract_shape(node["param"]["kernel"]), - _extract_shape(node["param"]["stride"]), - node["param"]["num_filter"]) + _extract_shape(node_info["kernel"]), + _extract_shape(node_info["stride"]), + node_info["num_filter"]) colorkey = 2 elseif op == "FullyConnected" - label = format("FullyConnected\nnum-hidden={1}", node["param"]["num_hidden"]) + label = format("FullyConnected\nnum-hidden={1}", node_info["num_hidden"]) colorkey = 2 elseif op == "Activation" - label = format("Activation\nact-type={1}", node["param"]["act_type"]) + label = format("Activation\nact-type={1}", node_info["act_type"]) colorkey = 3 elseif op == "BatchNorm" colorkey = 4 elseif op == "Pooling" label = format("Pooling\ntype={1}\nkernel={2}\nstride={3}", - node["param"]["pool_type"], - _extract_shape(node["param"]["kernel"]), - _extract_shape(node["param"]["stride"])) + node_info["pool_type"], + _extract_shape(node_info["kernel"]), + _extract_shape(node_info["stride"])) colorkey = 5 elseif op ∈ ("Concat", "Flatten", "Reshape") colorkey = 6 diff --git a/test/unittest/visualize.jl b/test/unittest/visualize.jl new file mode 100644 index 000000000000..973c2b7034d0 --- /dev/null +++ b/test/unittest/visualize.jl @@ -0,0 +1,34 @@ +module TestVisualize +using MXNet +using Base.Test + +using ..Main: mlp2 + +################################################################################ +# Test Implementations 
+################################################################################ + +function test_basic() + info("Visualize::basic") + + mlp = mlp2() + + # Order of elements or default color values can change, but length of the output should be more or less stable + @test length(mx.to_graphviz(mlp)) == length( +""" +digraph "Network Visualization" { +node [fontsize=10]; +edge [fontsize=10]; +"fc1" [label="fc1\\nFullyConnected\\nnum-hidden=1000",style="rounded,filled",fixedsize=true,width=1.3,fillcolor="#fb8072",shape=box,penwidth=2,height=0.8034,color="#941305"]; +"activation0" [label="activation0\\nActivation\\nact-type=relu",style="rounded,filled",fixedsize=true,width=1.3,fillcolor="#ffffb3",shape=box,penwidth=2,height=0.8034,color="#999900"]; +"fc2" [label="fc2\\nFullyConnected\\nnum-hidden=10",style="rounded,filled",fixedsize=true,width=1.3,fillcolor="#fb8072",shape=box,penwidth=2,height=0.8034,color="#941305"]; +"activation0" -> "fc1" [arrowtail=open,color="#737373",dir=back]; +"fc2" -> "activation0" [arrowtail=open,color="#737373",dir=back]; +} +""") +end +################################################################################ +# Run tests +################################################################################ +test_basic() +end From ab80048173e833556e9f5c0efe5891107884b961 Mon Sep 17 00:00:00 2001 From: Spencer Lyon Date: Fri, 6 Jan 2017 20:19:42 -0500 Subject: [PATCH 429/630] ENH: added verbosity training option to control printouts (#162) --- src/model.jl | 43 ++++++++++++++++++++++++++++--------------- 1 file changed, 28 insertions(+), 15 deletions(-) diff --git a/src/model.jl b/src/model.jl index a892dc886ca3..c3ec17e035c0 100644 --- a/src/model.jl +++ b/src/model.jl @@ -191,7 +191,7 @@ end for copying mini-batches of data. Since there is no concern about convergence in prediction, it is better to set the mini-batch size as large as possible (limited by your device memory) if prediction speed is a concern. 
- + For the same reason, currently prediction will only use the first device even if multiple devices are provided to construct the model. @@ -290,6 +290,7 @@ end kvstore :: Union{Base.Symbol, KVStore} = :local, force_init :: Bool = false, callbacks :: Vector{AbstractCallback} = AbstractCallback[], + verbosity :: Int = 3 ) function _invoke_callbacks{T<:Real}(self::FeedForward, callbacks::Vector{AbstractCallback}, @@ -340,24 +341,30 @@ Train the `model` on `data` with the `optimizer`. this option is set, it will always do random initialization at the begining of training. * `callbacks::Vector{AbstractCallback}`: keyword argument, default `[]`. Callbacks to be invoked at each epoch or mini-batch, see `AbstractCallback`. +* `verbosity::Int`: Determines the verbosity of the print messages. Higher numbers + leads to more verbose printing. Acceptable values are + - `0`: Do not print anything during training + - `1`: Print starting and final messages + - `2`: Print one time messages and a message at the start of each epoch + - `3`: Print a summary of the training and validation accuracy for each epoch """ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) opts = TrainingOptions(; kwargs...) 
- info("Start training on $(self.ctx)") + opts.verbosity >= 1 && info("Start training on $(self.ctx)") batch_size = get_batch_size(data) num_dev = length(self.ctx) slices = _split_inputs(batch_size, num_dev) # initialize parameters - info("Initializing parameters...") + opts.verbosity >= 2 && info("Initializing parameters...") arg_names, param_names, aux_names = _init_model(self, data, opts.initializer, opts.force_init) # setup kvstore kvstore = opts.kvstore if isa(kvstore, Base.Symbol) - info("Creating KVStore...") + opts.verbosity >= 2 && info("Creating KVStore...") kvstore, update_on_kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params) end @@ -388,7 +395,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra label_shapes = Dict([k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)]) train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=grad_req, data_shapes..., label_shapes...) dbg_str = mx.debug_str(train_execs[i]) - info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[i])) + opts.verbosity >= 2 && info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[i])) copy_params_from(train_execs[i], self.arg_params, self.aux_params) end @@ -420,7 +427,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra set_optimizer(kvstore, optimizer) end - info("Initializing KVStore...") + opts.verbosity >= 2 && info("Initializing KVStore...") # init kv with gradients for idx = 1:length(param_arrays) param_on_devs = param_arrays[idx] @@ -443,7 +450,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # invoke callbacks on epoch 0 _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback) - info("Start training...") + opts.verbosity >= 2 && info("Start training...") for i_epoch = 1:opts.n_epoch time_start = time() reset!(opts.eval_metric) @@ -515,12 +522,14 @@ function fit(self :: 
FeedForward, optimizer :: AbstractOptimizer, data :: Abstra time_stop = time() metric = get(opts.eval_metric) - info(format("== Epoch {1:0>3d} ==========", i_epoch)) - info("## Training summary") - for (name, value) in metric - info(format("{1:>18s} = {2:.4f}", string(name), value)) + opts.verbosity >= 2 && info(format("== Epoch {1:0>3d}/{2:0>3d} ==========", i_epoch, opts.n_epoch)) + if opts.verbosity >= 3 + info("## Training summary") + for (name, value) in metric + info(format("{1:>18s} = {2:.4f}", string(name), value)) + end + info(format("{1:>18s} = {2:.4f} seconds", "time", time_stop-time_start)) end - info(format("{1:>18s} = {2:.4f} seconds", "time", time_stop-time_start)) # evaluation on validation set if !isa(opts.eval_data, Void) @@ -546,9 +555,11 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra update!(opts.eval_metric, cpu_label_arrays, cpu_output_arrays) end - info("## Validation summary") - for (name, value) in get(opts.eval_metric) - info(format("{1:>18s} = {2:.4f}", string(name), value)) + if opts.verbosity >= 3 + info("## Validation summary") + for (name, value) in get(opts.eval_metric) + info(format("{1:>18s} = {2:.4f}", string(name), value)) + end end end @@ -566,6 +577,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback; metric=metric) end # end of all epochs + + opts.verbosity >= 1 && info("Finish training on $(self.ctx)") end function save_checkpoint(self :: FeedForward, prefix :: AbstractString, state :: OptimizationState) From 2393d4a969877548d4b840fdd95942ca2d0e46e5 Mon Sep 17 00:00:00 2001 From: Arkoniak Date: Mon, 9 Jan 2017 05:57:01 +0400 Subject: [PATCH 430/630] Fix scalar operations in NDArray (#165) * Fixed string conversion bug * Smaller eps for Float16 * Changed rand_tensors in julian way --- src/ndarray.jl | 12 +++- test/unittest/ndarray.jl | 133 +++++++++++++++++++++++++++++++-------- 2 
files changed, 119 insertions(+), 26 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index f32180a95e9c..6d19903b73cf 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -928,6 +928,16 @@ end ACCEPT_EMPTY_MUTATE_TARGET = (1 << 2) ) +function _julia_to_mx_param(val :: Any) + string(val) +end +function _julia_to_mx_param(val :: Float16) + string(val) +end +function _julia_to_mx_param(val :: Real) + @sprintf("%e", val) +end + # Import corresponding math functions from base so the automatically defined libmxnet # functions can overload them import Base: sqrt @@ -999,7 +1009,7 @@ function _get_ndarray_function_def(name :: String) num_outputs_p = [convert(Cint, num_outputs)] kw_keys_str = String[string(x[1]) for x in kwargs] - kw_vals_str = String[string(x[2]) for x in kwargs] + kw_vals_str = String[_julia_to_mx_param(x[2]) for x in kwargs] #op_handle = _get_cached_libmx_op_handle($(QuoteNode(name))) op_handle = _get_cached_libmx_op_handle($(name)) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index abc8d646fc7a..5b555b7d1adc 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -7,8 +7,9 @@ using ..Main: rand_dims, reldiff ################################################################################ # Test Implementations ################################################################################ -function rand_tensors{N}(dims::NTuple{N, Int}) - tensor = rand(mx.MX_float, dims) +rand_tensors{N}(dims::NTuple{N, Int}) = rand_tensors(mx.MX_float, dims) +function rand_tensors{N, T}(::Type{T}, dims::NTuple{N, Int}) + tensor = rand(T, dims) array = copy(tensor, mx.cpu()) return (tensor, array) end @@ -80,53 +81,99 @@ function test_plus() t1, a1 = rand_tensors(dims) t2, a2 = rand_tensors(dims) t3, a3 = rand_tensors(dims) + thresh = 1e-6 info("NDArray::plus::dims = $dims") - @test reldiff(t1+t2, copy(a1+a2)) < 1e-6 - @test reldiff(t1.+t2, copy(a1.+a2)) < 1e-6 + @test reldiff(t1+t2, copy(a1+a2)) < thresh + @test 
reldiff(t1.+t2, copy(a1.+a2)) < thresh - @test reldiff(t1+t2+t3, copy(a1+a2+a3)) < 1e-6 + @test reldiff(t1+t2+t3, copy(a1+a2+a3)) < thresh # test inplace += operation a0 = a1 # keep a reference to a1 @mx.inplace a1 += a2 # perform inplace += @test a0 == a1 # make sure they are still the same object - @test reldiff(copy(a0), copy(a1)) < 1e-6 - @test reldiff(copy(a1), t1+t2) < 1e-6 + @test reldiff(copy(a0), copy(a1)) < thresh + @test reldiff(copy(a1), t1+t2) < thresh # test scalar scalar = rand() - @test reldiff(t3 + scalar, copy(a3 + scalar)) < 1e-6 - @test reldiff(t2+scalar+t3, copy(a2+scalar+a3)) < 1e-6 + @test reldiff(t3 + scalar, copy(a3 + scalar)) < thresh + @test reldiff(t2+scalar+t3, copy(a2+scalar+a3)) < thresh + + # test small and large scalar + t4 = zeros(Float32, dims) + a4 = copy(t4, mx.cpu()) + scalar_small = 1e-8 + scalar_large = 1e8 + @test reldiff(t4 + scalar_small, copy(a4 .+ scalar_small)) < thresh + @test reldiff(t4 + scalar_large, copy(a4 .+ scalar_large)) < thresh + + t5 = zeros(Float64, dims) + a5 = copy(t5, mx.cpu()) + scalar_small = 1e-8 + scalar_large = 1e8 + @test reldiff(t5 + scalar_small, copy(a5 .+ scalar_small)) < thresh + @test reldiff(t5 + scalar_large, copy(a5 .+ scalar_large)) < thresh + + t6 = zeros(Float16, dims) + a6 = copy(t6, mx.cpu()) + scalar_small = Float16(1e-5) + scalar_large = Float16(1e4) + @test reldiff(t6 + scalar_small, copy(a6 .+ scalar_small)) < 1e-2 + @test reldiff(t6 + scalar_large, copy(a6 .+ scalar_large)) < 1e-2 end function test_minus() dims = rand_dims() t1, a1 = rand_tensors(dims) t2, a2 = rand_tensors(dims) + thresh = 1e-6 info("NDArray::minus::dims = $dims") - @test reldiff(t1-t2, copy(a1-a2)) < 1e-6 - @test reldiff(t1.-t2, copy(a1.-a2)) < 1e-6 + @test reldiff(t1-t2, copy(a1-a2)) < thresh + @test reldiff(t1.-t2, copy(a1.-a2)) < thresh - @test reldiff(-t1, copy(-a1)) < 1e-6 + @test reldiff(-t1, copy(-a1)) < thresh # make sure the negation is not in-place, so a1 is not changed after previous # statement is 
executed - @test reldiff(t1, copy(a1)) < 1e-6 + @test reldiff(t1, copy(a1)) < thresh # test inplace -= operation a0 = a1 # keep a reference to a1 @mx.inplace a1 -= a2 # perform inplace -= @test a0 == a1 # make sure they are still the same object - @test reldiff(copy(a0), copy(a1)) < 1e-6 - @test reldiff(copy(a1), t1-t2) < 1e-6 + @test reldiff(copy(a0), copy(a1)) < thresh + @test reldiff(copy(a1), t1-t2) < thresh # test scalar scalar = rand() - @test reldiff(t2 - scalar, copy(a2 - scalar)) < 1e-6 + @test reldiff(t2 - scalar, copy(a2 - scalar)) < thresh + + # test small and large scalar + t4 = zeros(Float32, dims) + a4 = copy(t4, mx.cpu()) + scalar_small = 1e-8 + scalar_large = 1e8 + @test reldiff(t4 - scalar_small, copy(a4 .- scalar_small)) < thresh + @test reldiff(t4 - scalar_large, copy(a4 .- scalar_large)) < thresh + + t5 = zeros(Float64, dims) + a5 = copy(t5, mx.cpu()) + scalar_small = 1e-8 + scalar_large = 1e8 + @test reldiff(t5 - scalar_small, copy(a5 .- scalar_small)) < thresh + @test reldiff(t5 - scalar_large, copy(a5 .- scalar_large)) < thresh + + t6 = zeros(Float16, dims) + a6 = copy(t6, mx.cpu()) + scalar_small = Float16(1e-5) + scalar_large = Float16(1e4) + @test reldiff(t6 - scalar_small, copy(a6 .- scalar_small)) < 1e-2 + @test reldiff(t6 - scalar_large, copy(a6 .- scalar_large)) < 1e-2 end function test_mul() @@ -134,44 +181,80 @@ function test_mul() t1, a1 = rand_tensors(dims) t2, a2 = rand_tensors(dims) t3, a3 = rand_tensors(dims) + thresh = 1e-6 info("NDArray::mul::dims = $dims") - @test reldiff(t1.*t2, copy(a1.*a2)) < 1e-6 + @test reldiff(t1.*t2, copy(a1.*a2)) < thresh # test inplace .*= operation a0 = a1 # keep a reference to a1 @mx.inplace a1 .*= a2 # perform inplace .*= @test a0 == a1 # make sure they are still the same object - @test reldiff(copy(a0), copy(a1)) < 1e-6 - @test reldiff(copy(a1), t1.*t2) < 1e-6 + @test reldiff(copy(a0), copy(a1)) < thresh + @test reldiff(copy(a1), t1.*t2) < thresh # test scalar - scalar = rand() - @test 
reldiff(t3 * scalar, copy(a3 .* scalar)) < 1e-6 + scalar = mx.MX_float(rand()) + @test reldiff(t3 * scalar, copy(a3 .* scalar)) < thresh + + # test small and large scalar + t4, a4 = rand_tensors(Float32, dims) + scalar_small = 1e-8 + scalar_large = 1e8 + @test reldiff(t4 * scalar_small, copy(a4 .* scalar_small)) < thresh + @test reldiff(t4 * scalar_large, copy(a4 .* scalar_large)) < thresh + + t5, a5 = rand_tensors(Float64, dims) + scalar_small = 1e-8 + scalar_large = 1e8 + @test reldiff(t5 * scalar_small, copy(a5 .* scalar_small)) < thresh + @test reldiff(t5 * scalar_large, copy(a5 .* scalar_large)) < thresh + + t6, a6 = rand_tensors(Float16, dims) + scalar_small = Float16(1e-5) + @test reldiff(t6 * scalar_small, copy(a6 .* scalar_small)) < 1e-2 end function test_div() dims = rand_dims() t1, a1 = rand_tensors(dims) t2, a2 = rand_tensors(dims) + thresh = 1e-6 info("NDArray::div::dims = $dims") t2 .+= 2 # avoid numerical instability @mx.inplace a2 .+= 2 - @test reldiff(t1 ./ t2, copy(a1 ./ a2)) < 1e-6 + @test reldiff(t1 ./ t2, copy(a1 ./ a2)) < thresh # test inplace -= operation a0 = a1 # keep a reference to a2 @mx.inplace a1 ./= a2 # perform inplace ./= @test a0 == a1 # make sure they are still the same object - @test reldiff(copy(a0), copy(a1)) < 1e-6 - @test reldiff(copy(a1), t1 ./ t2) < 1e-6 + @test reldiff(copy(a0), copy(a1)) < thresh + @test reldiff(copy(a1), t1 ./ t2) < thresh # test scalar scalar = rand() + 2 - @test reldiff(t2./scalar, copy(a2./scalar)) < 1e-6 + @test reldiff(t2./scalar, copy(a2./scalar)) < thresh + + # test small and large scalar + t4, a4 = rand_tensors(Float32, dims) + scalar_small = 1e-8 + scalar_large = 1e8 + @test reldiff(t4 / scalar_small, copy(a4 ./ scalar_small)) < thresh + @test reldiff(t4 / scalar_large, copy(a4 ./ scalar_large)) < thresh + + t5, a5 = rand_tensors(Float64, dims) + scalar_small = 1e-8 + scalar_large = 1e8 + @test reldiff(t5 / scalar_small, copy(a5 ./ scalar_small)) < thresh + @test reldiff(t5 / scalar_large, 
copy(a5 ./ scalar_large)) < thresh + + t6, a6 = rand_tensors(Float16, dims) + scalar_large = 1e4 + @test reldiff(t6 / scalar_large, copy(a6 ./ scalar_large)) < 1e-2 end function test_gd() From 179daa5deeef7197457b2235ed295ed6f5e76b22 Mon Sep 17 00:00:00 2001 From: Arkoniak Date: Fri, 13 Jan 2017 13:27:59 +0400 Subject: [PATCH 431/630] Fix of bugs in nnvm branch (#169) * Fix build error in travis Another string conversion fix * Fixed JSON and added testsets * Fixed errors in julia 0.4 --- REQUIRE | 1 + deps/build.jl | 1 + src/model.jl | 8 ++--- src/ndarray.jl | 22 +++++++++----- src/symbolic-node.jl | 5 +++- src/util.jl | 4 +-- test/runtests.jl | 19 ++++++++---- test/travis/setup_env.sh | 1 + test/unittest/bind.jl | 11 +++++-- test/unittest/io.jl | 15 +++++++--- test/unittest/kvstore.jl | 15 +++++++--- test/unittest/name.jl | 13 +++++++-- test/unittest/ndarray.jl | 53 +++++++++++++++++++--------------- test/unittest/operator.jl | 12 ++++++-- test/unittest/random.jl | 13 +++++++-- test/unittest/symbolic-node.jl | 27 ++++++++++------- test/unittest/visualize.jl | 12 ++++++-- 17 files changed, 160 insertions(+), 72 deletions(-) diff --git a/REQUIRE b/REQUIRE index d37f975fe665..1ca6bdddd26a 100644 --- a/REQUIRE +++ b/REQUIRE @@ -3,3 +3,4 @@ Compat 0.9.1 Formatting BinDeps JSON +BaseTestNext diff --git a/deps/build.jl b/deps/build.jl index b79940e8c1eb..49ff90b22b08 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -1,4 +1,5 @@ using Compat + ################################################################################ # First try to detect and load existing libmxnet ################################################################################ diff --git a/src/model.jl b/src/model.jl index a892dc886ca3..cc81e20633ad 100644 --- a/src/model.jl +++ b/src/model.jl @@ -384,8 +384,8 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra train_execs = Array(Executor, num_dev) for i = 1:num_dev - data_shapes = Dict([k => 
tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_data(data)]) - label_shapes = Dict([k => tuple(v[1:end-1]...,length(slices[i])) for (k,v) in provide_label(data)]) + data_shapes = Dict(map((x) -> x[1] => tuple(x[2][1:end-1]...,length(slices[i])), provide_data(data))) + label_shapes = Dict(map((x) -> x[1] => tuple(x[2][1:end-1]...,length(slices[i])), provide_label(data))) train_execs[i] = simple_bind(self.arch, self.ctx[i]; grad_req=grad_req, data_shapes..., label_shapes...) dbg_str = mx.debug_str(train_execs[i]) info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[i])) @@ -574,8 +574,8 @@ end function save_checkpoint(sym :: SymbolicNode, arg_params :: Dict{Base.Symbol, NDArray}, aux_params :: Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) save("$prefix-symbol.json", sym) - save_dict = merge(Dict([Symbol("arg:$k") => v for (k,v) in arg_params]), - Dict([Symbol("aux:$k") => v for (k,v) in aux_params])) + save_dict = merge(Dict{Base.Symbol, NDArray}(map((x) -> Symbol("arg:$(x[1])") => x[2], arg_params)), + Dict{Base.Symbol, NDArray}(map((x) -> Symbol("aux:$(x[1])") => x[2], aux_params))) save_filename = format("{1}-{2:04d}.params", prefix, epoch) save(save_filename, save_dict) info("Saved checkpoint to '$save_filename'") diff --git a/src/ndarray.jl b/src/ndarray.jl index 6d19903b73cf..7dd0a59b9ad5 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -931,11 +931,14 @@ end function _julia_to_mx_param(val :: Any) string(val) end -function _julia_to_mx_param(val :: Float16) - string(val) +function _julia_to_mx_param(val :: Float64) + @sprintf("%.16e", val) end -function _julia_to_mx_param(val :: Real) - @sprintf("%e", val) +function _julia_to_mx_param(val :: Float32) + @sprintf("%.8e", val) +end +function _julia_to_mx_param(val :: Float16) + @sprintf("%.4e", val) end # Import corresponding math functions from base so the automatically defined libmxnet @@ -986,6 +989,9 @@ function _get_ndarray_function_def(name :: 
String) end args = collect(args) # tuple to list + if length(args) == 0 + args = MX_handle[] + end # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped # See https://github.com/dmlc/MXNet.jl/issues/55 @@ -1000,9 +1006,11 @@ function _get_ndarray_function_def(name :: String) kwargs = Any[key != :axes ? (key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] end - output_handles = [Base.cconvert(MX_handle, x) for x in output_vars] - if length(output_handles) > 0 - output_handles_pp = [Base.cconvert(Ptr{MX_handle}, output_handles)] + if length(output_vars) > 0 + output_handles = map((x) -> Base.cconvert(MX_handle, x), output_vars) + # XXX: Julia 0.4 has bug: [Array{MX_handle}] == Array{MX_handle} + output_handles_pp = Array{Array{MX_handle}}(1) + output_handles_pp[1] = Base.cconvert(Ptr{MX_handle}, output_handles) else output_handles_pp = [Base.convert(Ptr{MX_handle}, 0)] end diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 1612f0c57771..ad63fe87e30b 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -52,7 +52,7 @@ macro _list_symbol_info(self, func_name) ref_sz = Ref{MX_uint}(0) ref_names = Ref{char_pp}(0) @mxcall($func_name, (MX_handle, Ref{MX_uint}, Ref{char_pp}), - $self, ref_sz, ref_names) + $(esc(self)), ref_sz, ref_names) narg = ref_sz[] names = unsafe_wrap(Array, ref_names[], narg) names = [Symbol(unsafe_wrap(String, x)) for x in names] @@ -493,6 +493,9 @@ end function /(self :: SymbolicNode, arg :: Real) ./(self, arg) end +function /(arg :: Real, self :: SymbolicNode) + _RDivScalar(self, scalar=arg) +end function ./(arg :: Real, self :: SymbolicNode) _RDivScalar(self, scalar=arg) end diff --git a/src/util.jl b/src/util.jl index 11d12e7f9dd2..8e134b05c527 100644 --- a/src/util.jl +++ b/src/util.jl @@ -15,7 +15,7 @@ function get_mnist_ubyte() :train_label => "train-labels-idx1-ubyte", :test_data => "t10k-images-idx3-ubyte", :test_label => "t10k-labels-idx1-ubyte") - filenames 
= Dict([k => joinpath(mnist_dir, v) for (k,v) in filenames]) + filenames = Dict(map((x) -> x[1] => joinpath(mnist_dir, x[2]), filenames)) if !all(isfile, values(filenames)) cd(mnist_dir) do mnist_dir = download("http://data.dmlc.ml/mxnet/data/mnist.zip", "mnist.zip") @@ -38,7 +38,7 @@ function get_cifar10() cifar10_dir = joinpath(data_dir, "cifar10") mkpath(cifar10_dir) filenames = Dict(:train => "cifar/train.rec", :test => "cifar/test.rec") - filenames = Dict([k => joinpath(cifar10_dir, v) for (k,v) in filenames]) + filenames = Dict(map((x) -> x[1] => joinpath(cifar10_dir, x[2]), filenames)) if !all(isfile, values(filenames)) cd(cifar10_dir) do run(`http://data.dmlc.ml/mxnet/data/cifar10.zip`) diff --git a/test/runtests.jl b/test/runtests.jl index cd9087b7202b..20125bc2b8cf 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -1,5 +1,10 @@ using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end # run test in the whole directory, latest modified files # are run first, this makes waiting time shorter when writing @@ -12,9 +17,13 @@ function test_dir(dir) end include(joinpath(dirname(@__FILE__), "common.jl")) -test_dir(joinpath(dirname(@__FILE__), "unittest")) +@testset "MXNet Test" begin + test_dir(joinpath(dirname(@__FILE__), "unittest")) -# run the basic MNIST mlp example -if haskey(ENV, "CONTINUOUS_INTEGRATION") - include(joinpath(Pkg.dir("MXNet"), "examples", "mnist", "mlp-test.jl")) + # run the basic MNIST mlp example + if haskey(ENV, "CONTINUOUS_INTEGRATION") + @testset "MNIST Test" begin + include(joinpath(Pkg.dir("MXNet"), "examples", "mnist", "mlp-test.jl")) + end + end end diff --git a/test/travis/setup_env.sh b/test/travis/setup_env.sh index 5a33a9e42955..4bae93243949 100755 --- a/test/travis/setup_env.sh +++ b/test/travis/setup_env.sh @@ -15,5 +15,6 @@ if [ ${TRAVIS_OS_NAME} == "linux" ]; then mkdir shadow_bin ln -s `which gcc-4.8` shadow_bin/gcc ln -s `which g++-4.8` 
shadow_bin/g++ + export PATH=$PWD/shadow_bin:$PATH fi diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index c764435d5a9c..592a51a9f101 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -1,6 +1,11 @@ module TestBind using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end using ..Main: rand_dims, reldiff @@ -70,7 +75,9 @@ end ################################################################################ # Run tests ################################################################################ -test_arithmetic() +@testset "Bind Test" begin + test_arithmetic() +end end diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 39e37f1bfe9a..9978ea4ccbce 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -1,6 +1,11 @@ module TestIO using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end using ..Main: rand_dims, reldiff @@ -117,8 +122,10 @@ function test_arrays_shuffle() @test reldiff(data_got, data[:,Int[label_got...]]) < 1e-6 end -test_arrays_shuffle() -test_arrays() -test_mnist() +@testset "IO Test" begin + test_arrays_shuffle() + test_arrays() + test_mnist() +end end diff --git a/test/unittest/kvstore.jl b/test/unittest/kvstore.jl index 2770edf7a259..05f5a9af5a60 100644 --- a/test/unittest/kvstore.jl +++ b/test/unittest/kvstore.jl @@ -1,6 +1,11 @@ module TestKVStore using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end using ..Main: rand_dims @@ -62,8 +67,10 @@ function test_aggregator() end end -test_kv_basic() -test_single_kv_pair() -test_aggregator() +@testset "KVStore Test" begin + test_kv_basic() + test_single_kv_pair() + test_aggregator() +end end diff --git a/test/unittest/name.jl b/test/unittest/name.jl index aca039670286..2df05f10b4f2 100644 --- a/test/unittest/name.jl 
+++ b/test/unittest/name.jl @@ -1,6 +1,11 @@ module TestNameManager using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end function test_default() info("NameManager::default") @@ -25,7 +30,9 @@ function test_prefix() @test get!(prefix_manager, "", name) == Symbol("$prefix$(name)0") end -test_default() -test_prefix() +@testset "Name Test" begin + test_default() + test_prefix() +end end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 5b555b7d1adc..42c8c0de54b6 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -1,6 +1,11 @@ module TestNDArray using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end using ..Main: rand_dims, reldiff @@ -121,8 +126,8 @@ function test_plus() a6 = copy(t6, mx.cpu()) scalar_small = Float16(1e-5) scalar_large = Float16(1e4) - @test reldiff(t6 + scalar_small, copy(a6 .+ scalar_small)) < 1e-2 - @test reldiff(t6 + scalar_large, copy(a6 .+ scalar_large)) < 1e-2 + @test reldiff(t6 + scalar_small, copy(a6 .+ scalar_small)) < 1e-1 + @test reldiff(t6 + scalar_large, copy(a6 .+ scalar_large)) < 1e-1 end function test_minus() @@ -172,8 +177,8 @@ function test_minus() a6 = copy(t6, mx.cpu()) scalar_small = Float16(1e-5) scalar_large = Float16(1e4) - @test reldiff(t6 - scalar_small, copy(a6 .- scalar_small)) < 1e-2 - @test reldiff(t6 - scalar_large, copy(a6 .- scalar_large)) < 1e-2 + @test reldiff(t6 - scalar_small, copy(a6 .- scalar_small)) < 1e-1 + @test reldiff(t6 - scalar_large, copy(a6 .- scalar_large)) < 1e-1 end function test_mul() @@ -213,7 +218,7 @@ function test_mul() t6, a6 = rand_tensors(Float16, dims) scalar_small = Float16(1e-5) - @test reldiff(t6 * scalar_small, copy(a6 .* scalar_small)) < 1e-2 + @test reldiff(t6 * scalar_small, copy(a6 .* scalar_small)) < 1e-1 end function test_div() @@ -254,7 +259,7 @@ function test_div() t6, a6 
= rand_tensors(Float16, dims) scalar_large = 1e4 - @test reldiff(t6 / scalar_large, copy(a6 ./ scalar_large)) < 1e-2 + @test reldiff(t6 / scalar_large, copy(a6 ./ scalar_large)) < 1e-1 end function test_gd() @@ -300,7 +305,7 @@ function test_saveload() # save and load dictionary of ndarrays names = [Symbol("array$i") for i = 1:n_arrays] - dict = Dict([n => v for (n,v) in zip(names, nd_arrays)]) + dict = Dict([(n, v) for (n,v) in zip(names, nd_arrays)]) mx.save(fname, dict) data = mx.load(fname, mx.NDArray) @test isa(data, Dict{Symbol, mx.NDArray}) @@ -397,20 +402,22 @@ end ################################################################################ # Run tests ################################################################################ -test_assign() -test_copy() -test_slice() -test_plus() -test_minus() -test_mul() -test_div() -test_gd() -test_saveload() -test_clip() -test_sqrt() -test_eltype() -test_nd_as_jl() -test_dot() -test_kwargs() +@testset "NDArray Test" begin + test_assign() + test_copy() + test_slice() + test_plus() + test_minus() + test_mul() + test_div() + test_gd() + test_saveload() + test_clip() + test_sqrt() + test_eltype() + test_nd_as_jl() + test_dot() + test_kwargs() +end end diff --git a/test/unittest/operator.jl b/test/unittest/operator.jl index f4332582428c..e06d87e55c8f 100644 --- a/test/unittest/operator.jl +++ b/test/unittest/operator.jl @@ -1,6 +1,11 @@ module TestOperator using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end using ..Main: rand_dims, reldiff @@ -31,6 +36,9 @@ end ################################################################################ # Run tests ################################################################################ -test_scalar_op() + +@testset "Operator Test" begin + test_scalar_op() +end end diff --git a/test/unittest/random.jl b/test/unittest/random.jl index 5328aff26906..ac023d7226c9 100644 --- 
a/test/unittest/random.jl +++ b/test/unittest/random.jl @@ -1,6 +1,11 @@ module TestRandom using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end function test_uniform() dims = (100, 100, 2) @@ -37,7 +42,9 @@ function test_gaussian() @test abs(std(copy(ret1)) - σ) < 0.1 end -test_uniform() -test_gaussian() +@testset "Random Test" begin + test_uniform() + test_gaussian() +end end diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index ca2986d4a377..423a4c06e74e 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -1,6 +1,11 @@ module TestSymbolicNode using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end using ..Main: mlp2, reldiff @@ -128,14 +133,16 @@ end ################################################################################ # Run tests ################################################################################ -test_basic() -test_internal() -test_compose() -test_infer_shape() -test_infer_shape_error() -test_saveload() -test_attrs() -test_functions() -test_dot() +@testset "SymbolicNode Test" begin + test_basic() + test_internal() + test_compose() + test_infer_shape() + test_infer_shape_error() + test_saveload() + test_attrs() + test_functions() + test_dot() +end end diff --git a/test/unittest/visualize.jl b/test/unittest/visualize.jl index 973c2b7034d0..f8b9f2164aba 100644 --- a/test/unittest/visualize.jl +++ b/test/unittest/visualize.jl @@ -1,6 +1,11 @@ module TestVisualize using MXNet -using Base.Test +if VERSION ≥ v"0.5.0-dev+7720" + using Base.Test +else + using BaseTestNext + const Test = BaseTestNext +end using ..Main: mlp2 @@ -30,5 +35,8 @@ end ################################################################################ # Run tests ################################################################################ 
-test_basic() + +@testset "Visualize Test" begin + test_basic() +end end From 030990a155fab5c1e36075800f144f72c3424901 Mon Sep 17 00:00:00 2001 From: Spencer Lyon Date: Sun, 15 Jan 2017 08:38:44 -0500 Subject: [PATCH 432/630] BUG: fix two small mistakes with verbosity control (#168) --- src/model.jl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/model.jl b/src/model.jl index 98a1a21a216f..3b38cf3193f2 100644 --- a/src/model.jl +++ b/src/model.jl @@ -522,7 +522,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra time_stop = time() metric = get(opts.eval_metric) - opts.verbosity >= 2 && info(format("== Epoch {1:0>3d}/{1:0>3d} ==========", i_epoch, opts.n_epoch)) + opts.verbosity >= 2 && info(format("== Epoch {1:0>3d}/{2:0>3d} ==========", i_epoch, opts.n_epoch)) if opts.verbosity >= 3 info("## Training summary") for (name, value) in metric @@ -579,6 +579,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end # end of all epochs opts.verbosity >= 1 && info("Finish training on $(self.ctx)") + nothing end function save_checkpoint(self :: FeedForward, prefix :: AbstractString, state :: OptimizationState) From 22a3c725747a4580a19b00217e869d390757d9ea Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Mon, 16 Jan 2017 14:12:05 +0800 Subject: [PATCH 433/630] Drop support for v0.4 and Deprecations for v0.6 (#171) * Fix deprecation warning on v0.6 * drop support for v0.4 --- .travis.yml | 1 - REQUIRE | 3 +-- src/base.jl | 12 ++++++------ src/io.jl | 4 ++-- src/kvstore.jl | 2 +- src/ndarray.jl | 2 +- src/symbolic-node.jl | 6 +++--- src/visualize.jl | 2 +- test/common.jl | 4 ++-- test/unittest/kvstore.jl | 4 ++-- test/unittest/metric.jl | 6 +++++- test/unittest/ndarray.jl | 4 ++-- 12 files changed, 26 insertions(+), 24 deletions(-) diff --git a/.travis.yml b/.travis.yml index 284ca4b422ae..571644e7773b 100644 --- a/.travis.yml +++ b/.travis.yml @@ -5,7 +5,6 @@ os: - linux - osx 
julia: - - 0.4 - 0.5 - nightly diff --git a/REQUIRE b/REQUIRE index 1ca6bdddd26a..7812bc91c571 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,6 +1,5 @@ -julia 0.4 +julia 0.5 Compat 0.9.1 Formatting BinDeps JSON -BaseTestNext diff --git a/src/base.jl b/src/base.jl index 588b777177bf..d34639e0516d 100644 --- a/src/base.jl +++ b/src/base.jl @@ -208,11 +208,11 @@ function _defstruct_impl(is_immutable, name, fields) name = esc(name.args[1]) end - field_defs = Array(Expr, length(fields)) # :(field2 :: Int) - field_names = Array(Expr, length(fields)) # :field2 - field_defaults = Array(Expr, length(fields)) # :(field2 = 0) - field_types = Array(Expr, length(fields)) # Int - field_asserts = Array(Expr, length(fields)) # :(field2 >= 0) + field_defs = Vector{Expr}(length(fields)) # :(field2 :: Int) + field_names = Vector{Expr}(length(fields)) # :field2 + field_defaults = Vector{Expr}(length(fields)) # :(field2 = 0) + field_types = Vector{Expr}(length(fields)) # Int + field_asserts = Vector{Expr}(length(fields)) # :(field2 >= 0) required_field = Symbol[] for i = 1:length(fields) @@ -249,7 +249,7 @@ function _defstruct_impl(is_immutable, name, fields) f_name, f_type = param :($f_name = convert($f_type, $f_name)) end - asserts = map(filter(i -> isdefined(field_asserts,i), 1:length(fields))) do i + asserts = map(filter(i -> isassigned(field_asserts,i), 1:length(fields))) do i :(@assert($(field_asserts[i]))) end construct = Expr(:call, name, field_names...) 
diff --git a/src/io.jl b/src/io.jl index da3ba52cecff..f65314e67c71 100644 --- a/src/io.jl +++ b/src/io.jl @@ -537,7 +537,7 @@ function _get_iter_name(hdr :: MX_handle) (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) - return Symbol(unsafe_wrap(String, ref_name[])) + return Symbol(unsafe_string(ref_name[])) end const _iter_creator_cache = Dict{Symbol, MX_handle}() @@ -564,7 +564,7 @@ function _define_data_iter_creator(hdr :: MX_handle) (MX_handle, Ref{char_p}, Ref{char_p}, Ref{MX_uint}, Ref{char_pp}, Ref{char_pp}, Ref{char_pp}), hdr, ref_name, ref_desc, ref_narg, ref_arg_names, ref_arg_types, ref_arg_descs) - iter_name = Symbol(unsafe_wrap(String, ref_name[])) + iter_name = Symbol(unsafe_string(ref_name[])) isprovider = endswith(string(iter_name), "Iter") signature = _format_signature(Int(ref_narg[]), ref_arg_names) diff --git a/src/kvstore.jl b/src/kvstore.jl index 03da58197d70..a1d835f8a6c2 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -87,7 +87,7 @@ end function get_type(self :: KVStore) type_ref = Ref{char_p}(0) @mxcall(:MXKVStoreGetType, (MX_handle, Ref{char_p}), self, type_ref) - return Symbol(unsafe_wrap(String, type_ref[])) + return Symbol(unsafe_string(type_ref[])) end function get_num_workers(self :: KVStore) diff --git a/src/ndarray.jl b/src/ndarray.jl index 7dd0a59b9ad5..d37b321a2d8a 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -882,7 +882,7 @@ function load(filename::AbstractString, ::Type{NDArray}) return [NDArray(MX_NDArrayHandle(hdr)) for hdr in unsafe_wrap(Array, out_hdrs[], out_size)] else @assert out_size == out_name_size - return Dict([(Symbol(unsafe_wrap(String, k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in + return Dict([(Symbol(unsafe_string(k)), NDArray(MX_NDArrayHandle(hdr))) for (k,hdr) in zip(unsafe_wrap(Array, out_names[], out_size), unsafe_wrap(Array, out_hdrs[], out_size))]) end end diff 
--git a/src/symbolic-node.jl b/src/symbolic-node.jl index ad63fe87e30b..f5a518c35e56 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -55,7 +55,7 @@ macro _list_symbol_info(self, func_name) $(esc(self)), ref_sz, ref_names) narg = ref_sz[] names = unsafe_wrap(Array, ref_names[], narg) - names = [Symbol(unsafe_wrap(String, x)) for x in names] + names = [Symbol(unsafe_string(x)) for x in names] return names end end @@ -151,7 +151,7 @@ function list_attr(self :: SymbolicNode) strings = unsafe_wrap(Array, ref_strings[], narg) out = Dict{Symbol, String}() for i in 1:2:narg - key = Symbol(unsafe_wrap(String, strings[i])) + key = Symbol(unsafe_string(strings[i])) value = unsafe_string(strings[i+1]) # Creates a copy of string out[key] = value end @@ -174,7 +174,7 @@ function list_all_attr(self :: SymbolicNode) strings = unsafe_wrap(Array, ref_strings[], narg) out = Dict{Symbol, String}() for i in 1:2:narg - key = Symbol(unsafe_wrap(String, strings[i])) + key = Symbol(unsafe_string(strings[i])) value = unsafe_string(strings[i+1]) out[key] = value end diff --git a/src/visualize.jl b/src/visualize.jl index 42d31a22d69e..f7dfca859432 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -136,7 +136,7 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp end println(io, "}") - return takebuf_string(io) + return String(take!(io)) end function _format_graphviz_attr(io::IOBuffer, attrs) diff --git a/test/common.jl b/test/common.jl index a394acf95a93..7f7cd3cb78ea 100644 --- a/test/common.jl +++ b/test/common.jl @@ -2,8 +2,8 @@ # Common models used in testing ################################################################################ function reldiff(a, b) - diff = sum(abs(a - b)) - norm = sum(abs(a)) + diff = sum(abs.(a .- b)) + norm = sum(abs.(a)) return diff / (norm + 1e-10) end diff --git a/test/unittest/kvstore.jl b/test/unittest/kvstore.jl index 05f5a9af5a60..15b3f8c2c42c 100644 --- a/test/unittest/kvstore.jl +++ 
b/test/unittest/kvstore.jl @@ -37,7 +37,7 @@ function test_single_kv_pair() mx.push!(kv, 3, mx.ones(SHAPE)) val = mx.empty(SHAPE) mx.pull!(kv, 3, val) - @test maximum(abs(copy(val) - 1)) == 0 + @test maximum(abs.(copy(val) .- 1)) == 0 end function test_aggregator() @@ -52,7 +52,7 @@ function test_aggregator() mx.push!(kv, 3, vals) mx.pull!(kv, 3, vals) for v in vals - @test maximum(abs(copy(v)) - num_devs) == 0 + @test maximum(abs.(copy(v)) - num_devs) == 0 end # list diff --git a/test/unittest/metric.jl b/test/unittest/metric.jl index f0a79d6ce994..fd36d4ffc7f8 100644 --- a/test/unittest/metric.jl +++ b/test/unittest/metric.jl @@ -49,7 +49,11 @@ function test_ace() metric = mx.ACE() # For categorical variables, ACE == -LL mx._update_single_output(metric, mx.NDArray(labels), mx.NDArray(probs)) LL_v2 = metric.ace_sum / metric.n_sample - @test_approx_eq_eps LL LL_v2 1e-12 + @static if VERSION >= v"0.6.0-dev.2075" + @test LL ≈ LL_v2 atol=1e-12 + else + @test_approx_eq_eps LL LL_v2 1e-12 + end end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 42c8c0de54b6..9b96861e0006 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -322,7 +322,7 @@ function test_clip() info("NDArray::clip::dims = $dims") j_array, nd_array = rand_tensors(dims) - clip_up = maximum(abs(j_array)) / 2 + clip_up = maximum(abs.(j_array)) / 2 clip_down = 0 clipped = mx.clip(nd_array, a_min=clip_down, a_max=clip_up) @@ -338,7 +338,7 @@ function test_sqrt() j_array, nd_array = rand_tensors(dims) sqrt_ed = sqrt(nd_array) - @test reldiff(copy(sqrt_ed), sqrt(j_array)) < 1e-6 + @test reldiff(copy(sqrt_ed), sqrt.(j_array)) < 1e-6 end function test_nd_as_jl() From 2a66ea3242203c549f156f3650db208189a0418e Mon Sep 17 00:00:00 2001 From: mdpradeep Date: Fri, 20 Jan 2017 18:30:14 +0530 Subject: [PATCH 434/630] Update build.jl (#174) --- deps/build.jl | 17 ++++++++++++----- 1 file changed, 12 insertions(+), 5 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 
37ce0c7b862d..fece3065fe4d 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -24,11 +24,18 @@ if !libmxnet_detected ################################################################################ # If not found, try to build automatically using BinDeps ################################################################################ - if is_windows() - info("Please follow the libmxnet documentation on how to build manually") - info("or to install pre-build packages:") - info("http://mxnet.readthedocs.io/en/latest/how_to/build.html#building-on-windows") - error("Automatic building libxmnet on Windows is currently not supported yet.") + if is_windows() + DOWNLOAD_URL = "https://github.com/dmlc/mxnet/releases/download/20160531/20160531_win10_x64_cpu.7z" + run(download_cmd(DOWNLOAD_URL, "mxnet.7z")) + run(`7z x mxnet.7z -y -ousr`) + run(`usr\\setupenv.cmd`) + run(`cmd /c copy "usr\\3rdparty\\openblas\\bin\\*.dll" "usr\\lib"`) + + DOWNLOAD_URL = "https://github.com/yajiedesign/mxnet/releases/download/20161125/20161125_mxnet_x64_cpu.7z" + run(download_cmd(DOWNLOAD_URL, "mxnet.7z")) + run(`7z x mxnet.7z -y -ousr`) + + return end blas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) From 3ad5819b5202d444b33e521a2430b20222b3305b Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 26 Jan 2017 17:28:43 +0900 Subject: [PATCH 435/630] update NEWS.md --- NEWS.md | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/NEWS.md b/NEWS.md index 2d0ec817ce39..f4fb93004db8 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,9 @@ +# v0.2.0 (2017.01.26) +* Drop support for Julia v0.4. +* Added support for NVVM. +* Updated supported version of MXNet to 0.9.3. +* New optimizers (@Arkoniak). + # v0.1.0 (2016.09.08) * Track specific libmxnet version for each release. 
From 8d044b160da4377f117860496861936677d2bcba Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 Jan 2017 14:33:02 +0900 Subject: [PATCH 436/630] refactor windows support --- deps/build.jl | 42 +++++++++++++++++++++++++++++------------- 1 file changed, 29 insertions(+), 13 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index fece3065fe4d..3ef676e8a667 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -1,10 +1,12 @@ using Compat +import JSON ################################################################################ # First try to detect and load existing libmxnet ################################################################################ libmxnet_detected = false libmxnet_curr_ver = "master" +curr_win = "20161125" if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") @@ -18,25 +20,39 @@ if haskey(ENV, "MXNET_HOME") end end + + using BinDeps @BinDeps.setup if !libmxnet_detected + if is_windows() + # TODO: Detect GPU support on Windows + info("Downloading pre-built CPU packages for Windows.") + base_url = "https://github.com/dmlc/mxnet/releases/download/20160531/20160531_win10_x64_cpu.7z" + if libmxnet_curr_ver == "master" + # download_cmd uses powershell 2, but we need powershell 3 to do this + ps_wget(url, file) = run(`powershell -NoProfile -Command "wget \"$url\" -o \"$file\""`) + ps_wget("https://api.github.com/repos/yajiedesign/mxnet/releases/latest", "mxnet.json") + curr_win = JSON.parsefile("mxnet.json")["tag_name"] + info("Can't use MXNet master on Windows, using latest binaries from $curr_win.") + end + # TODO: Get url from JSON. 
+ package_url = "https://github.com/yajiedesign/mxnet/releases/download/$(curr_win)/$(curr_win)_mxnet_x64_vc12_cpu.7z" + + run(download_cmd(base_url, "mxnet_base.7z")) + run(`7z x mxnet_base.7z -y -ousr`) + run(`usr\\setupenv.cmd`) + run(`cmd /c copy "usr\\3rdparty\\openblas\\bin\\*.dll" "usr\\lib"`) + + run(download_cmd(package_url, "mxnet.7z")) + run(`7z x mxnet.7z -y -ousr`) + + return + end + ################################################################################ # If not found, try to build automatically using BinDeps ################################################################################ - if is_windows() - DOWNLOAD_URL = "https://github.com/dmlc/mxnet/releases/download/20160531/20160531_win10_x64_cpu.7z" - run(download_cmd(DOWNLOAD_URL, "mxnet.7z")) - run(`7z x mxnet.7z -y -ousr`) - run(`usr\\setupenv.cmd`) - run(`cmd /c copy "usr\\3rdparty\\openblas\\bin\\*.dll" "usr\\lib"`) - - DOWNLOAD_URL = "https://github.com/yajiedesign/mxnet/releases/download/20161125/20161125_mxnet_x64_cpu.7z" - run(download_cmd(DOWNLOAD_URL, "mxnet.7z")) - run(`7z x mxnet.7z -y -ousr`) - - return - end blas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) From b039771b87aa6817697cc95c3f75032befe99f24 Mon Sep 17 00:00:00 2001 From: Harsha Byadarahalli Mahesh Date: Fri, 27 Jan 2017 15:47:56 +0530 Subject: [PATCH 437/630] Using WebRequest function to download the JSON file wget was failing to download mxnet.json , so replaced them with Invoke-WebRequest --- deps/build.jl | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 3ef676e8a667..4fe217056a4e 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -31,8 +31,7 @@ if !libmxnet_detected base_url = "https://github.com/dmlc/mxnet/releases/download/20160531/20160531_win10_x64_cpu.7z" if libmxnet_curr_ver == "master" # download_cmd uses powershell 2, but we need powershell 3 to do this - ps_wget(url, file) = run(`powershell -NoProfile -Command "wget \"$url\" -o 
\"$file\""`) - ps_wget("https://api.github.com/repos/yajiedesign/mxnet/releases/latest", "mxnet.json") + run(`powershell -NoProfile -Command Invoke-WebRequest -Uri "https://api.github.com/repos/yajiedesign/mxnet/releases/latest" -OutFile "mxnet.json"`) curr_win = JSON.parsefile("mxnet.json")["tag_name"] info("Can't use MXNet master on Windows, using latest binaries from $curr_win.") end From 6335ecac3ece7c78d401a655ee483a7ae4abe535 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 Jan 2017 19:20:23 +0900 Subject: [PATCH 438/630] fix vectorized abs deprecation --- test/unittest/kvstore.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/test/unittest/kvstore.jl b/test/unittest/kvstore.jl index 15b3f8c2c42c..9b7b0a4e4bb4 100644 --- a/test/unittest/kvstore.jl +++ b/test/unittest/kvstore.jl @@ -62,7 +62,7 @@ function test_aggregator() for vv in vals for v in vv - @test maximum(abs(copy(v)) - 2num_devs) == 0 + @test maximum(abs.(copy(v)) - 2 * num_devs) == 0 end end end From d9f9551754c33a42596140e07b2c891cf17d87e3 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 Jan 2017 19:24:27 +0900 Subject: [PATCH 439/630] don't include code from within a function --- examples/mnist/mlp-test.jl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index a88ba3772fb0..c282c1dead1d 100644 --- a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -5,6 +5,8 @@ module MNISTTest using MXNet using Base.Test +include("mnist-data.jl") + function get_mnist_mlp() mlp = @mx.chain mx.Variable(:data) => mx.FullyConnected(name=:fc1, num_hidden=128) => @@ -17,7 +19,6 @@ function get_mnist_mlp() end function get_mnist_data(batch_size=100) - include("mnist-data.jl") return get_mnist_providers(batch_size) end From a6968a6b26ab0c4a5321ae73410ff2460ff192b6 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 Jan 2017 19:31:23 +0900 Subject: [PATCH 440/630] deprecation of 
filter and Array creation --- src/MXNet.jl | 4 ++++ src/model.jl | 2 +- 2 files changed, 5 insertions(+), 1 deletion(-) diff --git a/src/MXNet.jl b/src/MXNet.jl index b9de52a58bf8..892cc4e95163 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -11,6 +11,10 @@ using Compat import Compat.String import Compat.view +if VERSION >= v"0.6.0-dev.1024" + import Base.Iterators: filter +end + using Formatting # Functions from base that we can safely extend and that are defined by libmxnet. diff --git a/src/model.jl b/src/model.jl index 3b38cf3193f2..f1f05595533d 100644 --- a/src/model.jl +++ b/src/model.jl @@ -389,7 +389,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra end end - train_execs = Array(Executor, num_dev) + train_execs = Array{Executor}(num_dev) for i = 1:num_dev data_shapes = Dict(map((x) -> x[1] => tuple(x[2][1:end-1]...,length(slices[i])), provide_data(data))) label_shapes = Dict(map((x) -> x[1] => tuple(x[2][1:end-1]...,length(slices[i])), provide_label(data))) From a79d002df3f94d4878d1e4cdfc3308e7b03dee2a Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 Jan 2017 19:33:30 +0900 Subject: [PATCH 441/630] readall deprecation --- examples/char-lstm/seq-data.jl | 2 +- examples/char-lstm/train.jl | 2 +- examples/mnist/mlp-test.jl | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index 1ea93e3b6116..cfcc5a67bb04 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -5,7 +5,7 @@ using MXNet function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; max_vocab=10000) if isfile(vocab_fn) info("Vocabulary already exists, reusing $vocab_fn...") - vocab = Dict{Char,Int}([w => i for (i,w) in enumerate(readall(vocab_fn))]) + vocab = Dict{Char,Int}([w => i for (i,w) in enumerate(readstring(vocab_fn))]) else # count symbol frequency dict = Dict{Char,Int}() diff --git a/examples/char-lstm/train.jl 
b/examples/char-lstm/train.jl index f96fdde1d674..30578603cafc 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -14,7 +14,7 @@ lstm = LSTM(LSTM_N_LAYER, SEQ_LENGTH, DIM_HIDDEN, DIM_EMBED, #--data # load data -text_all = readall(INPUT_FILE) +text_all = readstring(INPUT_FILE) len_train = round(Int, length(text_all)*DATA_TR_RATIO) text_tr = text_all[1:len_train] text_val = text_all[len_train+1:end] diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index c282c1dead1d..2acedd073dfa 100644 --- a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -41,7 +41,7 @@ function mnist_fit_and_predict(optimizer, initializer, n_epoch) end mlp_load = mx.load("$cp_prefix-symbol.json", mx.SymbolicNode) @test mx.to_json(mlp_load) == mx.to_json(mlp) - mlp_load = mx.from_json(readall("$cp_prefix-symbol.json"), mx.SymbolicNode) + mlp_load = mx.from_json(readstring("$cp_prefix-symbol.json"), mx.SymbolicNode) @test mx.to_json(mlp_load) == mx.to_json(mlp) #-------------------------------------------------------------------------------- From a476d3e448fa57ffb84f69b237fa05454af8e5ea Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 27 Jan 2017 19:53:13 +0900 Subject: [PATCH 442/630] MXNet.jl on v0.6 is currently subtlety broken due to broadcasting. 
--- .travis.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.travis.yml b/.travis.yml index 571644e7773b..6c2f33c114a4 100644 --- a/.travis.yml +++ b/.travis.yml @@ -6,7 +6,7 @@ os: - osx julia: - 0.5 - - nightly +# - nightly 0.6 supports depends on #170 # dependent apt packages addons: From fecfcdd146cc561a7742e11883b5c7a141c4d5c9 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 28 Jan 2017 12:17:43 +0900 Subject: [PATCH 443/630] fix use of Symbol in symbolic-node.jl, fixes #189 --- src/symbolic-node.jl | 4 ++-- test/unittest/symbolic-node.jl | 9 +++++++++ 2 files changed, 11 insertions(+), 2 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index f5a518c35e56..c85420939d85 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -627,8 +627,8 @@ function _define_atomic_symbol_creator(name :: String) $(if key_narg != "" quote - if !in(Symbol($key_narg), param_keys) - push!(param_keys, Symbol($key_narg)) + if !in($key_narg, param_keys) + push!(param_keys, $key_narg) push!(param_vals, string(length(args))) end end diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 423a4c06e74e..573f541fbcd6 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -130,6 +130,14 @@ function test_dot() @test reldiff(ret, 2*ones(100, 200)) < 1e-6 end +function test_misc() + info("SymbolicNode::Miscellaneous") + # Test for #189 + a = mx.Variable("a") + b = mx.Variable("b") + symb = mx.ElementWiseSum(a,b) +end + ################################################################################ # Run tests ################################################################################ @@ -143,6 +151,7 @@ end test_attrs() test_functions() test_dot() + test_misc() end end From cac5625596312a5b9cf5628f4e2c7b6f4592059c Mon Sep 17 00:00:00 2001 From: Zac Cranko Date: Wed, 25 Jan 2017 10:13:36 +1100 Subject: [PATCH 444/630] refactor sgd.jl to exploit multiple dispatch --- 
src/optimizers/sgd.jl | 25 ++++++++++++++----------- 1 file changed, 14 insertions(+), 11 deletions(-) diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index 2eda1d0bf67c..cd0b998fbed0 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -49,18 +49,21 @@ function create_state(self :: SGD, index :: Int, weight :: NDArray) end end -function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Union{Void, NDArray}) +function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Void) lr = get_learning_rate(self.opts.lr_scheduler, self.state) grad = normalized_gradient(self.opts, self.state, weight, grad) + + @inplace weight += -lr * grad +end - if isa(state, Void) - # vanilla SGD, without momentum - @inplace weight += -lr * grad - else - mom = state :: NDArray - coef = get_momentum(self.opts.momentum_scheduler, self.state) - @inplace mom .*= coef - @inplace mom .+= -lr * grad - @inplace weight .+= mom - end +# update with momentum +function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: NDArray) + lr = get_learning_rate(self.opts.lr_scheduler, self.state) + grad = normalized_gradient(self.opts, self.state, weight, grad) + + mom = state :: NDArray + coef = get_momentum(self.opts.momentum_scheduler, self.state) + @inplace mom .*= coef + @inplace mom .+= -lr * grad + @inplace weight .+= mom end From d0d79630551693997f4e9475d0c753eae7789061 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 28 Jan 2017 15:26:24 +0900 Subject: [PATCH 445/630] remove BaseTestNext and bump Compat --- REQUIRE | 2 +- test/runtests.jl | 7 +------ test/unittest/bind.jl | 7 +------ test/unittest/io.jl | 7 +------ test/unittest/kvstore.jl | 7 +------ test/unittest/name.jl | 7 +------ test/unittest/ndarray.jl | 7 +------ test/unittest/operator.jl | 7 +------ test/unittest/random.jl | 7 +------ test/unittest/symbolic-node.jl | 7 +------ test/unittest/visualize.jl | 7 +------ 11 files 
changed, 11 insertions(+), 61 deletions(-) diff --git a/REQUIRE b/REQUIRE index 7812bc91c571..8fdfc5fcde96 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,5 +1,5 @@ julia 0.5 -Compat 0.9.1 +Compat 0.9.5 Formatting BinDeps JSON diff --git a/test/runtests.jl b/test/runtests.jl index 20125bc2b8cf..823830b54d0d 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -1,10 +1,5 @@ using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test # run test in the whole directory, latest modified files # are run first, this makes waiting time shorter when writing diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index 592a51a9f101..79f639518487 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -1,11 +1,6 @@ module TestBind using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test using ..Main: rand_dims, reldiff diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 9978ea4ccbce..88d77bd3c16b 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -1,11 +1,6 @@ module TestIO using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test using ..Main: rand_dims, reldiff diff --git a/test/unittest/kvstore.jl b/test/unittest/kvstore.jl index 9b7b0a4e4bb4..cf15f1a65f05 100644 --- a/test/unittest/kvstore.jl +++ b/test/unittest/kvstore.jl @@ -1,11 +1,6 @@ module TestKVStore using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test using ..Main: rand_dims diff --git a/test/unittest/name.jl b/test/unittest/name.jl index 2df05f10b4f2..9287bf087074 100644 --- a/test/unittest/name.jl +++ b/test/unittest/name.jl @@ -1,11 +1,6 @@ module TestNameManager using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const 
Test = BaseTestNext -end +using Base.Test function test_default() info("NameManager::default") diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 9b96861e0006..155f365d6ee8 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -1,11 +1,6 @@ module TestNDArray using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test using ..Main: rand_dims, reldiff diff --git a/test/unittest/operator.jl b/test/unittest/operator.jl index e06d87e55c8f..76e51f4403f5 100644 --- a/test/unittest/operator.jl +++ b/test/unittest/operator.jl @@ -1,11 +1,6 @@ module TestOperator using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test using ..Main: rand_dims, reldiff diff --git a/test/unittest/random.jl b/test/unittest/random.jl index ac023d7226c9..54d651482cd6 100644 --- a/test/unittest/random.jl +++ b/test/unittest/random.jl @@ -1,11 +1,6 @@ module TestRandom using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test function test_uniform() dims = (100, 100, 2) diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 573f541fbcd6..36f125cd728c 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -1,11 +1,6 @@ module TestSymbolicNode using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test using ..Main: mlp2, reldiff diff --git a/test/unittest/visualize.jl b/test/unittest/visualize.jl index f8b9f2164aba..3bdaa12824d2 100644 --- a/test/unittest/visualize.jl +++ b/test/unittest/visualize.jl @@ -1,11 +1,6 @@ module TestVisualize using MXNet -if VERSION ≥ v"0.5.0-dev+7720" - using Base.Test -else - using BaseTestNext - const Test = BaseTestNext -end +using Base.Test using ..Main: 
mlp2 From 0ee926ecfd76f0f066b52205eeca915bcb1c0b60 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sun, 29 Jan 2017 17:58:43 +0900 Subject: [PATCH 446/630] remove usr/setupenv.cmd because it is too invasive --- deps/build.jl | 1 - src/base.jl | 2 +- 2 files changed, 1 insertion(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 4fe217056a4e..7b654d9a9706 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -40,7 +40,6 @@ if !libmxnet_detected run(download_cmd(base_url, "mxnet_base.7z")) run(`7z x mxnet_base.7z -y -ousr`) - run(`usr\\setupenv.cmd`) run(`cmd /c copy "usr\\3rdparty\\openblas\\bin\\*.dll" "usr\\lib"`) run(download_cmd(package_url, "mxnet.7z")) diff --git a/src/base.jl b/src/base.jl index d34639e0516d..183465341f3c 100644 --- a/src/base.jl +++ b/src/base.jl @@ -18,7 +18,7 @@ typealias char_pp Ptr{char_p} ################################################################################ const MXNET_LIB = Libdl.find_library(["libmxnet.so","libmxnet.dll"], [joinpath("$(get(ENV,"MXNET_HOME",""))","lib"), - joinpath(Pkg.dir("MXNet"),"deps/usr/lib")]) + Pkg.dir("MXNet","deps","usr","lib")]) if isempty(MXNET_LIB) # touch this file, so that after the user properly build libmxnet, the precompiled # MXNet.ji will be re-compiled to get MXNET_LIB properly. 
From 75060bc0457499d8d06c226a2a570006d564e200 Mon Sep 17 00:00:00 2001 From: Arkoniak Date: Sun, 5 Feb 2017 17:29:17 +0400 Subject: [PATCH 447/630] Fix for symbolic node (#199) * Fix for symbolic node * wrong indentation * Better condition --- examples/char-lstm/lstm.jl | 40 +++++++++++++++++----------------- examples/char-lstm/sampler.jl | 8 +++---- examples/char-lstm/seq-data.jl | 12 +++++----- src/optimizer.jl | 2 +- src/symbolic-node.jl | 8 ++++--- 5 files changed, 36 insertions(+), 34 deletions(-) diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index e98778b65272..dcd1e6ddb60c 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -26,11 +26,11 @@ function lstm_cell(data::mx.SymbolicNode, prev_state::LSTMState, param::LSTMPara end i2h = mx.FullyConnected(data, weight=param.i2h_W, bias=param.i2h_b, - num_hidden=4num_hidden, name=symbol(name, "_i2h")) + num_hidden=4num_hidden, name=Symbol(name, "_i2h")) h2h = mx.FullyConnected(prev_state.h, weight=param.h2h_W, bias=param.h2h_b, - num_hidden=4num_hidden, name=symbol(name, "_h2h")) + num_hidden=4num_hidden, name=Symbol(name, "_h2h")) - gates = mx.SliceChannel(i2h + h2h, num_outputs=4, name=symbol(name, "_gates")) + gates = mx.SliceChannel(i2h + h2h, num_outputs=4, name=Symbol(name, "_gates")) in_gate = mx.Activation(gates[1], act_type=:sigmoid) in_trans = mx.Activation(gates[2], act_type=:tanh) @@ -49,17 +49,17 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla dropout::Real=0, name::Symbol=gensym(), output_states::Bool=false) # placeholder nodes for all parameters - embed_W = mx.Variable(symbol(name, "_embed_weight")) - pred_W = mx.Variable(symbol(name, "_pred_weight")) - pred_b = mx.Variable(symbol(name, "_pred_bias")) + embed_W = mx.Variable(Symbol(name, "_embed_weight")) + pred_W = mx.Variable(Symbol(name, "_pred_weight")) + pred_b = mx.Variable(Symbol(name, "_pred_bias")) layer_param_states = map(1:n_layer) do i - param = 
LSTMParam(mx.Variable(symbol(name, "_l$(i)_i2h_weight")), - mx.Variable(symbol(name, "_l$(i)_h2h_weight")), - mx.Variable(symbol(name, "_l$(i)_i2h_bias")), - mx.Variable(symbol(name, "_l$(i)_h2h_bias"))) - state = LSTMState(mx.Variable(symbol(name, "_l$(i)_init_c")), - mx.Variable(symbol(name, "_l$(i)_init_h"))) + param = LSTMParam(mx.Variable(Symbol(name, "_l$(i)_i2h_weight")), + mx.Variable(Symbol(name, "_l$(i)_h2h_weight")), + mx.Variable(Symbol(name, "_l$(i)_i2h_bias")), + mx.Variable(Symbol(name, "_l$(i)_h2h_bias"))) + state = LSTMState(mx.Variable(Symbol(name, "_l$(i)_init_c")), + mx.Variable(Symbol(name, "_l$(i)_init_h"))) (param, state) end #... @@ -69,17 +69,17 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla # now unroll over time outputs = mx.SymbolicNode[] for t = 1:seq_len - data = mx.Variable(symbol(name, "_data_$t")) - label = mx.Variable(symbol(name, "_label_$t")) + data = mx.Variable(Symbol(name, "_data_$t")) + label = mx.Variable(Symbol(name, "_label_$t")) hidden = mx.FullyConnected(data, weight=embed_W, num_hidden=dim_embed, - no_bias=true, name=symbol(name, "_embed_$t")) + no_bias=true, name=Symbol(name, "_embed_$t")) # stack LSTM cells for i = 1:n_layer l_param, l_state = layer_param_states[i] dp = i == 1 ? 
0 : dropout # don't do dropout for data next_state = lstm_cell(hidden, l_state, l_param, num_hidden=dim_hidden, dropout=dp, - name=symbol(name, "_lstm_$t")) + name=Symbol(name, "_lstm_$t")) hidden = next_state.h layer_param_states[i] = (l_param, next_state) end @@ -89,8 +89,8 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla hidden = mx.Dropout(hidden, p=dropout) end pred = mx.FullyConnected(hidden, weight=pred_W, bias=pred_b, num_hidden=n_class, - name=symbol(name, "_pred_$t")) - smax = mx.SoftmaxOutput(pred, label, name=symbol(name, "_softmax_$t")) + name=Symbol(name, "_pred_$t")) + smax = mx.SoftmaxOutput(pred, label, name=Symbol(name, "_softmax_$t")) push!(outputs, smax) end #... @@ -100,8 +100,8 @@ function LSTM(n_layer::Int, seq_len::Int, dim_hidden::Int, dim_embed::Int, n_cla # append block-gradient nodes to the final states for i = 1:n_layer l_param, l_state = layer_param_states[i] - final_state = LSTMState(mx.BlockGrad(l_state.c, name=symbol(name, "_l$(i)_last_c")), - mx.BlockGrad(l_state.h, name=symbol(name, "_l$(i)_last_h"))) + final_state = LSTMState(mx.BlockGrad(l_state.c, name=Symbol(name, "_l$(i)_last_c")), + mx.BlockGrad(l_state.h, name=Symbol(name, "_l$(i)_last_h"))) layer_param_states[i] = (l_param, final_state) end diff --git a/examples/char-lstm/sampler.jl b/examples/char-lstm/sampler.jl index 22166b7700c9..ad34f344cbcd 100644 --- a/examples/char-lstm/sampler.jl +++ b/examples/char-lstm/sampler.jl @@ -10,11 +10,11 @@ vocab = build_vocabulary(INPUT_FILE, VOCAB_FILE) n_class = length(vocab) # prepare data provider -jl_data = Pair[(symbol(NAME, "_data_$t") => zeros(mx.MX_float, (length(vocab), BATCH_SIZE_SMP))) +jl_data = Pair[(Symbol(NAME, "_data_$t") => zeros(mx.MX_float, (length(vocab), BATCH_SIZE_SMP))) for t = 1:1] -jl_c = Pair[(symbol(NAME, "_l$(l)_init_c") => zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) +jl_c = Pair[(Symbol(NAME, "_l$(l)_init_c") => zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) for 
l = 1:LSTM_N_LAYER] -jl_h = Pair[(symbol(NAME, "_l$(l)_init_h") => zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) +jl_h = Pair[(Symbol(NAME, "_l$(l)_init_h") => zeros(mx.MX_float, (DIM_HIDDEN, BATCH_SIZE_SMP))) for l = 1:LSTM_N_LAYER] # the first input in the sequence @@ -36,7 +36,7 @@ output_samples = zeros(Char, (SAMPLE_LENGTH, BATCH_SIZE_SMP)) output_samples[1, :] = SAMPLE_START # build inverse vocabulary for convenience -inv_vocab = Dict([v => k for (k,v) in vocab]) +inv_vocab = Dict(v => k for (k,v) in vocab) # do prediction and sampling step by step for t = 2:SAMPLE_LENGTH-1 diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index cfcc5a67bb04..fb7c8378a5f1 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -5,7 +5,7 @@ using MXNet function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; max_vocab=10000) if isfile(vocab_fn) info("Vocabulary already exists, reusing $vocab_fn...") - vocab = Dict{Char,Int}([w => i for (i,w) in enumerate(readstring(vocab_fn))]) + vocab = Dict{Char,Int}(w => i for (i,w) in enumerate(readstring(vocab_fn))) else # count symbol frequency dict = Dict{Char,Int}() @@ -25,7 +25,7 @@ function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; m end end - vocab = Dict([x.first => i for (i,x) in enumerate(vocab)]) + vocab = Dict(x.first => i for (i,x) in enumerate(vocab)) end vocab[UNKNOWN_CHAR] = length(vocab) return vocab @@ -50,12 +50,12 @@ end #--provide function mx.provide_data(p :: CharSeqProvider) - [(symbol(p.prefix, "_data_$t"), (length(p.vocab), p.batch_size)) for t = 1:p.seq_len] ∪ - [(symbol(p.prefix, "_l$(l)_init_c"), (p.dim_hidden, p.batch_size)) for l=1:p.n_layer] ∪ - [(symbol(p.prefix, "_l$(l)_init_h"), (p.dim_hidden, p.batch_size)) for l=1:p.n_layer] + [(Symbol(p.prefix, "_data_$t"), (length(p.vocab), p.batch_size)) for t = 1:p.seq_len] ∪ + [(Symbol(p.prefix, "_l$(l)_init_c"), (p.dim_hidden, p.batch_size)) for 
l=1:p.n_layer] ∪ + [(Symbol(p.prefix, "_l$(l)_init_h"), (p.dim_hidden, p.batch_size)) for l=1:p.n_layer] end function mx.provide_label(p :: CharSeqProvider) - [(symbol(p.prefix, "_label_$t"), (p.batch_size,)) for t = 1:p.seq_len] + [(Symbol(p.prefix, "_label_$t"), (p.batch_size,)) for t = 1:p.seq_len] end #--/provide diff --git a/src/optimizer.jl b/src/optimizer.jl index 66f7d660847a..5e9065b64127 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -259,7 +259,7 @@ function normalized_gradient(opts::AbstractOptimizerOptions, state::Optimization grad = grad_scale * grad if opts.grad_clip > 0 - grad = clip(grad, -opts.grad_clip, opts.grad_clip) + grad = clip(grad, a_min=-opts.grad_clip, a_max=opts.grad_clip) end if opts.weight_decay > 0 @inplace grad += opts.weight_decay * weight diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index c85420939d85..6e421b66d1be 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -650,8 +650,8 @@ function _define_atomic_symbol_creator(name :: String) end end - if length(args) != 0 && length(symbol_kws) != 0 - @assert(false, $name * " only accepts SymbolicNode either as positional or keyword arguments, not both.") + if length(args) > 1 && length(symbol_kws) != 0 + @assert(false, $name * " only accepts SymbolicNode either as positional or keyword arguments with optional positional `data` argument, not both.") end $(if key_narg != "" quote @@ -680,8 +680,10 @@ function _define_atomic_symbol_creator(name :: String) set_attr(node, k, v) end - if length(args) != 0 + if length(symbol_kws) == 0 _compose!(node, name, args...) + elseif length(args) == 1 + _compose!(node; name=name, data=args[1], symbol_kws...) else _compose!(node; name=name, symbol_kws...) 
end From f33f1dc19d7f1b5919f4651ae922c2387b851347 Mon Sep 17 00:00:00 2001 From: Mike J Innes Date: Fri, 24 Feb 2017 00:27:04 +0000 Subject: [PATCH 448/630] get_name (#206) --- src/symbolic-node.jl | 21 +++++++++++++++++++++ test/unittest/symbolic-node.jl | 2 ++ 2 files changed, 23 insertions(+) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 6e421b66d1be..4c73bd33642d 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -199,6 +199,27 @@ function set_attr(self :: SymbolicNode, key :: Symbol, value :: AbstractString) @mxcall(:MXSymbolSetAttr, (MX_handle, Cstring, Cstring), self, key_s, value_s) end +""" + get_name(self :: SymbolicNode) + +Get the name of the symbol. + + julia> x = mx.Variable(:data) + julia> mx.get_name(x) + :data + + julia> y = mx.FullyConnected(x, num_hidden = 128) + julia> mx.get_name(y) + :fullyconnected0 +""" +function get_name(self :: mx.SymbolicNode) + name = Ref{mx.char_p}(0) + success = Ref(0) + @mxcall(:MXSymbolGetName, (MX_handle, Ref{char_p}, Ref{Int}), self.handle.value, name, success) + @assert success[] != -1 + return Symbol(unsafe_wrap(String, name[])) +end + """ grad(self :: SymbolicNode, wrt :: Vector{SymbolicNode}) diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 36f125cd728c..4c8cff8adccc 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -86,6 +86,7 @@ function test_attrs() data = mx.Variable(:data) + @test mx.get_name(data) == :data result = mx.get_attr(data, :test) @test isnull(result) mx.set_attr(data, :test, "1.0") @@ -100,6 +101,7 @@ function test_attrs() @test isnull(mx.get_attr(conv, :b)) @test get(mx.get_attr(conv, :a)) == "a" @test get(mx.get_attr(conv, :π)) == "π" + @test isa(mx.get_name(conv), Symbol) @test_throws MethodError mx.Variable(:data3, attrs = Dict(:test => "1.0", :test2 => 1.0)) @test_throws MethodError mx.Convolution(data2, kernel = (1,1), num_filter = 1, attrs = Dict(:test => "1.0", :test2 => 1.0)) From 
17a544205b22d7092f07690816c000a25e43b0ef Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Tue, 28 Feb 2017 17:34:11 -0500 Subject: [PATCH 449/630] fix data URL error (#204) --- src/util.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/util.jl b/src/util.jl index b41641f68309..6f7dc1ba73ac 100644 --- a/src/util.jl +++ b/src/util.jl @@ -18,7 +18,7 @@ function get_mnist_ubyte() filenames = Dict(map((x) -> x[1] => joinpath(mnist_dir, x[2]), filenames)) if !all(isfile, values(filenames)) cd(mnist_dir) do - mnist_dir = download("http://data.dmlc.ml/mxnet/data/mnist.zip", "mnist.zip") + mnist_dir = download("http://data.mxnet.io/mxnet/data/mnist.zip", "mnist.zip") try run(`unzip -u $mnist_dir`) catch @@ -41,7 +41,7 @@ function get_cifar10() filenames = Dict(map((x) -> x[1] => joinpath(cifar10_dir, x[2]), filenames)) if !all(isfile, values(filenames)) cd(cifar10_dir) do - download("http://data.dmlc.ml/mxnet/data/cifar10.zip", "cifar10.zip") + download("http://data.mxnet.io/mxnet/data/cifar10.zip", "cifar10.zip") try run(`unzip -u cifar10.zip`) catch From c58eb466be4f0794b4860d31a5ce6beb3b8e6afe Mon Sep 17 00:00:00 2001 From: Michael Creel Date: Fri, 3 Mar 2017 23:58:19 +0100 Subject: [PATCH 450/630] fix for issue #207 (#208) --- examples/regression-example.jl | 17 ++++++++--------- 1 file changed, 8 insertions(+), 9 deletions(-) diff --git a/examples/regression-example.jl b/examples/regression-example.jl index 8c949f9b2fac..bf0acb14b2f1 100644 --- a/examples/regression-example.jl +++ b/examples/regression-example.jl @@ -30,17 +30,16 @@ evalprovider = mx.ArrayDataProvider(:data => ValidationInput, batch_size=batchsi # or add/remove a layer data = mx.Variable(:data) label = mx.Variable(:label) -net = @mx.chain mx.FullyConnected(data = data, num_hidden=10) => +net = @mx.chain mx.Variable(:data) => + mx.FullyConnected(num_hidden=10) => mx.Activation(act_type=:tanh) => mx.FullyConnected(num_hidden=3) => mx.Activation(act_type=:tanh) => - 
mx.FullyConnected(num_hidden=1) - -# squared error loss is appropriate for regression, don't change -cost = mx.LinearRegressionOutput(data = net, label=label) + mx.FullyConnected(num_hidden=1) => + mx.LinearRegressionOutput(label) # final model definition, don't change, except if using gpu -model = mx.FeedForward(cost, context=mx.cpu()) +model = mx.FeedForward(net, context=mx.cpu()) # set up the optimizer: select one, explore parameters, if desired #optimizer = mx.SGD(lr=0.01, momentum=0.9, weight_decay=0.00001) @@ -48,11 +47,11 @@ optimizer = mx.ADAM() # train, reporting loss for training and evaluation sets # initial training with small batch size, to get to a good neighborhood -batchsize = 100 -mx.fit(model, optimizer, initializer=mx.NormalInitializer(0.0,0.1), eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 500) +batchsize = 200 +mx.fit(model, optimizer, initializer=mx.NormalInitializer(0.0,0.1), eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 20) # more training with the full sample batchsize = samplesize -mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 500) +mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 20) # obtain predictions plotprovider = mx.ArrayDataProvider(:data => ValidationInput, :label => ValidationOutput) From fa25ad6f4ad1769bd86c3ae9a0c5c3bd050cef5d Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 10 Mar 2017 00:14:39 +0800 Subject: [PATCH 451/630] metric: intro NMSE normalized mean squared error --- src/metric.jl | 41 +++++++++++++++++++++++++++++++++++++++++ 1 file changed, 41 insertions(+) diff --git a/src/metric.jl b/src/metric.jl index dc3c3aef452a..7432657aaa14 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -179,6 +179,47 @@ function reset!(metric :: MSE) metric.n_sample = 0 end +doc""" + NMSE + +Normalized Mean Squared Error + +```math +\sum_i (\frac{label_i - pred_i}{label_i})^2 +``` +""" 
+type NMSE <: AbstractEvalMetric + nmse_sum :: Float64 + n_sample :: Int + + NMSE() = new(0.0, 0) +end + +function _update_single_output(metric :: NMSE, label :: NDArray, pred :: NDArray) + label = copy(label) + pred = copy(pred) + + n_sample = size(pred)[end] + metric.n_sample += n_sample + + for i = 1:n_sample + if label[i] == 0.0f0 # in case of batch padding + continue + end + + metric.nmse_sum += ((label[i] - pred[i]) / label[i])^2 + end +end + +function get(metric :: NMSE) + return [(:NMSE, metric.nmse_sum / metric.n_sample)] +end + +function reset!(metric :: NMSE) + metric.nmse_sum = 0.0 + metric.n_sample = 0 +end + """ ACE From f23b0a9dba5eed903b2f255ff9880c9e6987399c Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 10 Mar 2017 00:15:22 +0800 Subject: [PATCH 452/630] doc: update CDN link of MathJax --- docs/mkdocs.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/mkdocs.yml b/docs/mkdocs.yml index bf604818027e..ed18e479ae37 100644 --- a/docs/mkdocs.yml +++ b/docs/mkdocs.yml @@ -12,7 +12,7 @@ extra_css: - assets/Documenter.css extra_javascript: - - https://cdn.mathjax.org/mathjax/latest/MathJax.jl?config=TeX-AMS-MML_HTMLorMML + - https://cdn.mathjax.org/mathjax/latest/MathJax.js?config=TeX-AMS_HTML - assets/mathjaxhelper.js markdown_extensions: From 96191ea24346816b36c029b1bcd1bcf9dfd25781 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 10 Mar 2017 11:00:11 +0800 Subject: [PATCH 453/630] metric: add test cases for NMSE --- test/unittest/metric.jl | 36 ++++++++++++++++++++++++++++++++++++ 1 file changed, 36 insertions(+) diff --git a/test/unittest/metric.jl b/test/unittest/metric.jl index fd36d4ffc7f8..46b62a243dc1 100644 --- a/test/unittest/metric.jl +++ b/test/unittest/metric.jl @@ -57,10 +57,46 @@ function test_ace() end +function test_nmse() + info("EvalMetric::NMSE") + + @testset "EvalMetric::NMSE::update!" 
begin + metric = mx.NMSE() + labels = Array{mx.NDArray}( + [mx.NDArray([100.0, 0.0]), mx.NDArray([10.0, 0.0])]) + preds = Array{mx.NDArray}( + [mx.NDArray([20.0, 0.0]), mx.NDArray([2.0, 0.0])]) + + mx.update!(metric, labels, preds) + @test metric.nmse_sum ≈ 0.64 * 2 + end + + @testset "EvalMetric::NMSE::reset!" begin + metric = mx.NMSE() + metric.nmse_sum = sum(rand(10)) + metric.n_sample = 42 + + mx.reset!(metric) + + @test metric.nmse_sum == 0.0 + @test metric.n_sample == 0 + end + + @testset "EvalMetric::NMSE::get" begin + metric = mx.NMSE() + metric.nmse_sum = 100.0 + metric.n_sample = 20 + + @test mx.get(metric) == [(:NMSE, 5.0)] + end +end + + ################################################################################ # Run tests ################################################################################ test_ace() +test_nmse() end From ba97d9354af12108ed22cfcdb8a8765ad34d62ae Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 11 Mar 2017 17:43:16 +0800 Subject: [PATCH 454/630] docs: add an explanation for normalized MSE --- src/metric.jl | 38 ++++++++++++++++++++++++++++++++++++++ 1 file changed, 38 insertions(+) diff --git a/src/metric.jl b/src/metric.jl index 7432657aaa14..135fe9fa6994 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -187,6 +187,44 @@ Normalized Mean Squared Error ```math \sum_i (\frac{label_i - pred_i}{label_i})^2 ``` + +Note that there are various ways to do the *normalization*. +It depends on your own context. Please judge the problem setting you have +first. If the current implementation do not suitable for you, +feel free to file it on GitHub. + +Let me show you a use case of this kind of normalization: + +Bob is training a network for option pricing. The option pricing problem is +a regression problem (pirce predicting). There are lots of option contracts +on same target stock but different strike price. +For example, there is a stock `S`; it's market price is 1000. 
+And, there are two call option contracts with different strike price. +Assume Bob obtains the outcome as following table: + +``` ++--------+----------------+----------------+--------------+ +| | Strike Price | Market Price | Pred Price | ++--------+----------------+----------------+--------------+ +| Op 1 | 1500 | 100 | 80 | ++--------+----------------+----------------+--------------+ +| Op 2 | 500 | 10 | 8 | ++--------+----------------+----------------+--------------+ +``` + +Now, obviously, Bob will calculate the normalized MSE as: + +```math + (\frac{100 - 80}{100})^2 + \text{ vs } + (\frac{10 - 8}{10}) ^2 +``` + +Both of the pred prices got the same degree of error. + +For more discussion about normalized MSE, please see +[#211](https://github.com/dmlc/MXNet.jl/pull/211) also. + """ type NMSE <: AbstractEvalMetric nmse_sum :: Float64 From cf7f32b3d750c94f817510ec9437c537183d229e Mon Sep 17 00:00:00 2001 From: Steven Thornton Date: Thu, 9 Mar 2017 11:18:56 -0500 Subject: [PATCH 455/630] Fixed data attribute --- docs/src/tutorial/mnist.md | 26 +++++++++++++------------- 1 file changed, 13 insertions(+), 13 deletions(-) diff --git a/docs/src/tutorial/mnist.md b/docs/src/tutorial/mnist.md index 096d7dd0310f..9b580cfcf38d 100644 --- a/docs/src/tutorial/mnist.md +++ b/docs/src/tutorial/mnist.md @@ -29,14 +29,14 @@ data = mx.Variable(:data) and then cascading fully-connected layers and activation functions: ```julia -fc1 = mx.FullyConnected(data = data, name=:fc1, num_hidden=128) -act1 = mx.Activation(data = fc1, name=:relu1, act_type=:relu) -fc2 = mx.FullyConnected(data = act1, name=:fc2, num_hidden=64) -act2 = mx.Activation(data = fc2, name=:relu2, act_type=:relu) -fc3 = mx.FullyConnected(data = act2, name=:fc3, num_hidden=10) +fc1 = mx.FullyConnected(data, name=:fc1, num_hidden=128) +act1 = mx.Activation(fc1, name=:relu1, act_type=:relu) +fc2 = mx.FullyConnected(act1, name=:fc2, num_hidden=64) +act2 = mx.Activation(fc2, name=:relu2, act_type=:relu) +fc3 = 
mx.FullyConnected(act2, name=:fc3, num_hidden=10) ``` -Note each composition we take the previous symbol as the data argument, +Note each composition we take the previous symbol as the first argument, forming a feedforward chain. The architecture looks like ``` @@ -49,7 +49,7 @@ where the last 10 units correspond to the 10 output classes (digits classes: ```julia -mlp = mx.SoftmaxOutput(data = fc3, name=:softmax) +mlp = mx.SoftmaxOutput(fc3, name=:softmax) ``` As we can see, the MLP is just a chain of layers. For this case, we can @@ -148,12 +148,12 @@ listed below: data = mx.Variable(:data) # first conv -conv1 = @mx.chain mx.Convolution(data=data, kernel=(5,5), num_filter=20) => +conv1 = @mx.chain mx.Convolution(data, kernel=(5,5), num_filter=20) => mx.Activation(act_type=:tanh) => mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) # second conv -conv2 = @mx.chain mx.Convolution(data=conv1, kernel=(5,5), num_filter=50) => +conv2 = @mx.chain mx.Convolution(conv1, kernel=(5,5), num_filter=50) => mx.Activation(act_type=:tanh) => mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) ``` @@ -168,17 +168,17 @@ a tensor of shape `(28,28,1,100)`. The convolution and pooling operates in the spatial axis, so `kernel=(5,5)` indicate a square region of 5-width and 5-height. The rest of the architecture follows as: -```ulia +```julia # first fully-connected -fc1 = @mx.chain mx.Flatten(data=conv2) => +fc1 = @mx.chain mx.Flatten(conv2) => mx.FullyConnected(num_hidden=500) => mx.Activation(act_type=:tanh) # second fully-connected -fc2 = mx.FullyConnected(data=fc1, num_hidden=10) +fc2 = mx.FullyConnected(fc1, num_hidden=10) # softmax loss -lenet = mx.Softmax(data=fc2, name=:softmax) +lenet = mx.Softmax(fc2, name=:softmax) ``` Note a fully-connected operator expects the input to be a matrix. 
From c9eb71bc8bbc52c56dae097405caaf9985c99834 Mon Sep 17 00:00:00 2001 From: Michael Creel Date: Sun, 19 Mar 2017 20:59:26 +0100 Subject: [PATCH 456/630] switch to Plots.jl from pyplot (#217) --- examples/regression-example.jl | 7 ++----- 1 file changed, 2 insertions(+), 5 deletions(-) diff --git a/examples/regression-example.jl b/examples/regression-example.jl index bf0acb14b2f1..508dfa79b308 100644 --- a/examples/regression-example.jl +++ b/examples/regression-example.jl @@ -6,7 +6,7 @@ the predictions from the trained net. =# using MXNet using Distributions -using PyPlot +using Plots # data generating process generate_inputs(mean, var, size) = rand(MvNormal(mean, var), size) @@ -56,7 +56,4 @@ mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprov # obtain predictions plotprovider = mx.ArrayDataProvider(:data => ValidationInput, :label => ValidationOutput) fit = mx.predict(model, plotprovider) -plot(ValidationOutput,fit',".") -xlabel("true") -ylabel("predicted") -title("outputs: true versus predicted. 45º line is what we hope for") +scatter(ValidationOutput,fit',w = 3, xlabel="true", ylabel="predicted", title="45º line is what we hope for", show=true) From 1781290bfb6d67876db453c652bb3d924eaba13f Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 30 Mar 2017 06:08:36 +0900 Subject: [PATCH 457/630] Update ACE metric (#220) * Takes eps parameter to prevent log(0) to blow up, * Recognises learning of probability distributions. --- src/metric.jl | 43 ++++++++++++++++++++++++++++++++--------- test/unittest/metric.jl | 11 ++++++----- 2 files changed, 40 insertions(+), 14 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 135fe9fa6994..36d82fe7ab47 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -262,12 +262,16 @@ end ACE Calculates the averaged cross-entropy (logloss) for classification. + +# Arguments: +* `eps::Float64`: Prevents returning `Inf` if `p = 0`. 
""" type ACE <: AbstractEvalMetric ace_sum :: Float64 n_sample :: Int + eps :: Float64 - ACE() = new(0.0, 0) + ACE(eps=1.0e-8) = new(0.0, 0, eps) end function get(metric :: ACE) @@ -281,9 +285,17 @@ end function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) @nd_as_jl ro=(label,pred) begin + eps = metric.eps # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) - if ndims(pred) == 4 + if size(label) == size(pred) # simply calculate the cross entropy of the probabilities + for (q, p) in zip(pred, label) + # p == true probability + # q == "unnatural" probability + metric.ace_sum += p * log(q + eps) + metric.n_sample += 1 + end + elseif ndims(pred) == 4 labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) for sample in 1:size(labels, 4) for j in 1:size(labels, 2) @@ -292,7 +304,7 @@ function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) # Since we can only target labels right now this is the only thing we can do. 
target = Int(labels[i, j, 1, sample]) + 1 # klasses are 0...k-1 => julia indexing p_k = pred[i, j, target, sample] - metric.ace_sum += log(p_k) + metric.ace_sum += log(p_k + eps) metric.n_sample += 1 end end @@ -301,7 +313,7 @@ function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) for sample in 1:size(label, 1) target = Int(label[sample]) + 1 # 0-based indexing => 1-based indexing p_k = pred[target, sample] - metric.ace_sum += log(p_k) + metric.ace_sum += log(p_k + eps) metric.n_sample += 1 end else @@ -319,8 +331,9 @@ This can be used to quantify the influence of different classes on the overall l type MultiACE <: AbstractEvalMetric aces :: Vector{Float64} counts :: Vector{Int} + eps :: Float64 - MultiACE(nclasses) = new(Base.zeros(nclasses), Base.zeros(Int, nclasses)) + MultiACE(nclasses, eps=1.0e-8) = new(Base.zeros(nclasses), Base.zeros(Int, nclasses), eps) end function get(metric :: MultiACE) @@ -336,10 +349,22 @@ end function _update_single_output(metric :: MultiACE, label :: NDArray, pred :: NDArray) @nd_as_jl ro=(label,pred) begin + eps = metric.eps # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) - - if ndims(pred) == 4 + @assert size(metric.aces) == size(metric.counts) + if size(label) == size(pred) # simply calculate the cross entropy of the probabilities + for k in 1:length(metric.aces) + kpred = view(pred, ntuple(d->:, ndims(pred) - 2)..., k, :) + klabel = view(label, ntuple(d->:, ndims(label) - 2)..., k, :) + for (q, p) in zip(kpred, klabel) + # p == true probability + # q == "unnatural" probability + metric.aces[k] += p * log(q + eps) + metric.counts[k] += 1 + end + end + elseif ndims(pred) == 4 labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) for sample in 1:size(labels, 4) for j in 1:size(labels, 2) @@ -349,7 +374,7 @@ function _update_single_output(metric :: MultiACE, label :: NDArray, pred :: NDA target = Int(labels[i, j, 1, sample]) + 1 # klasses are 
0...k-1 => julia indexing p_k = pred[i, j, target, sample] - metric.aces[target] += log(p_k) + metric.aces[target] += log(p_k + eps) metric.counts[target] += 1 end end @@ -358,7 +383,7 @@ function _update_single_output(metric :: MultiACE, label :: NDArray, pred :: NDA for sample in 1:size(label, 1) target = Int(label[sample]) + 1 p_k = pred[target, sample] - metric.aces[target] += log(p_k) + metric.aces[target] += log(p_k + eps) metric.counts[target] += 1 end else diff --git a/test/unittest/metric.jl b/test/unittest/metric.jl index 46b62a243dc1..9628f6ca28b4 100644 --- a/test/unittest/metric.jl +++ b/test/unittest/metric.jl @@ -17,10 +17,10 @@ function generate_probs(n, m) # Normalize: ensure each column sums to 1 for j = 1:m - colsum = sum(result[:, j]) - for i = 1:n - result[i, j] /= colsum - end + colsum = sum(result[:, j]) + for i = 1:n + result[i, j] /= colsum + end end result end @@ -28,8 +28,9 @@ end function loglikelihood{T <: AbstractFloat}(labels::Vector{T}, probs::Array{T, 2}) LL = 0.0 + eps = 1.0e-8 for i = 1:size(labels, 1) - LL += log(probs[Int(labels[i]) + 1, i]) # labels are zero-based + LL += log(probs[Int(labels[i]) + 1, i] + eps) # labels are zero-based end LL / size(labels, 1) end From 9474d9595785b3a25074305767c527d010f57263 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 30 Mar 2017 06:10:00 +0900 Subject: [PATCH 458/630] provide an optional context in mx.load_checkpoint (#221) --- src/model.jl | 9 +++++++-- 1 file changed, 7 insertions(+), 2 deletions(-) diff --git a/src/model.jl b/src/model.jl index f1f05595533d..46323d701f23 100644 --- a/src/model.jl +++ b/src/model.jl @@ -613,9 +613,14 @@ function load_checkpoint(prefix :: AbstractString, epoch :: Int) return (arch, arg_params, aux_params) end -function load_checkpoint(prefix :: AbstractString, epoch :: Int, ::Type{FeedForward}) +""" + load_checkpoint(prefix, epoch, ::mx.FeedForward; context) + +Load a mx.FeedForward model from the checkpoint *prefix*, *epoch* and optionally 
provide a context. +""" +function load_checkpoint(prefix :: AbstractString, epoch :: Int, ::Type{FeedForward}; context = nothing) arch, arg_params, aux_params = load_checkpoint(prefix, epoch) - model = FeedForward(arch) + model = FeedForward(arch, context = context) model.arg_params = arg_params model.aux_params = aux_params return model From 46440e3ff60cbb9c60147ba7572d8013658ead01 Mon Sep 17 00:00:00 2001 From: Pepe Mandioca Date: Thu, 30 Mar 2017 19:14:37 -0300 Subject: [PATCH 459/630] Added initializers for Spatial Transformer Networks (STN) layers (#223) --- src/initializer.jl | 39 ++++++++++++++++++++++++++++++++++++++- 1 file changed, 38 insertions(+), 1 deletion(-) diff --git a/src/initializer.jl b/src/initializer.jl index dacb06f349c3..dc484eb2dfe8 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -19,7 +19,13 @@ abstract AbstractInitializer function init{T<:AbstractInitializer}(self :: T, name :: Base.Symbol, array :: NDArray) strname = string(name) - if endswith(strname, "bias") + if startswith(strname,"upsampling") + _init_bilinear(self,name, array) + elseif startswith(strname,"stn_loc") && endswith(strname,"weight") + _init_zero(self,name, array) + elseif startswith(strname,"stn_loc") && endswith(strname,"bias") + _init_loc_bias(self,name, array) + elseif endswith(strname, "bias") _init_bias(self, name, array) elseif endswith(strname, "gamma") _init_gamma(self, name, array) @@ -36,6 +42,37 @@ function init{T<:AbstractInitializer}(self :: T, name :: Base.Symbol, array :: N end end +function _init_loc_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + assert(size(array) == (6,)) + array=[1.0, 0, 0, 0, 1.0, 0] +end + +function _init_bilinear(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) + # ported from python version: + #weight = np.zeros(np.prod(arr.shape), dtype='float32') + #shape = arr.shape + #f = np.ceil(shape[3] / 2.) + #c = (2 * f - 1 - f % 2) / (2. 
* f) + #for i in range(np.prod(shape)): + # x = i % shape[3] + # y = (i / shape[3]) % shape[2] + # weight[i] = (1 - abs(x / f - c)) * (1 - abs(y / f - c)) + #arr[:] = weight.reshape(shape) + + weight=zeros(array) + + h,w,channels,n=size(array) + f = ceil(w / 2.) + c = (2 * f - 1 - f % 2) / (2. * f) + + for i=1:length(weight) + x = i % w + y = (i / w) % h + weight[i] = (1 - abs(x / f - c)) * (1 - abs(y / f - c)) + end + array[:,:,:,:]=weight +end + function _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) array[:] = 0 end From 9dd329168313a248b56617897e6aa08b2b545834 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 2 Apr 2017 14:31:06 +0800 Subject: [PATCH 460/630] docs: update renamed `every_n_batch` ref: #407 [ci skip] --- src/callback.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/callback.jl b/src/callback.jl index 7736bbf08a44..e71bb1f844c8 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -37,7 +37,7 @@ A convenient function to construct a callback that runs every `n` mini-batches. For example, the [`speedometer`](@ref) callback is defined as ```julia -every_n_iter(frequency, call_on_0=true) do state :: OptimizationState +every_n_batch(frequency, call_on_0=true) do state :: OptimizationState if state.curr_batch == 0 # reset timer else @@ -102,7 +102,7 @@ A convenient function to construct a callback that runs every `n` full data-pass yet. This is useful if you want to inspect the randomly initialized model that has not seen any data yet. -See also [`every_n_iter`](@ref). +See also [`every_n_batch`](@ref). """ function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) From 5c02fcb0eb56f98de6eda8995301c3f638e7e161 Mon Sep 17 00:00:00 2001 From: Facundo Quiroga Date: Sun, 2 Apr 2017 20:34:26 -0300 Subject: [PATCH 461/630] Check if key stride exists in the node info when producing graphviz output. 
Fixes #213 --- src/visualize.jl | 17 ++++++++++++++--- 1 file changed, 14 insertions(+), 3 deletions(-) diff --git a/src/visualize.jl b/src/visualize.jl index f7dfca859432..ea700b704266 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -51,7 +51,7 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp attr = deepcopy(node_attr) label = op - # Up to 0.8 version of mxnet additional info was stored in + # Up to 0.8 version of mxnet additional info was stored in # node["param"]. Staring from pre0.9 `param` was changed to `attr`. if haskey(node, "param") node_info = node["param"] @@ -69,9 +69,15 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp continue end elseif op == "Convolution" + if haskey(node_info,"stride") + stride_info=_extract_shape(node_info["stride"]) + else + stride_info="1" + end + label = format("Convolution\nkernel={1}\nstride={2}\nn-filter={3}", _extract_shape(node_info["kernel"]), - _extract_shape(node_info["stride"]), + stride_info, node_info["num_filter"]) colorkey = 2 elseif op == "FullyConnected" @@ -83,10 +89,15 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp elseif op == "BatchNorm" colorkey = 4 elseif op == "Pooling" + if haskey(node_info,"stride") + stride_info=_extract_shape(node_info["stride"]) + else + stride_info="1" + end label = format("Pooling\ntype={1}\nkernel={2}\nstride={3}", node_info["pool_type"], _extract_shape(node_info["kernel"]), - _extract_shape(node_info["stride"])) + stride_info) colorkey = 5 elseif op ∈ ("Concat", "Flatten", "Reshape") colorkey = 6 From 31b95fb1e6bed98c2e7621f524dce51f6d91294f Mon Sep 17 00:00:00 2001 From: ultradian Date: Mon, 10 Apr 2017 07:22:46 -0700 Subject: [PATCH 462/630] Update mnist.md (#227) add link to Jupyter notebooks --- docs/src/tutorial/mnist.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/src/tutorial/mnist.md b/docs/src/tutorial/mnist.md index 
9b580cfcf38d..a12e10b37821 100644 --- a/docs/src/tutorial/mnist.md +++ b/docs/src/tutorial/mnist.md @@ -6,7 +6,7 @@ multi-layer perceptron and then a convolutional neural network (the LeNet architecture) on the [MNIST handwritten digit dataset](http://yann.lecun.com/exdb/mnist/). The code for this tutorial could be found in -[examples/mnist](https://github.com/dmlc/MXNet.jl/tree/master/examples/mnist). +[examples/mnist](https://github.com/dmlc/MXNet.jl/tree/master/examples/mnist). There are also two Jupyter notebooks that expand a little more on the [MLP](https://github.com/ultradian/julia_notebooks/blob/master/mxnet/mnistMLP.ipynb) and the [LeNet](https://github.com/ultradian/julia_notebooks/blob/master/mxnet/mnistLenet.ipynb), using the more general `ArrayDataProvider`. Simple 3-layer MLP ------------------ From 1be1b8762d535fa6fed48a51caf652ad8e000cc4 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 12 Apr 2017 15:43:34 +0900 Subject: [PATCH 463/630] fix conflict with Images --- src/io.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/io.jl b/src/io.jl index f65314e67c71..ea22a4da961f 100644 --- a/src/io.jl +++ b/src/io.jl @@ -253,9 +253,9 @@ TODO: remove `data_padding` and `label_padding`, and implement rollover that cop the last or first several training samples to feed the padding. 
""" type ArrayDataProvider <: AbstractDataProvider - data_arrays :: Vector{Array{MX_float}} + data_arrays :: Vector{Array} data_names :: Vector{Base.Symbol} - label_arrays :: Vector{Array{MX_float}} + label_arrays :: Vector{Array} label_names :: Vector{Base.Symbol} batch_size :: Int sample_count :: Int From bfa966ac3f0c4f187a438db819c2e92e56ad8d47 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 13 Apr 2017 10:02:35 +0900 Subject: [PATCH 464/630] fixes bilinear initializer following approach in #34 --- src/initializer.jl | 43 +++++++++++++++++++++---------------------- 1 file changed, 21 insertions(+), 22 deletions(-) diff --git a/src/initializer.jl b/src/initializer.jl index dc484eb2dfe8..5e34dce8d8f9 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -48,29 +48,28 @@ function _init_loc_bias(self :: AbstractInitializer, name :: Base.Symbol, array end function _init_bilinear(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) - # ported from python version: - #weight = np.zeros(np.prod(arr.shape), dtype='float32') - #shape = arr.shape - #f = np.ceil(shape[3] / 2.) - #c = (2 * f - 1 - f % 2) / (2. * f) - #for i in range(np.prod(shape)): - # x = i % shape[3] - # y = (i / shape[3]) % shape[2] - # weight[i] = (1 - abs(x / f - c)) * (1 - abs(y / f - c)) - #arr[:] = weight.reshape(shape) - - weight=zeros(array) - - h,w,channels,n=size(array) - f = ceil(w / 2.) - c = (2 * f - 1 - f % 2) / (2. 
* f) - - for i=1:length(weight) - x = i % w - y = (i / w) % h - weight[i] = (1 - abs(x / f - c)) * (1 - abs(y / f - c)) + @assert ndims(array) == 4 + + W, H, C, N = size(array) # Inverse of NCHW layout + filter = Base.zeros(eltype(array), W, H) + + @assert H == W + + f = ceil(Int, W / 2) # factor + c = (2 * f - 1 - f % 2) / (2 * f) # center + for x in 0:(W-1) + for y in 0:(H-1) + filter[x+1, y+1] = (1 - abs(x / f - c)) * (1 - abs(y / f - c)) + end + end + + @nd_as_jl rw=array begin + for i in 1:N + for j in 1:C + array[:,:, j, i] = filter + end + end end - array[:,:,:,:]=weight end function _init_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) From 8947eadb6b17f702e0e550274f69131150157f3d Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 13 Apr 2017 10:38:58 +0900 Subject: [PATCH 465/630] adds test for bilinear initializer --- test/unittest/initializer.jl | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) create mode 100644 test/unittest/initializer.jl diff --git a/test/unittest/initializer.jl b/test/unittest/initializer.jl new file mode 100644 index 000000000000..750959f2eb20 --- /dev/null +++ b/test/unittest/initializer.jl @@ -0,0 +1,18 @@ +@testset "Initializers" begin + @testset "Bilinear initializer" begin + # Setup a filter with scale = 2 + expectedFilter = Float32[ + 0.0625 0.1875 0.1875 0.0625; + 0.1875 0.5625 0.5625 0.1875; + 0.1875 0.5625 0.5625 0.1875; + 0.0625 0.1875 0.1875 0.0625] + filter = mx.zeros(Float32, 4, 4, 1, 4) + mx.init(mx.XavierInitializer(), :upsampling0_weight, filter) + + mx.@nd_as_jl ro=filter begin + for s in 1:size(filter, 4) + @test all(filter[:, :, 1, s] .== expectedFilter) + end + end + end +end From 558adb7f92c7d2e8dc0351b2139992f2bae9bc84 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 28 Mar 2017 17:58:00 +0900 Subject: [PATCH 466/630] add SeqMetric to apply different metrics for multi-output --- src/metric.jl | 34 ++++++++++++++++++++++++++++++++++ 1 file changed, 34 
insertions(+) diff --git a/src/metric.jl b/src/metric.jl index 36d82fe7ab47..c8a42d88854a 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -85,6 +85,40 @@ function get(metric :: MultiMetric) mapreduce(get, append!, metric.metrics) end +""" + SeqMetric(metrics::Vector{AbstractEvalMetric}) + +Apply a different metric to each output. This is especially useful for `mx.Group`. + +# Usage +Calculate accuracy [`Accuracy`](@ref) for the first output +and log-loss [`ACE`](@ref) for the second output: +```julia + mx.fit(..., eval_metric = mx.SeqMetric([mx.Accuracy(), mx.ACE()])) +``` +""" +type SeqMetric <: mx.AbstractEvalMetric + metrics :: Vector{mx.AbstractEvalMetric} +end + +function update!(metric :: SeqMetric, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + @assert length(metric.metrics) == length(labels) + @assert length(metric.metrics) == length(preds) + for (m, l, p) in zip(metric.metrics, labels, preds) + update!(m, [l], [p]) + end + return nothing +end + +function reset!(metric :: SeqMetric) + map(reset!, metric.metrics) + return nothing +end + +function get(metric :: SeqMetric) + mapreduce(get, append!, metric.metrics) +end + """ Accuracy From b4ece81a9fde4e6ea8ecfe16c1d9bbb69832e752 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Wed, 29 Mar 2017 13:02:59 +0900 Subject: [PATCH 467/630] add NullMetric --- src/metric.jl | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) diff --git a/src/metric.jl b/src/metric.jl index c8a42d88854a..eb4bff3930d9 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -54,6 +54,26 @@ function get(metric :: AbstractEvalMetric) throw(MethodError(get, (typeof(metric),))) end +""" + NullMetric() + +A metric that calculates nothing. Can be used to ignore an output during training. 
+""" +type NullMetric <: mx.AbstractEvalMetric +end + +function update!(metric :: NullMetric, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + return nothing +end + +function reset!(metric :: NullMetric) + return nothing +end + +function get(metric :: NullMetric) + return Tuple{Symbol, Float64}[] +end + """ MultiMetric(metrics::Vector{AbstractEvalMetric}) From ced3f73aa8503ae8f0d34e9ef73e94417af15b8e Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 30 Mar 2017 14:41:09 +0900 Subject: [PATCH 468/630] fix pointer(NDArray) for Float64 --- src/ndarray.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index d37b321a2d8a..42ad43d7c492 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -798,8 +798,8 @@ end # pointers from CPU) leads to undefined behavior. import Base.pointer function pointer(arr :: NDArray) - pdata = Ref{Ptr{MX_float}}(0) - @mxcall(:MXNDArrayGetData, (MX_handle, Ref{Ptr{MX_float}}), arr, pdata) + pdata = Ref{Ptr{Void}}(0) + @mxcall(:MXNDArrayGetData, (MX_handle, Ref{Ptr{Void}}), arr, pdata) return convert(Ptr{eltype(arr)}, pdata[]) end function _wait_to_read(arr :: NDArray) From d0253f1ba0d4d681c3e755cc1dd4a9b63e1f79ac Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 14 Apr 2017 13:00:54 +0900 Subject: [PATCH 469/630] XCode8 supports thread_local in C++ --- .travis.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.travis.yml b/.travis.yml index 6c2f33c114a4..7c1c6b9be19d 100644 --- a/.travis.yml +++ b/.travis.yml @@ -4,6 +4,7 @@ language: julia os: - linux - osx +osx_image: xcode8 julia: - 0.5 # - nightly 0.6 supports depends on #170 From 169752232f43756caab985d9dacf40ba981a498f Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Tue, 28 Mar 2017 17:58:22 +0900 Subject: [PATCH 470/630] update MSE to be agnostic to dimensions. 
--- src/metric.jl | 17 +++++++---------- 1 file changed, 7 insertions(+), 10 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index eb4bff3930d9..92e304f2877a 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -200,9 +200,10 @@ end """ MSE -Mean Squared Error. TODO: add support for multi-dimensional outputs. +Mean Squared Error. -Calculates the mean squared error regression loss in one dimension. +Calculates the mean squared error regression loss. +Requires that label and prediction have the same shape. """ type MSE <: AbstractEvalMetric @@ -213,14 +214,10 @@ type MSE <: AbstractEvalMetric end function _update_single_output(metric :: MSE, label :: NDArray, pred :: NDArray) - label = copy(label) - pred = copy(pred) - - n_sample = size(pred)[end] - metric.n_sample += n_sample - - for i = 1:n_sample - metric.mse_sum += (label[i] - pred[i])^2 + @assert size(label) == size(pred) + metric.n_sample += length(label) + @nd_as_jl ro=(label, pred) begin + metric.mse_sum += sumabs2(label .- pred) end end From e12052c65027abc1141cad86c11fa7423172eb18 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Thu, 30 Mar 2017 12:44:09 +0900 Subject: [PATCH 471/630] convert single outputs to array so that inference has it easier --- src/metric.jl | 204 ++++++++++++++++++++-------------------- test/unittest/metric.jl | 2 +- 2 files changed, 101 insertions(+), 105 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 92e304f2877a..271ab719ee89 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -27,7 +27,13 @@ function update!{T <: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray} number of outputs ($(length(preds))). The calculated metric might not be accuracte.") end for (label, pred) in zip(labels, preds) - _update_single_output(metric, label, pred) + @nd_as_jl ro=(label, pred) begin + # This is a dynamic dispatch since the conversion from NDArray to + # Array is not type-stable. 
We could use a trait to decide if we should + # convert the NDArray here so that the called function will be type-stable + # or if we should forward the NDArray. + _update_single_output(metric, label, pred) + end end end @@ -154,37 +160,35 @@ type Accuracy <: AbstractEvalMetric Accuracy() = new(0.0, 0) end -function _update_single_output(metric :: Accuracy, label :: NDArray, pred :: NDArray) - @nd_as_jl ro=(label,pred) begin - # Samples are stored in the last dimension - @assert size(label, ndims(label)) == size(pred, ndims(pred)) +function _update_single_output(metric :: Accuracy, label :: Array, pred :: Array) + # Samples are stored in the last dimension + @assert size(label, ndims(label)) == size(pred, ndims(pred)) - if ndims(pred) == 4 # Multidimensional case - # Reshape label to be of the same shape as pred. - # Except for the third dimension where the predictions are stored. - labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) + if ndims(pred) == 4 # Multidimensional case + # Reshape label to be of the same shape as pred. + # Except for the third dimension where the predictions are stored. 
+ labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) - for sample in 1:size(labels, 4) - for j in 1:size(labels, 2) - for i in 1:size(labels, 1) - label = labels[i, j, 1, sample] - klasses = view(pred, i, j, :, sample) - klass = indmax(klasses) - 1 # Classes start at 0...k-1 + for sample in 1:size(labels, 4) + for j in 1:size(labels, 2) + for i in 1:size(labels, 1) + label = labels[i, j, 1, sample] + klasses = view(pred, i, j, :, sample) + klass = indmax(klasses) - 1 # Classes start at 0...k-1 - metric.acc_sum += klass == label - metric.n_sample += 1 - end + metric.acc_sum += klass == label + metric.n_sample += 1 end end - elseif ndims(pred) == 2 # 1-dimensional case - for sample in 1:size(label, 1) - klass = indmax(view(pred, :, sample)) - 1 - metric.acc_sum += klass == label[sample] - metric.n_sample += 1 - end - else - error("Can't handle prediction with dimensions $(ndims(pred)).") end + elseif ndims(pred) == 2 # 1-dimensional case + for sample in 1:size(label, 1) + klass = indmax(view(pred, :, sample)) - 1 + metric.acc_sum += klass == label[sample] + metric.n_sample += 1 + end + else + error("Can't handle prediction with dimensions $(ndims(pred)).") end end @@ -213,12 +217,11 @@ type MSE <: AbstractEvalMetric MSE() = new(0.0, 0) end -function _update_single_output(metric :: MSE, label :: NDArray, pred :: NDArray) +function _update_single_output{T}(metric :: MSE, label :: Array{T}, pred :: Array{T}) @assert size(label) == size(pred) metric.n_sample += length(label) - @nd_as_jl ro=(label, pred) begin - metric.mse_sum += sumabs2(label .- pred) - end + metric.mse_sum += sumabs2(label .- pred) + return nothing end function get(metric :: MSE) @@ -284,10 +287,7 @@ type NMSE <: AbstractEvalMetric NMSE() = new(0.0, 0) end -function _update_single_output(metric :: NMSE, label :: NDArray, pred :: NDArray) - label = copy(label) - pred = copy(pred) - +function _update_single_output(metric :: NMSE, label :: Array, pred :: Array) n_sample = size(pred)[end] 
metric.n_sample += n_sample @@ -334,42 +334,40 @@ function reset!(metric :: ACE) metric.n_sample = 0 end -function _update_single_output(metric :: ACE, label :: NDArray, pred :: NDArray) - @nd_as_jl ro=(label,pred) begin - eps = metric.eps - # Samples are stored in the last dimension - @assert size(label, ndims(label)) == size(pred, ndims(pred)) - if size(label) == size(pred) # simply calculate the cross entropy of the probabilities - for (q, p) in zip(pred, label) - # p == true probability - # q == "unnatural" probability - metric.ace_sum += p * log(q + eps) +function _update_single_output(metric :: ACE, label :: Array, pred :: Array) + eps = metric.eps + # Samples are stored in the last dimension + @assert size(label, ndims(label)) == size(pred, ndims(pred)) + if size(label) == size(pred) # simply calculate the cross entropy of the probabilities + for (q, p) in zip(pred, label) + # p == true probability + # q == "unnatural" probability + metric.ace_sum += p * log(q + eps) + metric.n_sample += 1 + end + elseif ndims(pred) == 4 + labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) + for sample in 1:size(labels, 4) + for j in 1:size(labels, 2) + for i in 1:size(labels, 1) + # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification + # Since we can only target labels right now this is the only thing we can do. + target = Int(labels[i, j, 1, sample]) + 1 # klasses are 0...k-1 => julia indexing + p_k = pred[i, j, target, sample] + metric.ace_sum += log(p_k + eps) metric.n_sample += 1 - end - elseif ndims(pred) == 4 - labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) - for sample in 1:size(labels, 4) - for j in 1:size(labels, 2) - for i in 1:size(labels, 1) - # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification - # Since we can only target labels right now this is the only thing we can do. 
- target = Int(labels[i, j, 1, sample]) + 1 # klasses are 0...k-1 => julia indexing - p_k = pred[i, j, target, sample] - metric.ace_sum += log(p_k + eps) - metric.n_sample += 1 - end end end - elseif ndims(pred) == 2 # 1-dimensional case - for sample in 1:size(label, 1) - target = Int(label[sample]) + 1 # 0-based indexing => 1-based indexing - p_k = pred[target, sample] - metric.ace_sum += log(p_k + eps) - metric.n_sample += 1 - end - else - error("Can't handle prediction with dimensions $(ndims(pred)).") end + elseif ndims(pred) == 2 # 1-dimensional case + for sample in 1:size(label, 1) + target = Int(label[sample]) + 1 # 0-based indexing => 1-based indexing + p_k = pred[target, sample] + metric.ace_sum += log(p_k +eps) + metric.n_sample += 1 + end + else + error("Can't handle prediction with dimensions $(ndims(pred)).") end end @@ -398,48 +396,46 @@ function reset!(metric :: MultiACE) metric.counts = Base.zero(metric.counts) end -function _update_single_output(metric :: MultiACE, label :: NDArray, pred :: NDArray) - @nd_as_jl ro=(label,pred) begin - eps = metric.eps - # Samples are stored in the last dimension - @assert size(label, ndims(label)) == size(pred, ndims(pred)) - @assert size(metric.aces) == size(metric.counts) - if size(label) == size(pred) # simply calculate the cross entropy of the probabilities - for k in 1:length(metric.aces) - kpred = view(pred, ntuple(d->:, ndims(pred) - 2)..., k, :) - klabel = view(label, ntuple(d->:, ndims(label) - 2)..., k, :) - for (q, p) in zip(kpred, klabel) - # p == true probability - # q == "unnatural" probability - metric.aces[k] += p * log(q + eps) - metric.counts[k] += 1 - end +function _update_single_output(metric :: MultiACE, label :: Array, pred :: Array) + eps = metric.eps + # Samples are stored in the last dimension + @assert size(label, ndims(label)) == size(pred, ndims(pred)) + @assert size(metric.aces) == size(metric.counts) + if size(label) == size(pred) # simply calculate the cross entropy of the 
probabilities + for k in 1:length(metric.aces) + kpred = view(pred, ntuple(d->:, ndims(pred) - 2)..., k, :) + klabel = view(label, ntuple(d->:, ndims(label) - 2)..., k, :) + for (q, p) in zip(kpred, klabel) + # p == true probability + # q == "unnatural" probability + metric.aces[k] += p * log(q + eps) + metric.counts[k] += 1 end - elseif ndims(pred) == 4 - labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) - for sample in 1:size(labels, 4) - for j in 1:size(labels, 2) - for i in 1:size(labels, 1) - # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification - # Since we can only target labels right now this is the only thing we can do. - target = Int(labels[i, j, 1, sample]) + 1 # klasses are 0...k-1 => julia indexing - p_k = pred[i, j, target, sample] - - metric.aces[target] += log(p_k + eps) - metric.counts[target] += 1 - end + end + elseif ndims(pred) == 4 + labels = reshape(label, size(pred, 1, 2)..., 1, size(pred, 4)) + for sample in 1:size(labels, 4) + for j in 1:size(labels, 2) + for i in 1:size(labels, 1) + # Cross-entropy reduces to -(ln(p_1)*0 + ln(p_2)*1) for classification + # Since we can only target labels right now this is the only thing we can do. 
+ target = Int(labels[i, j, 1, sample]) + 1 # klasses are 0...k-1 => julia indexing + p_k = pred[i, j, target, sample] + + metric.aces[target] += log(p_k + eps) + metric.counts[target] += 1 end end - elseif ndims(pred) == 2 - for sample in 1:size(label, 1) - target = Int(label[sample]) + 1 - p_k = pred[target, sample] - metric.aces[target] += log(p_k + eps) - metric.counts[target] += 1 - end - else - error("Can't handle prediction with dimensions $(ndims(pred)).") end + elseif ndims(pred) == 2 + for sample in 1:size(label, 1) + target = Int(label[sample]) + 1 + p_k = pred[target, sample] + metric.aces[target] += log(p_k + eps) + metric.counts[target] += 1 + end + else + error("Can't handle prediction with dimensions $(ndims(pred)).") end end diff --git a/test/unittest/metric.jl b/test/unittest/metric.jl index 9628f6ca28b4..1377c4c2bb81 100644 --- a/test/unittest/metric.jl +++ b/test/unittest/metric.jl @@ -48,7 +48,7 @@ function test_ace() probs = convert(Array{Float32}, generate_probs(n_categories, n_observations)) LL = loglikelihood(labels, probs) metric = mx.ACE() # For categorical variables, ACE == -LL - mx._update_single_output(metric, mx.NDArray(labels), mx.NDArray(probs)) + mx._update_single_output(metric, labels, probs) LL_v2 = metric.ace_sum / metric.n_sample @static if VERSION >= v"0.6.0-dev.2075" @test LL ≈ LL_v2 atol=1e-12 From def129f20a03bec6913217c6b9e685941dad66e2 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 14 Apr 2017 11:45:16 +0900 Subject: [PATCH 472/630] convert eps to eltype of array --- src/metric.jl | 8 ++++---- test/unittest/metric.jl | 2 +- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 271ab719ee89..1eed64988b12 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -334,8 +334,8 @@ function reset!(metric :: ACE) metric.n_sample = 0 end -function _update_single_output(metric :: ACE, label :: Array, pred :: Array) - eps = metric.eps +function _update_single_output{T}(metric :: ACE, 
label :: Array{T}, pred :: Array{T}) + eps = convert(T, metric.eps) # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) if size(label) == size(pred) # simply calculate the cross entropy of the probabilities @@ -396,8 +396,8 @@ function reset!(metric :: MultiACE) metric.counts = Base.zero(metric.counts) end -function _update_single_output(metric :: MultiACE, label :: Array, pred :: Array) - eps = metric.eps +function _update_single_output{T}(metric :: MultiACE, label :: Array{T}, pred :: Array{T}) + eps = convert(T, metric.eps) # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) @assert size(metric.aces) == size(metric.counts) diff --git a/test/unittest/metric.jl b/test/unittest/metric.jl index 1377c4c2bb81..5b5632a87c76 100644 --- a/test/unittest/metric.jl +++ b/test/unittest/metric.jl @@ -28,7 +28,7 @@ end function loglikelihood{T <: AbstractFloat}(labels::Vector{T}, probs::Array{T, 2}) LL = 0.0 - eps = 1.0e-8 + eps = convert(T, 1.0e-8) for i = 1:size(labels, 1) LL += log(probs[Int(labels[i]) + 1, i] + eps) # labels are zero-based end From c2044d5bd7dad88721f7edd6c06f0f066a91076a Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 14 Apr 2017 16:01:01 +0900 Subject: [PATCH 473/630] adds THTT to enable metrics to support NDArray or Array --- src/metric.jl | 39 ++++++++++++++++++++++++++++++++++++--- 1 file changed, 36 insertions(+), 3 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 1eed64988b12..5c5945e96a9f 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -10,6 +10,16 @@ interfaces: """ abstract AbstractEvalMetric +""" + hasNDArraySupport(metric) -> Val{true/false} + +Trait for `_update_single_output` should return `Val{true}() if metric can handle `NDArray` +directly and `Val{false}()i` if requires `Array`. 
Metric that work with NDArrays can be +async, while native Julia arrays require that we copy the output of the network, which is +a blocking operation. +""" +hasNDArraySupport(::AbstractEvalMetric) = Val{true}() + """ update!(metric, labels, preds) @@ -21,6 +31,21 @@ Update and accumulate metrics. * `preds::Vector{NDArray}`: the outputs (predictions) of the network. """ function update!{T <: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}) + _update!(metric, labels, preds, hasNDArraySupport(metric)) +end + +function _update!{T<: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}, :: Val{true}) + if length(labels) != length(preds) + Base.warn_once( + "The number of labels ($(length(labels))) does not correspond to the\ + number of outputs ($(length(preds))). The calculated metric might not be accuracte.") + end + for (label, pred) in zip(labels, preds) + _update_single_output(metric, label, pred) + end +end + +function _update!{T<: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}, :: Val{false}) if length(labels) != length(preds) Base.warn_once( "The number of labels ($(length(labels))) does not correspond to the\ @@ -29,9 +54,7 @@ function update!{T <: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray} for (label, pred) in zip(labels, preds) @nd_as_jl ro=(label, pred) begin # This is a dynamic dispatch since the conversion from NDArray to - # Array is not type-stable. We could use a trait to decide if we should - # convert the NDArray here so that the called function will be type-stable - # or if we should forward the NDArray. + # Array is not type-stable. 
_update_single_output(metric, label, pred) end end @@ -160,6 +183,8 @@ type Accuracy <: AbstractEvalMetric Accuracy() = new(0.0, 0) end +hasNDArraySupport(::Accuracy) = Val{false}() + function _update_single_output(metric :: Accuracy, label :: Array, pred :: Array) # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) @@ -217,6 +242,8 @@ type MSE <: AbstractEvalMetric MSE() = new(0.0, 0) end +hasNDArraySupport(::MSE) = Val{false}() + function _update_single_output{T}(metric :: MSE, label :: Array{T}, pred :: Array{T}) @assert size(label) == size(pred) metric.n_sample += length(label) @@ -287,6 +314,8 @@ type NMSE <: AbstractEvalMetric NMSE() = new(0.0, 0) end +hasNDArraySupport(::NMSE) = Val{false}() + function _update_single_output(metric :: NMSE, label :: Array, pred :: Array) n_sample = size(pred)[end] metric.n_sample += n_sample @@ -334,6 +363,8 @@ function reset!(metric :: ACE) metric.n_sample = 0 end +hasNDArraySupport(::ACE) = Val{false}() + function _update_single_output{T}(metric :: ACE, label :: Array{T}, pred :: Array{T}) eps = convert(T, metric.eps) # Samples are stored in the last dimension @@ -396,6 +427,8 @@ function reset!(metric :: MultiACE) metric.counts = Base.zero(metric.counts) end +hasNDArraySupport(::MultiACE) = Val{false}() + function _update_single_output{T}(metric :: MultiACE, label :: Array{T}, pred :: Array{T}) eps = convert(T, metric.eps) # Samples are stored in the last dimension From 349d2a781a7acc4a408e1efca915a0dc99ad874e Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Fri, 14 Apr 2017 16:09:07 +0900 Subject: [PATCH 474/630] convert MSE to use NDArray as an example for async --- src/metric.jl | 17 ++++++++++------- 1 file changed, 10 insertions(+), 7 deletions(-) diff --git a/src/metric.jl b/src/metric.jl index 5c5945e96a9f..3bff815d4f35 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -236,27 +236,30 @@ Requires that label and prediction have the same shape. 
""" type MSE <: AbstractEvalMetric - mse_sum :: Float64 + mse_sum :: Vector{NDArray} n_sample :: Int - MSE() = new(0.0, 0) + MSE() = new(Vector{NDArray}(), 0) end -hasNDArraySupport(::MSE) = Val{false}() +hasNDArraySupport(::MSE) = Val{true}() -function _update_single_output{T}(metric :: MSE, label :: Array{T}, pred :: Array{T}) +function _update_single_output(metric :: MSE, label :: NDArray, pred :: NDArray) @assert size(label) == size(pred) metric.n_sample += length(label) - metric.mse_sum += sumabs2(label .- pred) + mse_sum = mx.sum(mx._PowerScalar(label - pred,scalar=2)) + push!(metric.mse_sum, mse_sum) return nothing end function get(metric :: MSE) - return [(:MSE, metric.mse_sum / metric.n_sample)] + # Delay copy until last possible moment + mse_sum = mapreduce(nda->copy(nda)[1], +, 0.0, metric.mse_sum) + return [(:MSE, mse_sum / metric.n_sample)] end function reset!(metric :: MSE) - metric.mse_sum = 0.0 + metric.mse_sum = Vector{NDArray}() metric.n_sample = 0 end From c4a265863557fb25314e56403d77e4fb00af25e9 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 15 Apr 2017 11:51:27 +0900 Subject: [PATCH 475/630] ensure that new submodules are initialized --- deps/build.jl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 7b654d9a9706..03e07fccbd22 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -115,7 +115,8 @@ if !libmxnet_detected `git -C mshadow checkout -- make/mshadow.mk` `git fetch` `git checkout $libmxnet_curr_ver` - `git submodule update` + `git submodule update --init` + `make clean` `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` end FileRule(joinpath(_mxdir, "config.mk"), @build_steps begin From 9aac7e13c4828872fc96a30131980e4fe086c654 Mon Sep 17 00:00:00 2001 From: undefdev Date: Sat, 15 Apr 2017 17:50:50 +0200 Subject: [PATCH 476/630] Update callback.jl (#235) fixed typo in comment --- src/callback.jl | 2 +- 1 file changed, 1 insertion(+), 1 
deletion(-) diff --git a/src/callback.jl b/src/callback.jl index e71bb1f844c8..ee200d2e30c9 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -97,7 +97,7 @@ end A convenient function to construct a callback that runs every `n` full data-passes. -* `call_on_0::Int`: keyword argument, default false. Unless set, the callback +* `call_on_0::Bool`: keyword argument, default false. Unless set, the callback will *not* be run on epoch 0. Epoch 0 means no training has been performed yet. This is useful if you want to inspect the randomly initialized model that has not seen any data yet. From 7a530fafec87966c71ae3ce9d9e44ad07be49e22 Mon Sep 17 00:00:00 2001 From: Pepe Mandioca Date: Wed, 26 Apr 2017 19:45:40 -0300 Subject: [PATCH 477/630] Fixed SpatialTransformerNetwork loc_bias initializer. Added lenet-stn example. (#238) --- examples/mnist/lenet-stn.jl | 64 +++++++++++++++++++++++++++++++++++++ src/initializer.jl | 2 +- 2 files changed, 65 insertions(+), 1 deletion(-) create mode 100644 examples/mnist/lenet-stn.jl diff --git a/examples/mnist/lenet-stn.jl b/examples/mnist/lenet-stn.jl new file mode 100644 index 000000000000..23ca9de3fdb3 --- /dev/null +++ b/examples/mnist/lenet-stn.jl @@ -0,0 +1,64 @@ +using MXNet + +#-------------------------------------------------------------------------------- +# define lenet with stn layer + + + +# input +data = mx.Variable(:data) + + +# the localisation network in lenet-stn +# it will increase acc about more than 1%, when num-epoch >=15 +# The localization net just takes the data as input and must output a vector in R^n +loc_net = @mx.chain mx.Convolution(data, num_filter=10, kernel=(5, 5), stride=(2,2)) => + mx.Activation(act_type=:relu) => + mx.Pooling( kernel=(2, 2), stride=(2, 2), pool_type=:max) => + mx.Convolution( num_filter=10, kernel=(3, 3), stride=(2,2), pad=(1, 1)) => + mx.Activation(act_type=:relu) => + mx.Pooling( global_pool=true, kernel=(2, 2), pool_type=:avg) => + mx.Flatten() => + mx.FullyConnected(num_hidden=6, 
name=:stn_loc) + +data=mx.SpatialTransformer(data,loc_net, target_shape = (28,28), transform_type="affine", sampler_type="bilinear") + +# first conv +conv1 = @mx.chain mx.Convolution(data, kernel=(5,5), num_filter=20) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) + +# second conv +conv2 = @mx.chain mx.Convolution(conv1, kernel=(5,5), num_filter=50) => + mx.Activation(act_type=:tanh) => + mx.Pooling(pool_type=:max, kernel=(2,2), stride=(2,2)) + +# first fully-connected +fc1 = @mx.chain mx.Flatten(conv2) => + mx.FullyConnected(num_hidden=500) => + mx.Activation(act_type=:tanh) + +# second fully-connected +fc2 = mx.FullyConnected(fc1, num_hidden=10) + +# softmax loss +lenet = mx.SoftmaxOutput(fc2, name=:softmax) + + +#-------------------------------------------------------------------------------- + +# load data +batch_size = 100 +include("mnist-data.jl") +train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) + +#-------------------------------------------------------------------------------- +# fit model +model = mx.FeedForward(lenet, context=mx.cpu()) + +# optimizer +optimizer = mx.ADAM(lr=0.01, weight_decay=0.00001) + +# fit parameters +initializer=mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1) +mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider,initializer=initializer) diff --git a/src/initializer.jl b/src/initializer.jl index 5e34dce8d8f9..4685f41101cc 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -44,7 +44,7 @@ end function _init_loc_bias(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) assert(size(array) == (6,)) - array=[1.0, 0, 0, 0, 1.0, 0] + array[:]= [1.0, 0, 0, 0, 1.0, 0] end function _init_bilinear(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) From 06010b8936e82bfc74b7e0a59324e2b2162aa745 Mon Sep 17 00:00:00 2001 From: Mus M Date: Sat, 29 Apr 2017 22:13:38 
-0400 Subject: [PATCH 478/630] explicitly specify 7z (#239) --- deps/build.jl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 03e07fccbd22..6be844574968 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -43,7 +43,8 @@ if !libmxnet_detected run(`cmd /c copy "usr\\3rdparty\\openblas\\bin\\*.dll" "usr\\lib"`) run(download_cmd(package_url, "mxnet.7z")) - run(`7z x mxnet.7z -y -ousr`) + exe7z = joinpath(JULIA_HOME, "7z.exe") + run(`$exe7z x mxnet.7z -y -ousr`) return end From 6cc9e99cd4fbff26c099ded296cd4984e21cf5a7 Mon Sep 17 00:00:00 2001 From: Robin Deits Date: Tue, 9 May 2017 14:13:35 -0400 Subject: [PATCH 479/630] add verbosity option to predict() --- src/model.jl | 18 ++++++++++++------ 1 file changed, 12 insertions(+), 6 deletions(-) diff --git a/src/model.jl b/src/model.jl index 46323d701f23..afa3aa351a8a 100644 --- a/src/model.jl +++ b/src/model.jl @@ -143,7 +143,7 @@ function init_model(self :: FeedForward, initializer :: AbstractInitializer; ove return (arg_names, param_names, aux_names) end -function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_shapes...) +function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; verbosity :: Integer = 1, data_shapes...) if !isdefined(self, :pred_exec) || isa(self.pred_exec, Void) || overwrite if !isdefined(self, :arg_params) || !isdefined(self, :aux_params) @assert(false, "Model weights not defined, please init or train the model, or load from file") @@ -152,7 +152,7 @@ function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; data_sha # the predictor use only the first device self.pred_exec = simple_bind(self.arch, self.ctx[1]; grad_req=GRAD_NOP, data_shapes...) 
dbg_str = mx.debug_str(self.pred_exec) - info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[1])) + verbosity >= 1 && info(string("TempSpace: ", split(dbg_str, ['\n'])[end-2]..., " on ", self.ctx[1])) copy_params_from(self.pred_exec, self.arg_params, self.aux_params) else # make sure the new setup is compatible with the existing one @@ -185,6 +185,10 @@ end then the executor can be potentially be re-used. So, if `overwrite` is false, we will try to re-use, and raise an error if batch-size changed. If `overwrite` is true (the default), a new `Executor` will be created to replace the old one. +* `verbosity::Integer`: Determines the verbosity of the print messages. Higher numbers + leads to more verbose printing. Acceptable values are + - `0`: Do not print anything during prediction + - `1`: Print allocation information during prediction !!! note Prediction is computationally much less costly than training, so the bottleneck sometimes becomes the IO @@ -203,13 +207,15 @@ end See also [`train`](@ref), [`fit`](@ref), [`init_model`](@ref), and [`load_checkpoint`](@ref) """ -function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = true) - predict(self, data; overwrite = overwrite, callback=callback) +function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; + overwrite :: Bool = true, verbosity :: Integer = 1) + predict(self, data; overwrite = overwrite, callback=callback, verbosity = verbosity) end -function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=true, callback::Union{Function,Void}=nothing) +function predict(self :: FeedForward, data :: AbstractDataProvider; + overwrite::Bool=true, callback::Union{Function,Void}=nothing, verbosity :: Integer = 1) data_shapes = provide_data(data) data_names = [x[1] for x in data_shapes] - _setup_predictor(self, overwrite; data_shapes...) 
+ _setup_predictor(self, overwrite; verbosity = verbosity, data_shapes...) batch_size = get_batch_size(data) data_arrays = [self.pred_exec.arg_dict[name] for name in data_names] From 5d163055fd0a2b96d00877e0e15164b91f3dac11 Mon Sep 17 00:00:00 2001 From: Mus M Date: Fri, 12 May 2017 09:54:59 -0400 Subject: [PATCH 480/630] explicitly specify 7z --- deps/build.jl | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 6be844574968..aebc679e304e 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -38,12 +38,13 @@ if !libmxnet_detected # TODO: Get url from JSON. package_url = "https://github.com/yajiedesign/mxnet/releases/download/$(curr_win)/$(curr_win)_mxnet_x64_vc12_cpu.7z" + exe7z = joinpath(JULIA_HOME, "7z.exe") + run(download_cmd(base_url, "mxnet_base.7z")) - run(`7z x mxnet_base.7z -y -ousr`) + run(`$exe7z x mxnet_base.7z -y -ousr`) run(`cmd /c copy "usr\\3rdparty\\openblas\\bin\\*.dll" "usr\\lib"`) run(download_cmd(package_url, "mxnet.7z")) - exe7z = joinpath(JULIA_HOME, "7z.exe") run(`$exe7z x mxnet.7z -y -ousr`) return From 8918f1b362cd20f44fa545f9a117cb09e4ec34da Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 13 May 2017 00:03:16 +0900 Subject: [PATCH 481/630] update appveyor script (#195) --- appveyor.yml | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/appveyor.yml b/appveyor.yml index 8b7699447712..62356194de72 100644 --- a/appveyor.yml +++ b/appveyor.yml @@ -1,14 +1,12 @@ environment: matrix: - - JULIAVERSION: "julialang/bin/winnt/x86/0.3/julia-0.3-latest-win32.exe" - - JULIAVERSION: "julialang/bin/winnt/x64/0.3/julia-0.3-latest-win64.exe" - - JULIAVERSION: "julianightlies/bin/winnt/x86/julia-latest-win32.exe" - - JULIAVERSION: "julianightlies/bin/winnt/x64/julia-latest-win64.exe" + - JULIAVERSION: "julialang/bin/winnt/x86/0.5/julia-0.5-latest-win32.exe" + - JULIAVERSION: "julialang/bin/winnt/x64/0.5/julia-0.5-latest-win64.exe" branches: only: - master - - 
/release-.*/ + - stable notifications: - provider: Email @@ -17,6 +15,11 @@ notifications: on_build_status_changed: false install: +# If there's a newer build queued for the same PR, cancel this one + - ps: if ($env:APPVEYOR_PULL_REQUEST_NUMBER -and $env:APPVEYOR_BUILD_NUMBER -ne ((Invoke-RestMethod ` + https://ci.appveyor.com/api/projects/$env:APPVEYOR_ACCOUNT_NAME/$env:APPVEYOR_PROJECT_SLUG/history?recordsNumber=50).builds | ` + Where-Object pullRequestId -eq $env:APPVEYOR_PULL_REQUEST_NUMBER)[0].buildNumber) { ` + throw "There are newer queued builds for this pull request, failing early." } # Download most recent Julia Windows binary - ps: (new-object net.webclient).DownloadFile( $("http://s3.amazonaws.com/"+$env:JULIAVERSION), From 60f5306a31106b623365455cc35b1cf452c747de Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sun, 29 Jan 2017 14:47:56 +0900 Subject: [PATCH 482/630] improve GPU detection. --- deps/build.jl | 55 ++++++++++++++++++++++++---------- docs/src/user-guide/install.md | 9 ++++-- 2 files changed, 46 insertions(+), 18 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index aebc679e304e..ddc4dfc99ea4 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -20,23 +20,56 @@ if haskey(ENV, "MXNET_HOME") end end +# Try to find cuda +CUDAPATHS = String[] +if haskey(ENV, "CUDA_HOME") + push!(CUDAPATHS, joinpath(ENV["CUDA_HOME"], "lib64")) +elseif is_linux() + append!(CUDAPATHS, ["/opt/cuda/lib64", "/usr/local/cuda/lib64"]) +end + +if is_unix() + try + push!(CUDAPATHS, replace(strip(readstring(`which nvcc`)), "bin/nvcc", "lib64")) + end +end + +HAS_CUDA = false +let cudalib = Libdl.find_library(["libcuda", "nvcuda.dll"], CUDAPATHS) + HAS_CUDA = Libdl.dlopen_e(cudalib) != C_NULL +end + +if !HAS_CUDA && is_windows() + # TODO: this needs to be improved. 
+ try + run(`nvcc --version`) + HAS_CUDA = true + end +end +if HAS_CUDA + info("Found a CUDA installation.") +else + info("Did not find a CUDA installation, using CPU-only version of MXNet.") +end using BinDeps @BinDeps.setup if !libmxnet_detected if is_windows() - # TODO: Detect GPU support on Windows - info("Downloading pre-built CPU packages for Windows.") - base_url = "https://github.com/dmlc/mxnet/releases/download/20160531/20160531_win10_x64_cpu.7z" + info("Downloading pre-built packages for Windows.") + name = "20160531_win10_x64_$(HAS_CUDA ? "gpu" : "cpu").7z" + base_url = "https://github.com/dmlc/mxnet/releases/download/20160531/$name" + if libmxnet_curr_ver == "master" # download_cmd uses powershell 2, but we need powershell 3 to do this - run(`powershell -NoProfile -Command Invoke-WebRequest -Uri "https://api.github.com/repos/yajiedesign/mxnet/releases/latest" -OutFile "mxnet.json"`) + run(`powershell -NoProfile -Command Invoke-WebRequest -Uri "https://api.github.com/repos/yajiedesign/mxnet/releases/latest" -OutFile "mxnet.json"`) curr_win = JSON.parsefile("mxnet.json")["tag_name"] info("Can't use MXNet master on Windows, using latest binaries from $curr_win.") end # TODO: Get url from JSON. - package_url = "https://github.com/yajiedesign/mxnet/releases/download/$(curr_win)/$(curr_win)_mxnet_x64_vc12_cpu.7z" + name = "mxnet_x64_vc12_$(HAS_CUDA ? 
"gpu" : "cpu").7z" + package_url = "https://github.com/yajiedesign/mxnet/releases/download/$(curr_win)/$(curr_win)_$(name)" exe7z = joinpath(JULIA_HOME, "7z.exe") @@ -56,16 +89,6 @@ if !libmxnet_detected blas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) - # Try to find cuda - hascuda = false - if haskey(ENV, "CUDA_HOME") - hascuda = Libdl.dlopen_e(joinpath(ENV["CUDA_HOME"], "lib64", "libcuda.so")) != C_NULL - else - cudapaths = String["/opt/cuda/lib64", "/usr/local/cuda/lib64"] - cudalib = Libdl.find_library(["libcuda", "libcuda.so"], cudapaths) - hascuda = Libdl.dlopen_e(cudalib) != C_NULL - end - if VERSION >= v"0.5.0-dev+4338" blas_vendor = Base.BLAS.vendor() else @@ -129,7 +152,7 @@ if !libmxnet_detected `cp make/config.mk config.mk` end `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` - if hascuda + if HAS_CUDA `sed -i -s 's/USE_CUDA = 0/USE_CUDA = 1/' config.mk` if haskey(ENV, "CUDA_HOME") `sed -i -s 's/USE_CUDA_PATH = NULL/USE_CUDA_PATH = $(ENV["CUDA_HOME"])/' config.mk` diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md index 34c532321ef7..abc48dcf76c0 100644 --- a/docs/src/user-guide/install.md +++ b/docs/src/user-guide/install.md @@ -21,9 +21,14 @@ MXNet.jl is built on top of [libmxnet](https://github.com/dmlc/mxnet). Upon installation, Julia will try to automatically download and build libmxnet. +There are two environment variables that change this behaviour. If you +already have a pre-installed version of mxnet you can use `MXNET_HOME` +to point the build-process in the right direction. If the automatic +cuda detection fails you can also set `CUDA_HOME` to override the process. + The libmxnet source is downloaded to `Pkg.dir("MXNet")/deps/src/mxnet`. -The automatic build is using default configurations, with OpenCV, CUDA -disabled. If the compilation failed due to unresolved dependency, or if +The automatic build is using default configurations, with OpenCV disabled. 
+If the compilation failed due to unresolved dependency, or if you want to customize the build, you can compile and install libmxnet manually. Please see below for more details. From efff124a42e446098c2b7620cb0f9f20e36c8536 Mon Sep 17 00:00:00 2001 From: Chiyuan Zhang Date: Fri, 12 May 2017 11:18:11 -0400 Subject: [PATCH 483/630] Add appveyor badge --- README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/README.md b/README.md index 06313473c060..624b04206a48 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,7 @@ # MXNet [![Build Status](https://travis-ci.org/dmlc/MXNet.jl.svg?branch=master)](https://travis-ci.org/dmlc/MXNet.jl) +[![Windows Build](https://ci.appveyor.com/api/projects/status/re90njols2th2ide?svg=true)](https://ci.appveyor.com/project/pluskid/mxnet-jl) [![codecov.io](https://codecov.io/github/dmlc/MXNet.jl/coverage.svg?branch=master)](https://codecov.io/github/dmlc/MXNet.jl?branch=master) [![](https://img.shields.io/badge/docs-latest-blue.svg)](https://dmlc.github.io/MXNet.jl/latest) [![MXNet](http://pkg.julialang.org/badges/MXNet_0.4.svg)](http://pkg.julialang.org/?pkg=MXNet) From 07777d670a9c36564866de7a01b6e04265d4ac4c Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 13 May 2017 00:16:42 +0900 Subject: [PATCH 484/630] switch to vc14 --- deps/build.jl | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index ddc4dfc99ea4..39688bf8d183 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -6,7 +6,7 @@ import JSON ################################################################################ libmxnet_detected = false libmxnet_curr_ver = "master" -curr_win = "20161125" +curr_win = "20170502" if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") @@ -58,8 +58,7 @@ using BinDeps if !libmxnet_detected if is_windows() info("Downloading pre-built packages for Windows.") - name = "20160531_win10_x64_$(HAS_CUDA ? 
"gpu" : "cpu").7z" - base_url = "https://github.com/dmlc/mxnet/releases/download/20160531/$name" + base_url = "https://github.com/yajiedesign/mxnet/releases/download/weekly_binary_build/prebuildbase_win10_x64_vc14.7z" if libmxnet_curr_ver == "master" # download_cmd uses powershell 2, but we need powershell 3 to do this @@ -68,7 +67,7 @@ if !libmxnet_detected info("Can't use MXNet master on Windows, using latest binaries from $curr_win.") end # TODO: Get url from JSON. - name = "mxnet_x64_vc12_$(HAS_CUDA ? "gpu" : "cpu").7z" + name = "mxnet_x64_vc14_$(HAS_CUDA ? "gpu" : "cpu").7z" package_url = "https://github.com/yajiedesign/mxnet/releases/download/$(curr_win)/$(curr_win)_$(name)" exe7z = joinpath(JULIA_HOME, "7z.exe") From 28344a49d14eef467723a09393ea796a9b52ea77 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 13 May 2017 14:41:18 +0900 Subject: [PATCH 485/630] actually copy the mxnet.dll to the right place on windows --- deps/build.jl | 2 ++ 1 file changed, 2 insertions(+) diff --git a/deps/build.jl b/deps/build.jl index 39688bf8d183..c2b10b459089 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -75,9 +75,11 @@ if !libmxnet_detected run(download_cmd(base_url, "mxnet_base.7z")) run(`$exe7z x mxnet_base.7z -y -ousr`) run(`cmd /c copy "usr\\3rdparty\\openblas\\bin\\*.dll" "usr\\lib"`) + run(`cmd /c copy "usr\\3rdparty\\opencv\\*.dll" "usr\\lib"`) run(download_cmd(package_url, "mxnet.7z")) run(`$exe7z x mxnet.7z -y -ousr`) + run(`cmd /c copy "usr\\build\\*.dll" "usr\\lib"`) return end From 96bdfa7056d179353f061265f569d3f8fd3c11a6 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sat, 13 May 2017 15:01:23 +0900 Subject: [PATCH 486/630] Prebuilt binaries only work on windows 64bit --- appveyor.yml | 1 - deps/build.jl | 4 ++++ 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/appveyor.yml b/appveyor.yml index 62356194de72..569f13ae0b57 100644 --- a/appveyor.yml +++ b/appveyor.yml @@ -1,6 +1,5 @@ environment: matrix: - - JULIAVERSION: 
"julialang/bin/winnt/x86/0.5/julia-0.5-latest-win32.exe" - JULIAVERSION: "julialang/bin/winnt/x64/0.5/julia-0.5-latest-win64.exe" branches: diff --git a/deps/build.jl b/deps/build.jl index c2b10b459089..754836288851 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -57,6 +57,10 @@ using BinDeps @BinDeps.setup if !libmxnet_detected if is_windows() + if Sys.ARCH != :x86_64 + info("Prebuilt windows binaries are only available on 64bit. You will have to built MXNet yourself.") + return + end info("Downloading pre-built packages for Windows.") base_url = "https://github.com/yajiedesign/mxnet/releases/download/weekly_binary_build/prebuildbase_win10_x64_vc14.7z" From 2ecf2c1666cf3edc4a32c18836cc8e86094172f7 Mon Sep 17 00:00:00 2001 From: Valentin Churavy Date: Sun, 14 May 2017 11:07:50 +0900 Subject: [PATCH 487/630] update NEWS.md --- NEWS.md | 12 +++++++++++- 1 file changed, 11 insertions(+), 1 deletion(-) diff --git a/NEWS.md b/NEWS.md index f4fb93004db8..551985db996c 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,7 +1,17 @@ +# v0.2.2 (2017.05.14) +* Updated supported version of MXNet to 0.9.4. +* Improved build-system with support for auto-detecting GPU support. +* Several updates to Metrics. +* CI for Windows. +* Verbosity option for `predict` (@rdeits) + +# v0.2.1 (2017.01.29) +* Bugfix release for Windows + # v0.2.0 (2017.01.26) * Drop support for Julia v0.4. * Added support for NVVM. -* Updated supported version of MXNet to 0.9.3. +* Updated supported version of MXNet to 0.9.2 * New optimizers (@Arkoniak). 
# v0.1.0 (2016.09.08) From 9c709227f90af180bd81094c53668ae6edeca024 Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Tue, 16 May 2017 17:19:53 -0700 Subject: [PATCH 488/630] Update CI URLs to point to new caching infrastructure --- appveyor.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/appveyor.yml b/appveyor.yml index 569f13ae0b57..3de92afc4c9d 100644 --- a/appveyor.yml +++ b/appveyor.yml @@ -1,6 +1,6 @@ environment: matrix: - - JULIAVERSION: "julialang/bin/winnt/x64/0.5/julia-0.5-latest-win64.exe" + - JULIA_URL: "https://julialang-s3.julialang.org/bin/winnt/x64/0.5/julia-0.5-latest-win64.exe" branches: only: @@ -14,6 +14,7 @@ notifications: on_build_status_changed: false install: + - ps: "[System.Net.ServicePointManager]::SecurityProtocol = [System.Net.SecurityProtocolType]::Tls12" # If there's a newer build queued for the same PR, cancel this one - ps: if ($env:APPVEYOR_PULL_REQUEST_NUMBER -and $env:APPVEYOR_BUILD_NUMBER -ne ((Invoke-RestMethod ` https://ci.appveyor.com/api/projects/$env:APPVEYOR_ACCOUNT_NAME/$env:APPVEYOR_PROJECT_SLUG/history?recordsNumber=50).builds | ` @@ -21,7 +22,7 @@ install: throw "There are newer queued builds for this pull request, failing early." } # Download most recent Julia Windows binary - ps: (new-object net.webclient).DownloadFile( - $("http://s3.amazonaws.com/"+$env:JULIAVERSION), + $env:JULIA_URL, "C:\projects\julia-binary.exe") # Run installer silently, output to C:\projects\julia - C:\projects\julia-binary.exe /S /D=C:\projects\julia From b63fd9b7d19ef1dcd6eed610fb0089f22f829784 Mon Sep 17 00:00:00 2001 From: holl- Date: Tue, 23 May 2017 19:59:24 +0200 Subject: [PATCH 489/630] Fix #242 (#247) Previously, when providing a KVStore object to mx.fit, the method would crash with an UndefVarError. This is now fixed by moving the definition of update_on_kvstore from _create_kvstore to fit. 
--- src/model.jl | 26 ++++++++++++-------------- 1 file changed, 12 insertions(+), 14 deletions(-) diff --git a/src/model.jl b/src/model.jl index afa3aa351a8a..4be38ededb92 100644 --- a/src/model.jl +++ b/src/model.jl @@ -207,11 +207,11 @@ end See also [`train`](@ref), [`fit`](@ref), [`init_model`](@ref), and [`load_checkpoint`](@ref) """ -function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; +function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; overwrite :: Bool = true, verbosity :: Integer = 1) predict(self, data; overwrite = overwrite, callback=callback, verbosity = verbosity) end -function predict(self :: FeedForward, data :: AbstractDataProvider; +function predict(self :: FeedForward, data :: AbstractDataProvider; overwrite::Bool=true, callback::Union{Function,Void}=nothing, verbosity :: Integer = 1) data_shapes = provide_data(data) data_names = [x[1] for x in data_shapes] @@ -264,9 +264,9 @@ function _init_model(self :: FeedForward, data :: AbstractDataProvider, initiali init_model(self, initializer; overwrite=overwrite, [provide_data(data)..., provide_label(data)...]...) 
end -function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}) +function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}, verbosity :: Int) if num_device == 1 && !ismatch(r"dist", string(kv_type)) - kv = nothing + return nothing else if kv_type == :local max_size = maximum([prod(size(param)) for (k,param) in arg_params]) @@ -275,17 +275,10 @@ function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params : else kv_type = :local_allreduce_cpu end - info("Auto-select kvstore type = $kv_type") + verbosity >= 2 && info("Auto-select kvstore type = $kv_type") end - kv = KVStore(kv_type) - end - - update_on_kvstore = true - if isa(kv, Void) || ismatch(r"local_allreduce", string(get_type(kv))) - update_on_kvstore = false + return KVStore(kv_type) end - - return (kv, update_on_kvstore) end @defstruct TrainingOptions ( @@ -371,7 +364,12 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra kvstore = opts.kvstore if isa(kvstore, Base.Symbol) opts.verbosity >= 2 && info("Creating KVStore...") - kvstore, update_on_kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params) + kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params, opts.verbosity) + end + + update_on_kvstore = true + if isa(kvstore, Void) || ismatch(r"local_allreduce", string(get_type(kvstore))) + update_on_kvstore = false end # get grad attribute to allow for freezing From 172af604bbcb0a4e0fd9c98671b5051f08d83e91 Mon Sep 17 00:00:00 2001 From: Elliot Saba Date: Tue, 30 May 2017 07:38:51 -0700 Subject: [PATCH 490/630] Use `Sys.CPU_CORES` not `nprocs()` when doing a parallel `make` (#250) --- deps/build.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 754836288851..0b728e3edfb4 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -168,9 +168,9 @@ if !libmxnet_detected 
ChangeDirectory(_mxdir) `cp ../../cblas.h include/cblas.h` if USE_JULIA_BLAS - `make -j$(nprocs()) USE_BLAS=$blas_name $MSHADOW_LDFLAGS` + `make -j$(min(Sys.CPU_CORES,8)) USE_BLAS=$blas_name $MSHADOW_LDFLAGS` else - `make -j$(nprocs())` + `make -j$(min(Sys.CPU_CORES,8))` end end FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin From 2b26bc2a3e150087c10c4f700731a16fa6fbbf28 Mon Sep 17 00:00:00 2001 From: ExpandingMan Date: Thu, 1 Jun 2017 11:17:41 -0400 Subject: [PATCH 491/630] update for Julia v0.6 (#248) * Updated for Julia v0.6 * Updated tests. * Added 0.5 compat. * Updated REQUIRE. * Removed compat macros. Should now work for both 0.5 and 0.6. * Attempting to fix dot operators for 0.5. * Still trying to fix the damn dot ops in 0.5. * Dotted operators now get imported from Base in version 0.5. * Updated appveyor and travis to use both 0.5 and 0.6. * Rewrote @chain to remove all AST dependence. * Updated appveyor yml. * Added a basic test for chain macro. * Fixed isa in chain to work on 0.5. * Fixed incorrect broadcast issue. * Updated appveyor. * Fixed broadcast multiplications for 0.5, again. 
--- .travis.yml | 1 + REQUIRE | 5 +- appveyor.yml | 3 ++ src/MXNet.jl | 4 ++ src/base.jl | 10 ++-- src/callback.jl | 10 ++-- src/compat.jl | 32 ++++++++++++ src/initializer.jl | 2 +- src/io.jl | 8 +-- src/metric.jl | 2 +- src/model.jl | 2 +- src/name.jl | 6 +-- src/ndarray.jl | 38 +++++++------- src/optimizer.jl | 12 +++-- src/optimizers/adadelta.jl | 6 +-- src/optimizers/adagrad.jl | 2 +- src/optimizers/adam.jl | 2 +- src/optimizers/nadam.jl | 2 +- src/optimizers/rmsprop.jl | 2 +- src/symbolic-node.jl | 94 ++++++++++++++++++---------------- test/common.jl | 6 +++ test/unittest/bind.jl | 8 +-- test/unittest/ndarray.jl | 2 +- test/unittest/symbolic-node.jl | 12 ++++- 24 files changed, 170 insertions(+), 101 deletions(-) create mode 100644 src/compat.jl diff --git a/.travis.yml b/.travis.yml index 7c1c6b9be19d..708b5392fd3e 100644 --- a/.travis.yml +++ b/.travis.yml @@ -7,6 +7,7 @@ os: osx_image: xcode8 julia: - 0.5 + - 0.6 # - nightly 0.6 supports depends on #170 # dependent apt packages diff --git a/REQUIRE b/REQUIRE index 8fdfc5fcde96..ca30ebc84ff9 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,5 +1,6 @@ -julia 0.5 -Compat 0.9.5 +julia 0.5.2 +Compat 0.25.2 Formatting BinDeps JSON +MacroTools diff --git a/appveyor.yml b/appveyor.yml index 3de92afc4c9d..e3d1984f4732 100644 --- a/appveyor.yml +++ b/appveyor.yml @@ -1,6 +1,7 @@ environment: matrix: - JULIA_URL: "https://julialang-s3.julialang.org/bin/winnt/x64/0.5/julia-0.5-latest-win64.exe" + - JULIA_URL: "https://julialang-s3.julialang.org/bin/winnt/x64/0.6/julia-0.6-latest-win64.exe" branches: only: @@ -20,6 +21,7 @@ install: https://ci.appveyor.com/api/projects/$env:APPVEYOR_ACCOUNT_NAME/$env:APPVEYOR_PROJECT_SLUG/history?recordsNumber=50).builds | ` Where-Object pullRequestId -eq $env:APPVEYOR_PULL_REQUEST_NUMBER)[0].buildNumber) { ` throw "There are newer queued builds for this pull request, failing early." 
} + # Download most recent Julia Windows binary - ps: (new-object net.webclient).DownloadFile( $env:JULIA_URL, @@ -35,3 +37,4 @@ build_script: test_script: - C:\projects\julia\bin\julia --check-bounds=yes -e "Pkg.test(\"MXNet\")" + diff --git a/src/MXNet.jl b/src/MXNet.jl index 892cc4e95163..bcc6296b3fb8 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -16,12 +16,16 @@ if VERSION >= v"0.6.0-dev.1024" end using Formatting +using MacroTools # Functions from base that we can safely extend and that are defined by libmxnet. import Base: round, ceil, floor, cos, sin, abs, sign, exp, sqrt, exp, log, norm, transpose include("base.jl") + +include("compat.jl") + include("context.jl") include("util.jl") diff --git a/src/base.jl b/src/base.jl index 183465341f3c..dd816dd41582 100644 --- a/src/base.jl +++ b/src/base.jl @@ -6,12 +6,12 @@ end ################################################################################ # Common types used in MXNet API ################################################################################ -typealias MX_uint Cuint -typealias MX_float Cfloat -typealias MX_handle Ptr{Void} +const MX_uint = Cuint +const MX_float = Cfloat +const MX_handle = Ptr{Void} -typealias char_p Ptr{UInt8} -typealias char_pp Ptr{char_p} +const char_p = Ptr{UInt8} +const char_pp = Ptr{char_p} ################################################################################ # Initialization and library API entrance diff --git a/src/callback.jl b/src/callback.jl index ee200d2e30c9..780869daf9f0 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -3,21 +3,21 @@ Abstract type of callback functions used in training. """ -abstract AbstractCallback +@compat abstract type AbstractCallback end """ AbstractBatchCallback Abstract type of callbacks to be called every mini-batch. """ -abstract AbstractBatchCallback <: AbstractCallback +@compat abstract type AbstractBatchCallback <: AbstractCallback end """ AbstractEpochCallback Abstract type of callbacks to be called every epoch. 
""" -abstract AbstractEpochCallback <: AbstractCallback +@compat abstract type AbstractEpochCallback <: AbstractCallback end type BatchCallback <: AbstractBatchCallback frequency :: Int @@ -51,7 +51,7 @@ See also [`every_n_epoch`](@ref) and [`speedometer`](@ref). function every_n_batch(callback :: Function, n :: Int; call_on_0 :: Bool = false) BatchCallback(n, call_on_0, callback) end -@compat function (cb :: BatchCallback)(state :: OptimizationState) +function (cb :: BatchCallback)(state :: OptimizationState) if state.curr_batch == 0 if cb.call_on_0 cb.callback(state) @@ -107,7 +107,7 @@ See also [`every_n_batch`](@ref). function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end -@compat function (cb :: EpochCallback){T<:Real}(model :: Any, state :: OptimizationState, metric :: Vector{Tuple{Base.Symbol, T}}) +function (cb :: EpochCallback){T<:Real}(model :: Any, state :: OptimizationState, metric :: Vector{Tuple{Base.Symbol, T}}) if state.curr_epoch == 0 if cb.call_on_0 cb.callback(model, state, metric) diff --git a/src/compat.jl b/src/compat.jl new file mode 100644 index 000000000000..7357632174e5 --- /dev/null +++ b/src/compat.jl @@ -0,0 +1,32 @@ +# this file contains code used for enabling backward compatibility with 0.5 + +# have to import base dotted operators if in 0.5 +if VERSION < v"0.6.0-dev" + import Base: .+, .-, .*, ./, .^ +end + + +# this is for declaring broadcasted functions in 0.5 +# TODO this macro should be removed when 0.5 support is dropped +macro compatdot(fblock) + if VERSION ≥ v"0.6.0-dev" + return esc(fblock) + end + @capture(fblock, function Base.broadcast(::typeof(op_), args__) + body_ + end) + opdot = Symbol(string('.',op)) + esc(quote + function $opdot($(args...)) + $body + end + end) +end + +macro compatmul(expr1, expr2) + if VERSION ≥ v"0.6.0-dev" + esc(:(broadcast(*, $expr1, $expr2))) + else + esc(:($expr1 .* $expr2)) + end +end diff --git a/src/initializer.jl 
b/src/initializer.jl index 4685f41101cc..80e6026d1bf4 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -15,7 +15,7 @@ Or, if full behavior customization is needed, override the following function init(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) """ -abstract AbstractInitializer +@compat abstract type AbstractInitializer end function init{T<:AbstractInitializer}(self :: T, name :: Base.Symbol, array :: NDArray) strname = string(name) diff --git a/src/io.jl b/src/io.jl index ea22a4da961f..242a9ad98d1a 100644 --- a/src/io.jl +++ b/src/io.jl @@ -15,7 +15,7 @@ Normally this involves defining: * `Base.done(provider, state) -> Bool` * `Base.next(provider, state) -> (AbstractDataBatch, AbstractDataProvider)` """ -abstract AbstractDataProvider +@compat abstract type AbstractDataProvider end """ get_batch_size(provider) -> Int @@ -53,7 +53,7 @@ function provide_label end Base type for data provider states. """ -abstract AbstractDataProviderState +@compat abstract type AbstractDataProviderState end """ AbstractDataBatch @@ -70,7 +70,7 @@ The following utility functions will be automatically defined: * [`load_data!`](@ref) * [`load_label!`](@ref) """ -abstract AbstractDataBatch +@compat abstract type AbstractDataBatch end """ count_samples(provider, batch) -> Int @@ -127,7 +127,7 @@ get_label{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batc A alias type of `Tuple{UnitRange{Int},NDArray}`. 
""" -typealias SlicedNDArray Tuple{UnitRange{Int},NDArray} +const SlicedNDArray = Tuple{UnitRange{Int},NDArray} function _load_general!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{Vector{SlicedNDArray}}, loader::Function) diff --git a/src/metric.jl b/src/metric.jl index 3bff815d4f35..b39309f6275c 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -8,7 +8,7 @@ interfaces: * [`reset!`](@ref) * [`get`](@ref) """ -abstract AbstractEvalMetric +@compat abstract type AbstractEvalMetric end """ hasNDArraySupport(metric) -> Val{true/false} diff --git a/src/model.jl b/src/model.jl index 4be38ededb92..a592b500e9cb 100644 --- a/src/model.jl +++ b/src/model.jl @@ -3,7 +3,7 @@ The abstract super type of all models in MXNet.jl. """ -abstract AbstractModel +@compat abstract type AbstractModel end """ FeedForward diff --git a/src/name.jl b/src/name.jl index 2ec531834232..8ba0f707ff1a 100644 --- a/src/name.jl +++ b/src/name.jl @@ -1,6 +1,6 @@ -abstract AbstractNameManager -typealias NameType Union{Base.Symbol, AbstractString} -typealias NameCounter Dict{Base.Symbol, Int} +@compat abstract type AbstractNameManager end +const NameType = Union{Base.Symbol, AbstractString} +const NameCounter = Dict{Base.Symbol, Int} import Base: get! diff --git a/src/ndarray.jl b/src/ndarray.jl index 42ad43d7c492..442f46d682ea 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,7 +1,7 @@ # All the types supported by mshadow. -typealias DType Union{Float32, Float64, Float16, UInt8, Int32} +const DType = Union{Float32, Float64, Float16, UInt8, Int32} @enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 -typealias DEFAULT_DTYPE Float32 +const DEFAULT_DTYPE = Float32 function toTypeFlag{T <: DType}(:: Type{T}) if T == Float32 @@ -300,7 +300,6 @@ function eltype{T <: Union{NDArray, MX_NDArrayHandle}}(arr :: T) end -import Base: slice """ slice(arr :: NDArray, start:stop) @@ -532,7 +531,8 @@ function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) 
return dst end -import Base: +, .+ +import Base.broadcast +import Base: + """ +(args...) @@ -546,14 +546,15 @@ function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) ret = copy(arg0, context(arg0)) add_to!(ret, args...) end -function .+(arg0 :: NDArray, args :: Union{Real, NDArray}...) +@compatdot function Base.broadcast(::typeof(+), arg0 :: NDArray, args :: Union{Real, NDArray}...) +(arg0, args...) end function +(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...) +(arg1, arg0, args...) end -function .+(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...) - .+(arg1, arg0, args...) +@compatdot function Base.broadcast(::typeof(+), arg0 :: Real, arg1 :: NDArray, + args :: Union{Real, NDArray}...) + broadcast(+, arg1, arg0, args...) end """ @@ -570,7 +571,7 @@ function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) end end -import Base: -, .- +import Base: - """ -(arg0, arg1) @@ -584,7 +585,7 @@ function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) sub_from!(ret, arg1) end -function .-(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) +@compatdot function Base.broadcast(::typeof(-), arg0 :: NDArray, arg1 :: Union{Real, NDArray}) -(arg0, arg1) end function -(arg0 :: Real, arg1 :: NDArray) @@ -592,7 +593,7 @@ function -(arg0 :: Real, arg1 :: NDArray) add_to!(ret, arg0) return ret end -function .-(arg0 :: Real, arg1 :: NDArray) +@compatdot function Base.broadcast(::typeof(-), arg0 :: Real, arg1 :: NDArray) -(arg0, arg1) end @@ -616,19 +617,19 @@ function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) return dst end -import Base: .*, * +import Base: * """ .*(arg0, arg1) Elementwise multiplication of `arg0` and `arg`, could be either scalar or `NDArray`. 
""" -function .*(arg0 :: NDArray, arg :: Union{Real, NDArray}) +@compatdot function Base.broadcast(::typeof(*), arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) mul_to!(ret, arg) end -function .*(arg0 :: Real, arg :: NDArray) - .*(arg, arg0) +@compatdot function Base.broadcast(::typeof(*), arg0 :: Real, arg :: NDArray) + arg .* arg0 end """ @@ -659,13 +660,13 @@ function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) end end -import Base: ./, / +import Base: / """ ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) Elementwise dividing an `NDArray` by a scalar or another `NDArray` of the same shape. """ -function ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) +@compatdot function Base.broadcast(::typeof(/), arg0 :: NDArray, arg :: Union{Real, NDArray}) ret = copy(arg0, context(arg0)) div_from!(ret, arg) end @@ -676,7 +677,7 @@ end Divide an `NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. """ function /(arg0 :: NDArray, arg :: Real) - ./(arg0, arg) + arg0 ./ arg end @@ -1063,7 +1064,8 @@ macro _import_ndarray_functions() func_name = Symbol(name) expr = quote - $(isdefined(Base, func_name) ? :(import Base.$func_name) : :()) + # TODO the explicit exclusion of take will no longer be necessary when it is removed from Base + $((isdefined(Base, func_name) && func_name ≠ :take)? :(import Base.$func_name) : :()) $func_def @doc $desc -> $func_def2 diff --git a/src/optimizer.jl b/src/optimizer.jl index 5e9065b64127..11508bf22035 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -3,21 +3,21 @@ Base type for all optimizers. """ -abstract AbstractOptimizer +@compat abstract type AbstractOptimizer end """ AbstractLearningRateScheduler Base type for all learning rate scheduler. """ -abstract AbstractLearningRateScheduler +@compat abstract type AbstractLearningRateScheduler end """ AbstractMomentumScheduler Base type for all momentum scheduler. 
""" -abstract AbstractMomentumScheduler +@compat abstract type AbstractMomentumScheduler end @@ -62,6 +62,7 @@ function get_learning_rate end ################################################################################ # The learning rate module module LearningRate +using Compat import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate """ @@ -137,6 +138,7 @@ end ################################################################################ # The Momentum module module Momentum +using Compat import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum """ @@ -145,7 +147,7 @@ import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum The null momentum scheduler always returns 0 for momentum. It is also used to explicitly indicate momentum should not be used. """ -type Null <: AbstractMomentumScheduler +immutable Null <: AbstractMomentumScheduler end get_momentum(self :: Null, state :: OptimizationState) = 0.0 @@ -240,7 +242,7 @@ end Base class for all optimizer options. 
""" -abstract AbstractOptimizerOptions +@compat abstract type AbstractOptimizerOptions end """ normalized_gradient(opts, state, weight, grad) diff --git a/src/optimizers/adadelta.jl b/src/optimizers/adadelta.jl index e00cc9a42abd..aec81445fbb2 100644 --- a/src/optimizers/adadelta.jl +++ b/src/optimizers/adadelta.jl @@ -78,14 +78,14 @@ function update(self :: AdaDelta, index :: Int, weight :: NDArray, # Update state.acc as in RMSProp @inplace state.acc .*= self.opts.rho - @inplace state.acc .+= (1 - self.opts.rho) * grad .* grad + @inplace state.acc .+= (1 - self.opts.rho) * @compatmul(grad, grad) # Compute update using the "old" state.delta_acc - update = grad .* sqrt(state.delta_acc + self.opts.epsilon) ./ + update = @compatmul(grad, sqrt(state.delta_acc + self.opts.epsilon)) ./ (sqrt(state.acc + self.opts.epsilon)) @inplace weight .+= -lr * update # update state.delta_acc using update @inplace state.delta_acc .*= self.opts.rho - @inplace state.delta_acc .+= (1 - self.opts.rho) * update .* update + @inplace state.delta_acc .+= (1 - self.opts.rho) * @compatmul(update, update) end diff --git a/src/optimizers/adagrad.jl b/src/optimizers/adagrad.jl index 196998121cce..2df3c07efd44 100644 --- a/src/optimizers/adagrad.jl +++ b/src/optimizers/adagrad.jl @@ -61,6 +61,6 @@ function update(self :: AdaGrad, index :: Int, weight :: NDArray, lr = get_learning_rate(self.opts.lr_scheduler, self.state) grad = normalized_gradient(self.opts, self.state, weight, grad) - @inplace state .+= grad .* grad + @inplace state .+= @compatmul(grad, grad) @inplace weight .+= -lr * grad ./ (sqrt(state + self.opts.epsilon)) end diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index 3af5c3579736..a6b5c69eefc3 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -61,7 +61,7 @@ function update(self :: ADAM, index :: Int, weight :: NDArray, grad :: NDArray, grad = normalized_gradient(self.opts, self.state, weight, grad) state.mt = self.opts.beta1 * state.mt + (1 - 
self.opts.beta1) * grad - state.vt = self.opts.beta2 * state.vt + (1 - self.opts.beta2) * (grad .* grad) + state.vt = self.opts.beta2 * state.vt + (1 - self.opts.beta2) * @compatmul(grad, grad) at = sqrt(1.0 - state.beta2Power)/(1.0 - state.beta1Power) diff --git a/src/optimizers/nadam.jl b/src/optimizers/nadam.jl index 65a195f674fe..b90b7a106984 100644 --- a/src/optimizers/nadam.jl +++ b/src/optimizers/nadam.jl @@ -91,7 +91,7 @@ function update(self :: Nadam, index :: Int, weight :: NDArray, mt = state.mt / (1.0 - momentum_next) @inplace state.nt .*= self.opts.beta2 - @inplace state.nt .+= (1.0 - self.opts.beta2) * grad .* grad + @inplace state.nt .+= (1.0 - self.opts.beta2) * @compatmul(grad, grad) nt = state.nt / (1.0 - state.beta2Power) state.beta2Power *= self.opts.beta2 diff --git a/src/optimizers/rmsprop.jl b/src/optimizers/rmsprop.jl index 01a40651d2f6..0c6c2d45a753 100644 --- a/src/optimizers/rmsprop.jl +++ b/src/optimizers/rmsprop.jl @@ -65,7 +65,7 @@ function update(self :: RMSProp, index :: Int, weight :: NDArray, grad = normalized_gradient(self.opts, self.state, weight, grad) @inplace state .*= self.opts.rho - @inplace state .+= (1 - self.opts.rho) * grad .* grad + @inplace state .+= (1 - self.opts.rho) * @compatmul(grad, grad) @inplace weight .+= -lr * grad ./ (sqrt(state + self.opts.epsilon)) end diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 4c73bd33642d..8a567c2e8003 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -38,11 +38,11 @@ function Base.copy(self :: SymbolicNode) Base.deepcopy(self) end -@compat function (self::SymbolicNode)(args :: SymbolicNode...) +function (self::SymbolicNode)(args :: SymbolicNode...) s = deepcopy(self) _compose!(s, args...) end -@compat function (self::SymbolicNode)(;kwargs...) +function (self::SymbolicNode)(;kwargs...) s = deepcopy(self) _compose!(s; kwargs...) 
end @@ -217,7 +217,7 @@ function get_name(self :: mx.SymbolicNode) success = Ref(0) @mxcall(:MXSymbolGetName, (MX_handle, Ref{char_p}, Ref{Int}), self.handle.value, name, success) @assert success[] != -1 - return Symbol(unsafe_wrap(String, name[])) + return Symbol(unsafe_string(name[])) end """ @@ -435,7 +435,8 @@ function Base.getindex(self :: SymbolicNode, idx :: Int) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -import Base: +, .+ +import Base.broadcast +import Base: + function +(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) ret = self for arg in args @@ -447,34 +448,35 @@ function +(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) end ret end -function .+(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) +@compatdot function Base.broadcast(::typeof(+), self::SymbolicNode, args::Union{SymbolicNode,Real}...) +(self, args...) end function +(s1 :: Real, self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) +(self, s1, args...) end -function .+(s1 :: Real, self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) +@compatdot function Base.broadcast(::typeof(+), s1::Real, self::SymbolicNode, + args::Union{SymbolicNode,Real}...) +(self, s1, args...) 
end -import Base: -, .- +import Base: - function -(self :: SymbolicNode, arg :: SymbolicNode) _Minus(self, arg) end -function .-(self :: SymbolicNode, arg :: SymbolicNode) +@compatdot function Base.broadcast(::typeof(-), self :: SymbolicNode, arg :: SymbolicNode) -(self, arg) end function -(self :: SymbolicNode, arg :: Real) _MinusScalar(self, scalar=MX_float(arg)) end -function .-(self :: SymbolicNode, arg :: Real) +@compatdot function Base.broadcast(::typeof(-), self :: SymbolicNode, arg :: Real) -(self, arg) end function -(arg :: Real, self :: SymbolicNode) _RMinusScalar(self, scalar=arg) end -function .-(arg :: Real, self :: SymbolicNode) +@compatdot function Base.broadcast(::typeof(-), arg :: Real, self :: SymbolicNode) -(arg, self) end @@ -482,8 +484,8 @@ function -(self :: SymbolicNode) -(0, self) end -import Base: .*, * -function .*(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) +import Base: * +@compatdot function Base.broadcast(::typeof(*), self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) ret = self for arg in args if isa(arg, SymbolicNode) @@ -494,8 +496,9 @@ function .*(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) end ret end -function .*(arg :: Real, self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) - .*(self, arg, args...) +@compatdot function Base.broadcast(::typeof(*), arg :: Real, self :: SymbolicNode, + args :: Union{SymbolicNode,Real}...) + broadcast(*, self, arg, args...) 
end function *(arg :: Real, self :: SymbolicNode) _MulScalar(self, scalar=arg) @@ -504,32 +507,32 @@ function *(self :: SymbolicNode, arg :: Real) *(arg, self) end -import Base: ./, / -function ./(self :: SymbolicNode, arg :: SymbolicNode) +import Base: / +@compatdot function Base.broadcast(::typeof(/), self :: SymbolicNode, arg :: SymbolicNode) _Div(self, arg) end -function ./(self :: SymbolicNode, arg :: Real) +@compatdot function Base.broadcast(::typeof(/), self :: SymbolicNode, arg :: Real) _DivScalar(self, scalar=MX_float(arg)) end function /(self :: SymbolicNode, arg :: Real) - ./(self, arg) + self ./ arg end function /(arg :: Real, self :: SymbolicNode) _RDivScalar(self, scalar=arg) end -function ./(arg :: Real, self :: SymbolicNode) +@compatdot function Base.broadcast(::typeof(/), arg :: Real, self :: SymbolicNode) _RDivScalar(self, scalar=arg) end -import Base: .^, ^ -function .^(self :: SymbolicNode, pow :: SymbolicNode) +import Base: ^ +@compatdot function Base.broadcast(::typeof(^), self :: SymbolicNode, pow :: SymbolicNode) _Power(self, pow) end -function .^(self :: SymbolicNode, pow :: AbstractFloat) +@compatdot function Base.broadcast(::typeof(^), self :: SymbolicNode, pow :: AbstractFloat) _PowerScalar(self, scalar=pow) end function ^(self :: SymbolicNode, pow :: AbstractFloat) - .^(self, pow) + self .^ pow end function _compose!(node :: SymbolicNode; kwargs...) @@ -750,26 +753,31 @@ end # Utility macros to chain up symbols ################################################################################ macro chain(layers) - exprs = [] - last_layer = nothing - function _chain_layer(layer, last_layer) - if isa(last_layer, Void) - esc(layer) - else - @assert(isa(layer, Expr) && layer.head == :call, "Do not know how to chain up $layer") - return Expr(:call, esc(layer.args[1]), last_layer, map(esc, layer.args[2:end])...) 
+ exprs = [] + last_layer = nothing + + function _chain_layer(layer, last_layer) + if isa(last_layer, Void) + return esc(layer) + else + if @capture(layer, f_(x__)) + return :($f($last_layer, $(x...))) + else + throw(AssertionError("$layer is not a valid function call and cannot be chained.")) + end + end end - end - while true - if layers.head == :(=>) - new_layer = gensym() - push!(exprs, :($new_layer = $(_chain_layer(layers.args[1], last_layer)))) - last_layer = new_layer - layers = layers.args[2] - else - push!(exprs, _chain_layer(layers, last_layer)) - break + + while true + if @capture(layers, l1_=>l2_) + new_layer = gensym() + push!(exprs, :($new_layer = $(_chain_layer(l1, last_layer)))) + last_layer = new_layer + layers = l2 + else + push!(exprs, _chain_layer(layers, last_layer)) + break + end end - end - return Expr(:block, exprs...) + Expr(:block, exprs...) end diff --git a/test/common.jl b/test/common.jl index 7f7cd3cb78ea..035650e74f72 100644 --- a/test/common.jl +++ b/test/common.jl @@ -19,3 +19,9 @@ function mlp2() return out end +function mlpchain() + mx.@chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=1000) => + mx.Activation(act_type=:relu) => + mx.FullyConnected(name=:fc2, num_hidden=10) +end diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index 79f639518487..0e32446b9e0f 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -56,13 +56,13 @@ end function test_arithmetic() for T in [mx.fromTypeFlag(TF) for TF in instances(mx.TypeFlag)] - test_arithmetic(T, .+, (g,x,y) -> (g,g)) - test_arithmetic(T, .-, (g,x,y) -> (g,-g)) - test_arithmetic(T, .*, (g,x,y) -> (y.*g, x.*g)) + test_arithmetic(T, (x,y) -> x .+ y, (g,x,y) -> (g,g)) + test_arithmetic(T, (x,y) -> x .- y, (g,x,y) -> (g,-g)) + test_arithmetic(T, (x,y) -> x .* y, (g,x,y) -> (y.*g, x.*g)) if T <: Integer || T == Float16 warn("Not running division test for $T") else - test_arithmetic(T, ./, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) + test_arithmetic(T, 
(x,y) -> x ./ y, (g,x,y) -> (g ./ y, -x .* g ./ (y.^2))) end end end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 155f365d6ee8..69599960973f 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -73,7 +73,7 @@ function test_slice() array = mx.zeros((2,4)) array[2:3] = ones(2,2) @test copy(array) == [0 1 1 0; 0 1 1 0] - @test copy(slice(array, 2:3)) == [1 1; 1 1] + @test copy(mx.slice(array, 2:3)) == [1 1; 1 1] end function test_plus() diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 4c8cff8adccc..5d8d01b608db 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -2,7 +2,7 @@ module TestSymbolicNode using MXNet using Base.Test -using ..Main: mlp2, reldiff +using ..Main: mlp2, mlpchain, reldiff ################################################################################ # Test Implementations @@ -16,6 +16,15 @@ function test_basic() @test mx.list_auxiliary_states(model) == Symbol[] end +function test_chain() + info("SymbolicNode::chain") + + model = mlpchain() + @test mx.list_arguments(model) == [:data,:fc1_weight,:fc1_bias,:fc2_weight,:fc2_bias] + @test mx.list_outputs(model) == [:fc2_output] + @test mx.list_auxiliary_states(model) == Symbol[] +end + function test_internal() info("SymbolicNode::internal") @@ -140,6 +149,7 @@ end ################################################################################ @testset "SymbolicNode Test" begin test_basic() + test_chain() test_internal() test_compose() test_infer_shape() From 841e9ee0937df6587f5d24dfc9a8efed1e26de17 Mon Sep 17 00:00:00 2001 From: Michael Creel Date: Fri, 2 Jun 2017 14:42:53 +0200 Subject: [PATCH 492/630] update regression example for julia v0.6(#254) * update regression example for julia v0.6 Updated to work with julia 0.6.x. The plot is commented out for now. 
--- examples/regression-example.jl | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/examples/regression-example.jl b/examples/regression-example.jl index 508dfa79b308..885f031dc658 100644 --- a/examples/regression-example.jl +++ b/examples/regression-example.jl @@ -6,11 +6,11 @@ the predictions from the trained net. =# using MXNet using Distributions -using Plots +#using Plots # data generating process generate_inputs(mean, var, size) = rand(MvNormal(mean, var), size) -output(data) = sin(data[1,:]).*sin(data[2,:])./(data[1,:].*data[2,:]) +output(data) = sin.(data[1:1,:]).*sin.(data[2:2,:])./(data[1:1,:].*data[2:2,:]) # create training and evaluation data sets mean=[0.0;0.0] @@ -36,7 +36,7 @@ net = @mx.chain mx.Variable(:data) => mx.FullyConnected(num_hidden=3) => mx.Activation(act_type=:tanh) => mx.FullyConnected(num_hidden=1) => - mx.LinearRegressionOutput(label) + mx.LinearRegressionOutput(mx.Variable(:label)) # final model definition, don't change, except if using gpu model = mx.FeedForward(net, context=mx.cpu()) @@ -56,4 +56,5 @@ mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprov # obtain predictions plotprovider = mx.ArrayDataProvider(:data => ValidationInput, :label => ValidationOutput) fit = mx.predict(model, plotprovider) -scatter(ValidationOutput,fit',w = 3, xlabel="true", ylabel="predicted", title="45º line is what we hope for", show=true) +println("correlation between fitted values and true regression line: ", cor(vec(fit), vec(ValidationOutput))) +#scatter(ValidationOutput,fit',w = 3, xlabel="true", ylabel="predicted", title="45º line is what we hope for", show=true) From c965235765835e54204542f720c7a67b40e3e2f1 Mon Sep 17 00:00:00 2001 From: Josh Bode Date: Fri, 9 Jun 2017 17:16:45 +1000 Subject: [PATCH 493/630] Add extra check on CUDA library detection Some machines return a non-zero pointer for `Libdl.dlopen("")` causing MXNet dep build to incorrectly report presence of CUDA libraries. 
--- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 0b728e3edfb4..bc86af683b23 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -36,7 +36,7 @@ end HAS_CUDA = false let cudalib = Libdl.find_library(["libcuda", "nvcuda.dll"], CUDAPATHS) - HAS_CUDA = Libdl.dlopen_e(cudalib) != C_NULL + HAS_CUDA = !isempty(cudalib) && Libdl.dlopen_e(cudalib) != C_NULL end if !HAS_CUDA && is_windows() From e7d1b622b3ffa0d3c7cb2ed6bb7b1d8f2a70a1cd Mon Sep 17 00:00:00 2001 From: Josh Bode Date: Wed, 21 Jun 2017 01:19:36 +1000 Subject: [PATCH 494/630] Added cblas_[ds]tr[sm]m to cblas include file (#259) --- deps/cblas.h | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/deps/cblas.h b/deps/cblas.h index a99c8fc9920f..471550323882 100644 --- a/deps/cblas.h +++ b/deps/cblas.h @@ -48,6 +48,10 @@ typedef int blasint; #define cblas_dger cblas_dger64_ #define cblas_sdot cblas_sdot64_ #define cblas_ddot cblas_ddot64_ +#define cblas_strmm cblas_strmm64_ +#define cblas_dtrmm cblas_dtrmm64_ +#define cblas_strsm cblas_strsm64_ +#define cblas_dtrsm cblas_dtrsm64_ #endif @@ -72,6 +76,15 @@ void cblas_sgemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLA void cblas_dgemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double beta, double *C, OPENBLAS_CONST blasint ldc); +void cblas_strmm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, + OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST 
blasint lda, float *B, OPENBLAS_CONST blasint ldb); +void cblas_dtrmm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, + OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *B, OPENBLAS_CONST blasint ldb); +void cblas_strsm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, + OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *B, OPENBLAS_CONST blasint ldb); +void cblas_dtrsm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, + OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *B, OPENBLAS_CONST blasint ldb); + #ifdef __cplusplus } #endif /* __cplusplus */ From 10ad90bd20724bc63c480effbcab7892f28faf46 Mon Sep 17 00:00:00 2001 From: Josh Bode Date: Fri, 23 Jun 2017 23:48:24 +1000 Subject: [PATCH 495/630] Added MXNET_COMMIT env variable for upstream commit/tag (#260) Setting the `MXNET_COMMIT` environment variable to a tag, branch or hash will use that version of the upstream mxnet repo in building the libmxnet shared object. Additionally, the upstream submodules are cleared (and reinitialised) every build to prevent some issues when submodules make changes (squashes, etc). 
--- deps/build.jl | 9 +++++---- docs/src/user-guide/install.md | 5 ++++- 2 files changed, 9 insertions(+), 5 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index bc86af683b23..7ddce7ab4166 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -5,7 +5,7 @@ import JSON # First try to detect and load existing libmxnet ################################################################################ libmxnet_detected = false -libmxnet_curr_ver = "master" +libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "master") curr_win = "20170502" if haskey(ENV, "MXNET_HOME") @@ -138,14 +138,15 @@ if !libmxnet_detected @build_steps begin BinDeps.DirectoryRule(_mxdir, @build_steps begin ChangeDirectory(_srcdir) - `git clone --recursive https://github.com/dmlc/mxnet` + `git clone https://github.com/dmlc/mxnet` end) @build_steps begin ChangeDirectory(_mxdir) - `git -C mshadow checkout -- make/mshadow.mk` + `git submodule deinit --force .` `git fetch` `git checkout $libmxnet_curr_ver` - `git submodule update --init` + `git submodule update --init --recursive` + `git -C mshadow checkout -- make/mshadow.mk` `make clean` `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` end diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md index abc48dcf76c0..a585b4409c6d 100644 --- a/docs/src/user-guide/install.md +++ b/docs/src/user-guide/install.md @@ -21,10 +21,13 @@ MXNet.jl is built on top of [libmxnet](https://github.com/dmlc/mxnet). Upon installation, Julia will try to automatically download and build libmxnet. -There are two environment variables that change this behaviour. If you +There are three environment variables that change this behaviour. If you already have a pre-installed version of mxnet you can use `MXNET_HOME` to point the build-process in the right direction. If the automatic cuda detection fails you can also set `CUDA_HOME` to override the process. 
+To control which version of libmxnet will be compiled, you can use the +`MXNET_COMMIT` variable to point to either a version tag (e.g. `v0.10.0`), a +branch name (e.g. `master`) or a specific commit hash (e.g. `a0b1c2d3`). The libmxnet source is downloaded to `Pkg.dir("MXNet")/deps/src/mxnet`. The automatic build is using default configurations, with OpenCV disabled. From 0750c41dbbc6245e3c1c65b1a256f5008aababec Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 8 Sep 2017 18:59:13 +0800 Subject: [PATCH 496/630] build: bump curr_win to 20170819, MXNet 0.11.0 --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 7ddce7ab4166..c97ccaaec03a 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -6,7 +6,7 @@ import JSON ################################################################################ libmxnet_detected = false libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "master") -curr_win = "20170502" +curr_win = "20170819" if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") From 85a2d97ec058156706f93b51120b62ba52001d60 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 9 Sep 2017 21:36:51 +0800 Subject: [PATCH 497/630] ndarray: add kInt8 and kInt64 into TypeFlag enum Ref: * https://github.com/dmlc/mshadow/pull/244 * https://github.com/dmlc/mshadow/pull/258 --- src/ndarray.jl | 16 ++++++++++++---- 1 file changed, 12 insertions(+), 4 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 442f46d682ea..952c944dfbdd 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1,7 +1,7 @@ -# All the types supported by mshadow. -const DType = Union{Float32, Float64, Float16, UInt8, Int32} -@enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 -const DEFAULT_DTYPE = Float32 +# All the types supported by mshadow. 
See `mshadow/base.h` +const DType = Union{Float32, Float64, Float16, UInt8, Int32, Int8, Int64} +@enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 kInt8 kInt64 +const DEFAULT_DTYPE = Float32 # MSHADOW_DEFAULT_DTYPE function toTypeFlag{T <: DType}(:: Type{T}) if T == Float32 @@ -14,6 +14,10 @@ function toTypeFlag{T <: DType}(:: Type{T}) return kUint8 elseif T == Int32 return kInt32 + elseif T == Int8 + return kInt8 + elseif T == Int64 + return kInt64 else throw(ArgumentError("Can't convert $T to DType.")) end @@ -30,6 +34,10 @@ function fromTypeFlag(T :: TypeFlag) return UInt8 elseif T == kInt32 return Int32 + elseif T == kInt8 + return Int8 + elseif T == kInt64 + return Int64 else throw(ArgumentError("Can't convert DType $T.")) end From 873715b7e722431c9c642bbe783f76c184151b47 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 8 Sep 2017 11:41:20 +0800 Subject: [PATCH 498/630] cblas: import all func prototype into header Also, enable ILP64 symbol if INTERFACE64 defined --- deps/cblas.h | 478 +++++++++++++++++++++++++++++++++++++++++++++++++-- 1 file changed, 465 insertions(+), 13 deletions(-) diff --git a/deps/cblas.h b/deps/cblas.h index 471550323882..98a02f4fa968 100644 --- a/deps/cblas.h +++ b/deps/cblas.h @@ -2,7 +2,7 @@ #define CBLAS_H /* - * This file modified from the OpenBLAS repository, + * This file modified from the OpenBLAS repository. */ #include <stddef.h> @@ -39,21 +39,192 @@ typedef BLASLONG blasint; typedef int blasint; #endif +/* copy from openblas_config_template.h */ +/* C99 supports complex floating numbers natively, which GCC also offers as an + extension since version 3.0. If neither are available, use a compatible + structure as fallback (see Clause 6.2.5.13 of the C99 standard).
*/ +#if ((defined(__STDC_IEC_559_COMPLEX__) || __STDC_VERSION__ >= 199901L || \ + (__GNUC__ >= 3 && !defined(__cplusplus))) && !(defined(FORCE_OPENBLAS_COMPLEX_STRUCT))) +#ifndef __cplusplus + #include <complex.h> +#endif + typedef float _Complex openblas_complex_float; + typedef double _Complex openblas_complex_double; +#else + typedef struct { float real, imag; } openblas_complex_float; + typedef struct { double real, imag; } openblas_complex_double; +#endif + #ifdef INTERFACE64 -#define cblas_sgemm cblas_sgemm64_ -#define cblas_sgemv cblas_sgemv64_ -#define cblas_sger cblas_sger64_ -#define cblas_dgemm cblas_dgemm64_ -#define cblas_dgemv cblas_dgemv64_ -#define cblas_dger cblas_dger64_ -#define cblas_sdot cblas_sdot64_ -#define cblas_ddot cblas_ddot64_ -#define cblas_strmm cblas_strmm64_ -#define cblas_dtrmm cblas_dtrmm64_ -#define cblas_strsm cblas_strsm64_ -#define cblas_dtrsm cblas_dtrsm64_ +# define cblas_sdsdot cblas_sdsdot64_ +# define cblas_dsdot cblas_dsdot64_ +# define cblas_sdot cblas_sdot64_ +# define cblas_ddot cblas_ddot64_ +# define cblas_cdotu cblas_cdotu64_ +# define cblas_cdotc cblas_cdotc64_ +# define cblas_zdotu cblas_zdotu64_ +# define cblas_zdotc cblas_zdotc64_ +# define cblas_cdotu_sub cblas_cdotu_sub64_ +# define cblas_cdotc_sub cblas_cdotc_sub64_ +# define cblas_zdotu_sub cblas_zdotu_sub64_ +# define cblas_zdotc_sub cblas_zdotc_sub64_ +# define cblas_sasum cblas_sasum64_ +# define cblas_dasum cblas_dasum64_ +# define cblas_scasum cblas_scasum64_ +# define cblas_dzasum cblas_dzasum64_ +# define cblas_snrm2 cblas_snrm264_ +# define cblas_dnrm2 cblas_dnrm264_ +# define cblas_scnrm2 cblas_scnrm264_ +# define cblas_dznrm2 cblas_dznrm264_ +# define cblas_isamax cblas_isamax64_ +# define cblas_idamax cblas_idamax64_ +# define cblas_icamax cblas_icamax64_ +# define cblas_izamax cblas_izamax64_ +# define cblas_saxpy cblas_saxpy64_ +# define cblas_daxpy cblas_daxpy64_ +# define cblas_caxpy cblas_caxpy64_ +# define cblas_zaxpy cblas_zaxpy64_ +# define
cblas_scopy cblas_scopy64_ +# define cblas_dcopy cblas_dcopy64_ +# define cblas_ccopy cblas_ccopy64_ +# define cblas_zcopy cblas_zcopy64_ +# define cblas_sswap cblas_sswap64_ +# define cblas_dswap cblas_dswap64_ +# define cblas_cswap cblas_cswap64_ +# define cblas_zswap cblas_zswap64_ +# define cblas_srot cblas_srot64_ +# define cblas_drot cblas_drot64_ +# define cblas_srotg cblas_srotg64_ +# define cblas_drotg cblas_drotg64_ +# define cblas_srotm cblas_srotm64_ +# define cblas_drotm cblas_drotm64_ +# define cblas_srotmg cblas_srotmg64_ +# define cblas_drotmg cblas_drotmg64_ +# define cblas_sscal cblas_sscal64_ +# define cblas_dscal cblas_dscal64_ +# define cblas_cscal cblas_cscal64_ +# define cblas_zscal cblas_zscal64_ +# define cblas_csscal cblas_csscal64_ +# define cblas_zdscal cblas_zdscal64_ +# define cblas_sgemv cblas_sgemv64_ +# define cblas_dgemv cblas_dgemv64_ +# define cblas_cgemv cblas_cgemv64_ +# define cblas_zgemv cblas_zgemv64_ +# define cblas_sger cblas_sger64_ +# define cblas_dger cblas_dger64_ +# define cblas_cgeru cblas_cgeru64_ +# define cblas_cgerc cblas_cgerc64_ +# define cblas_zgeru cblas_zgeru64_ +# define cblas_zgerc cblas_zgerc64_ +# define cblas_strsv cblas_strsv64_ +# define cblas_dtrsv cblas_dtrsv64_ +# define cblas_ctrsv cblas_ctrsv64_ +# define cblas_ztrsv cblas_ztrsv64_ +# define cblas_strmv cblas_strmv64_ +# define cblas_dtrmv cblas_dtrmv64_ +# define cblas_ctrmv cblas_ctrmv64_ +# define cblas_ztrmv cblas_ztrmv64_ +# define cblas_ssyr cblas_ssyr64_ +# define cblas_dsyr cblas_dsyr64_ +# define cblas_cher cblas_cher64_ +# define cblas_zher cblas_zher64_ +# define cblas_ssyr2 cblas_ssyr264_ +# define cblas_dsyr2 cblas_dsyr264_ +# define cblas_cher2 cblas_cher264_ +# define cblas_zher2 cblas_zher264_ +# define cblas_sgbmv cblas_sgbmv64_ +# define cblas_dgbmv cblas_dgbmv64_ +# define cblas_cgbmv cblas_cgbmv64_ +# define cblas_zgbmv cblas_zgbmv64_ +# define cblas_ssbmv cblas_ssbmv64_ +# define cblas_dsbmv cblas_dsbmv64_ +# define 
cblas_stbmv cblas_stbmv64_ +# define cblas_dtbmv cblas_dtbmv64_ +# define cblas_ctbmv cblas_ctbmv64_ +# define cblas_ztbmv cblas_ztbmv64_ +# define cblas_stbsv cblas_stbsv64_ +# define cblas_dtbsv cblas_dtbsv64_ +# define cblas_ctbsv cblas_ctbsv64_ +# define cblas_ztbsv cblas_ztbsv64_ +# define cblas_stpmv cblas_stpmv64_ +# define cblas_dtpmv cblas_dtpmv64_ +# define cblas_ctpmv cblas_ctpmv64_ +# define cblas_ztpmv cblas_ztpmv64_ +# define cblas_stpsv cblas_stpsv64_ +# define cblas_dtpsv cblas_dtpsv64_ +# define cblas_ctpsv cblas_ctpsv64_ +# define cblas_ztpsv cblas_ztpsv64_ +# define cblas_ssymv cblas_ssymv64_ +# define cblas_dsymv cblas_dsymv64_ +# define cblas_chemv cblas_chemv64_ +# define cblas_zhemv cblas_zhemv64_ +# define cblas_sspmv cblas_sspmv64_ +# define cblas_dspmv cblas_dspmv64_ +# define cblas_sspr cblas_sspr64_ +# define cblas_dspr cblas_dspr64_ +# define cblas_chpr cblas_chpr64_ +# define cblas_zhpr cblas_zhpr64_ +# define cblas_sspr2 cblas_sspr264_ +# define cblas_dspr2 cblas_dspr264_ +# define cblas_chpr2 cblas_chpr264_ +# define cblas_zhpr2 cblas_zhpr264_ +# define cblas_chbmv cblas_chbmv64_ +# define cblas_zhbmv cblas_zhbmv64_ +# define cblas_chpmv cblas_chpmv64_ +# define cblas_zhpmv cblas_zhpmv64_ +# define cblas_sgemm cblas_sgemm64_ +# define cblas_dgemm cblas_dgemm64_ +# define cblas_cgemm cblas_cgemm64_ +# define cblas_cgemm3m cblas_cgemm3m64_ +# define cblas_zgemm cblas_zgemm64_ +# define cblas_zgemm3m cblas_zgemm3m64_ +# define cblas_ssymm cblas_ssymm64_ +# define cblas_dsymm cblas_dsymm64_ +# define cblas_csymm cblas_csymm64_ +# define cblas_zsymm cblas_zsymm64_ +# define cblas_ssyrk cblas_ssyrk64_ +# define cblas_dsyrk cblas_dsyrk64_ +# define cblas_csyrk cblas_csyrk64_ +# define cblas_zsyrk cblas_zsyrk64_ +# define cblas_ssyr2k cblas_ssyr2k64_ +# define cblas_dsyr2k cblas_dsyr2k64_ +# define cblas_csyr2k cblas_csyr2k64_ +# define cblas_zsyr2k cblas_zsyr2k64_ +# define cblas_strmm cblas_strmm64_ +# define cblas_dtrmm cblas_dtrmm64_ +# 
define cblas_ctrmm cblas_ctrmm64_ +# define cblas_ztrmm cblas_ztrmm64_ +# define cblas_strsm cblas_strsm64_ +# define cblas_dtrsm cblas_dtrsm64_ +# define cblas_ctrsm cblas_ctrsm64_ +# define cblas_ztrsm cblas_ztrsm64_ +# define cblas_chemm cblas_chemm64_ +# define cblas_zhemm cblas_zhemm64_ +# define cblas_cherk cblas_cherk64_ +# define cblas_zherk cblas_zherk64_ +# define cblas_cher2k cblas_cher2k64_ +# define cblas_zher2k cblas_zher2k64_ +# define cblas_xerbla cblas_xerbla64_ +# define cblas_saxpby cblas_saxpby64_ +# define cblas_daxpby cblas_daxpby64_ +# define cblas_caxpby cblas_caxpby64_ +# define cblas_zaxpby cblas_zaxpby64_ +# define cblas_somatcopy cblas_somatcopy64_ +# define cblas_domatcopy cblas_domatcopy64_ +# define cblas_comatcopy cblas_comatcopy64_ +# define cblas_zomatcopy cblas_zomatcopy64_ +# define cblas_simatcopy cblas_simatcopy64_ +# define cblas_dimatcopy cblas_dimatcopy64_ +# define cblas_cimatcopy cblas_cimatcopy64_ +# define cblas_zimatcopy cblas_zimatcopy64_ +# define cblas_sgeadd cblas_sgeadd64_ +# define cblas_dgeadd cblas_dgeadd64_ +# define cblas_cgeadd cblas_cgeadd64_ +# define cblas_zgeadd cblas_zgeadd64_ #endif +#define CBLAS_INDEX size_t + typedef enum CBLAS_ORDER {CblasRowMajor=101, CblasColMajor=102} CBLAS_ORDER; typedef enum CBLAS_TRANSPOSE {CblasNoTrans=111, CblasTrans=112, CblasConjTrans=113, CblasConjNoTrans=114} CBLAS_TRANSPOSE; @@ -61,29 +232,310 @@ typedef enum CBLAS_UPLO {CblasUpper=121, CblasLower=122} CBLAS_UPLO; typedef enum CBLAS_DIAG {CblasNonUnit=131, CblasUnit=132} CBLAS_DIAG; typedef enum CBLAS_SIDE {CblasLeft=141, CblasRight=142} CBLAS_SIDE; +float cblas_sdsdot(OPENBLAS_CONST blasint n, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *y, OPENBLAS_CONST blasint incy); +double cblas_dsdot (OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *y, OPENBLAS_CONST blasint incy); float cblas_sdot(OPENBLAS_CONST 
blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *y, OPENBLAS_CONST blasint incy); double cblas_ddot(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double *y, OPENBLAS_CONST blasint incy); +openblas_complex_float cblas_cdotu(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *y, OPENBLAS_CONST blasint incy); +openblas_complex_float cblas_cdotc(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *y, OPENBLAS_CONST blasint incy); +openblas_complex_double cblas_zdotu(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double *y, OPENBLAS_CONST blasint incy); +openblas_complex_double cblas_zdotc(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double *y, OPENBLAS_CONST blasint incy); + +void cblas_cdotu_sub(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *y, OPENBLAS_CONST blasint incy, openblas_complex_float *ret); +void cblas_cdotc_sub(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *y, OPENBLAS_CONST blasint incy, openblas_complex_float *ret); +void cblas_zdotu_sub(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double *y, OPENBLAS_CONST blasint incy, openblas_complex_double *ret); +void cblas_zdotc_sub(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double *y, OPENBLAS_CONST blasint incy, openblas_complex_double *ret); + +float cblas_sasum (OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx); +double cblas_dasum (OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx); +float cblas_scasum(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, 
OPENBLAS_CONST blasint incx); +double cblas_dzasum(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx); + +float cblas_snrm2 (OPENBLAS_CONST blasint N, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX); +double cblas_dnrm2 (OPENBLAS_CONST blasint N, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX); +float cblas_scnrm2(OPENBLAS_CONST blasint N, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX); +double cblas_dznrm2(OPENBLAS_CONST blasint N, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX); + +CBLAS_INDEX cblas_isamax(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx); +CBLAS_INDEX cblas_idamax(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx); +CBLAS_INDEX cblas_icamax(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx); +CBLAS_INDEX cblas_izamax(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx); + +void cblas_saxpy(OPENBLAS_CONST blasint n, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, float *y, OPENBLAS_CONST blasint incy); +void cblas_daxpy(OPENBLAS_CONST blasint n, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, double *y, OPENBLAS_CONST blasint incy); +void cblas_caxpy(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, float *y, OPENBLAS_CONST blasint incy); +void cblas_zaxpy(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, double *y, OPENBLAS_CONST blasint incy); + +void cblas_scopy(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, float *y, OPENBLAS_CONST blasint incy); +void cblas_dcopy(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, double *y, OPENBLAS_CONST blasint incy); +void cblas_ccopy(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *x, 
OPENBLAS_CONST blasint incx, float *y, OPENBLAS_CONST blasint incy); +void cblas_zcopy(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, double *y, OPENBLAS_CONST blasint incy); + +void cblas_sswap(OPENBLAS_CONST blasint n, float *x, OPENBLAS_CONST blasint incx, float *y, OPENBLAS_CONST blasint incy); +void cblas_dswap(OPENBLAS_CONST blasint n, double *x, OPENBLAS_CONST blasint incx, double *y, OPENBLAS_CONST blasint incy); +void cblas_cswap(OPENBLAS_CONST blasint n, float *x, OPENBLAS_CONST blasint incx, float *y, OPENBLAS_CONST blasint incy); +void cblas_zswap(OPENBLAS_CONST blasint n, double *x, OPENBLAS_CONST blasint incx, double *y, OPENBLAS_CONST blasint incy); + +void cblas_srot(OPENBLAS_CONST blasint N, float *X, OPENBLAS_CONST blasint incX, float *Y, OPENBLAS_CONST blasint incY, OPENBLAS_CONST float c, OPENBLAS_CONST float s); +void cblas_drot(OPENBLAS_CONST blasint N, double *X, OPENBLAS_CONST blasint incX, double *Y, OPENBLAS_CONST blasint incY, OPENBLAS_CONST double c, OPENBLAS_CONST double s); + +void cblas_srotg(float *a, float *b, float *c, float *s); +void cblas_drotg(double *a, double *b, double *c, double *s); + +void cblas_srotm(OPENBLAS_CONST blasint N, float *X, OPENBLAS_CONST blasint incX, float *Y, OPENBLAS_CONST blasint incY, OPENBLAS_CONST float *P); +void cblas_drotm(OPENBLAS_CONST blasint N, double *X, OPENBLAS_CONST blasint incX, double *Y, OPENBLAS_CONST blasint incY, OPENBLAS_CONST double *P); + +void cblas_srotmg(float *d1, float *d2, float *b1, OPENBLAS_CONST float b2, float *P); +void cblas_drotmg(double *d1, double *d2, double *b1, OPENBLAS_CONST double b2, double *P); + +void cblas_sscal(OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, float *X, OPENBLAS_CONST blasint incX); +void cblas_dscal(OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, double *X, OPENBLAS_CONST blasint incX); +void cblas_cscal(OPENBLAS_CONST blasint N, OPENBLAS_CONST float *alpha, float *X, OPENBLAS_CONST blasint 
incX); +void cblas_zscal(OPENBLAS_CONST blasint N, OPENBLAS_CONST double *alpha, double *X, OPENBLAS_CONST blasint incX); +void cblas_csscal(OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, float *X, OPENBLAS_CONST blasint incX); +void cblas_zdscal(OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, double *X, OPENBLAS_CONST blasint incX); + void cblas_sgemv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE trans, OPENBLAS_CONST blasint m, OPENBLAS_CONST blasint n, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *a, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float beta, float *y, OPENBLAS_CONST blasint incy); void cblas_dgemv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE trans, OPENBLAS_CONST blasint m, OPENBLAS_CONST blasint n, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *a, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double beta, double *y, OPENBLAS_CONST blasint incy); +void cblas_cgemv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE trans, OPENBLAS_CONST blasint m, OPENBLAS_CONST blasint n, + OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *a, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST float *beta, float *y, OPENBLAS_CONST blasint incy); +void cblas_zgemv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE trans, OPENBLAS_CONST blasint m, OPENBLAS_CONST blasint n, + OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *a, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx, OPENBLAS_CONST double *beta, double *y, OPENBLAS_CONST blasint incy); + void cblas_sger (OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float 
*Y, OPENBLAS_CONST blasint incY, float *A, OPENBLAS_CONST blasint lda); void cblas_dger (OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *Y, OPENBLAS_CONST blasint incY, double *A, OPENBLAS_CONST blasint lda); +void cblas_cgeru(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *Y, OPENBLAS_CONST blasint incY, float *A, OPENBLAS_CONST blasint lda); +void cblas_cgerc(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *Y, OPENBLAS_CONST blasint incY, float *A, OPENBLAS_CONST blasint lda); +void cblas_zgeru(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *Y, OPENBLAS_CONST blasint incY, double *A, OPENBLAS_CONST blasint lda); +void cblas_zgerc(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *Y, OPENBLAS_CONST blasint incY, double *A, OPENBLAS_CONST blasint lda); + +void cblas_strsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *X, OPENBLAS_CONST blasint incX); +void cblas_dtrsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST 
blasint N, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *X, OPENBLAS_CONST blasint incX); +void cblas_ctrsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *X, OPENBLAS_CONST blasint incX); +void cblas_ztrsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *X, OPENBLAS_CONST blasint incX); + +void cblas_strmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *X, OPENBLAS_CONST blasint incX); +void cblas_dtrmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *X, OPENBLAS_CONST blasint incX); +void cblas_ctrmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *X, OPENBLAS_CONST blasint incX); +void cblas_ztrmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *X, OPENBLAS_CONST blasint incX); + +void cblas_ssyr(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, 
OPENBLAS_CONST float alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, float *A, OPENBLAS_CONST blasint lda); +void cblas_dsyr(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, double *A, OPENBLAS_CONST blasint lda); +void cblas_cher(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, float *A, OPENBLAS_CONST blasint lda); +void cblas_zher(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, double *A, OPENBLAS_CONST blasint lda); + +void cblas_ssyr2(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo,OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *X, + OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *Y, OPENBLAS_CONST blasint incY, float *A, OPENBLAS_CONST blasint lda); +void cblas_dsyr2(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *X, + OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *Y, OPENBLAS_CONST blasint incY, double *A, OPENBLAS_CONST blasint lda); +void cblas_cher2(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, + OPENBLAS_CONST float *Y, OPENBLAS_CONST blasint incY, float *A, OPENBLAS_CONST blasint lda); +void cblas_zher2(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, + OPENBLAS_CONST double *Y, OPENBLAS_CONST blasint 
incY, double *A, OPENBLAS_CONST blasint lda); + +void cblas_sgbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST blasint KL, OPENBLAS_CONST blasint KU, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float beta, float *Y, OPENBLAS_CONST blasint incY); +void cblas_dgbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST blasint KL, OPENBLAS_CONST blasint KU, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double beta, double *Y, OPENBLAS_CONST blasint incY); +void cblas_cgbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST blasint KL, OPENBLAS_CONST blasint KU, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *beta, float *Y, OPENBLAS_CONST blasint incY); +void cblas_zgbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST blasint KL, OPENBLAS_CONST blasint KU, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *beta, double *Y, OPENBLAS_CONST blasint incY); + +void cblas_ssbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, + OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, 
OPENBLAS_CONST float beta, float *Y, OPENBLAS_CONST blasint incY); +void cblas_dsbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, + OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double beta, double *Y, OPENBLAS_CONST blasint incY); + + +void cblas_stbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *X, OPENBLAS_CONST blasint incX); +void cblas_dtbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *X, OPENBLAS_CONST blasint incX); +void cblas_ctbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *X, OPENBLAS_CONST blasint incX); +void cblas_ztbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *X, OPENBLAS_CONST blasint incX); + +void cblas_stbsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint 
lda, float *X, OPENBLAS_CONST blasint incX); +void cblas_dtbsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *X, OPENBLAS_CONST blasint incX); +void cblas_ctbsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *X, OPENBLAS_CONST blasint incX); +void cblas_ztbsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *X, OPENBLAS_CONST blasint incX); + +void cblas_stpmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST float *Ap, float *X, OPENBLAS_CONST blasint incX); +void cblas_dtpmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST double *Ap, double *X, OPENBLAS_CONST blasint incX); +void cblas_ctpmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST float *Ap, float *X, OPENBLAS_CONST blasint incX); +void cblas_ztpmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG 
Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST double *Ap, double *X, OPENBLAS_CONST blasint incX); + +void cblas_stpsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST float *Ap, float *X, OPENBLAS_CONST blasint incX); +void cblas_dtpsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST double *Ap, double *X, OPENBLAS_CONST blasint incX); +void cblas_ctpsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST float *Ap, float *X, OPENBLAS_CONST blasint incX); +void cblas_ztpsv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, + OPENBLAS_CONST blasint N, OPENBLAS_CONST double *Ap, double *X, OPENBLAS_CONST blasint incX); + +void cblas_ssymv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, + OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float beta, float *Y, OPENBLAS_CONST blasint incY); +void cblas_dsymv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, + OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double beta, double *Y, OPENBLAS_CONST blasint incY); +void cblas_chemv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *alpha, 
OPENBLAS_CONST float *A, + OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *beta, float *Y, OPENBLAS_CONST blasint incY); +void cblas_zhemv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, + OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *beta, double *Y, OPENBLAS_CONST blasint incY); + + +void cblas_sspmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *Ap, + OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float beta, float *Y, OPENBLAS_CONST blasint incY); +void cblas_dspmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *Ap, + OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double beta, double *Y, OPENBLAS_CONST blasint incY); + +void cblas_sspr(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, float *Ap); +void cblas_dspr(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, double *Ap); + +void cblas_chpr(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, float *A); +void cblas_zhpr(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *X,OPENBLAS_CONST blasint incX, double *A); + +void 
cblas_sspr2(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *Y, OPENBLAS_CONST blasint incY, float *A); +void cblas_dspr2(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *Y, OPENBLAS_CONST blasint incY, double *A); +void cblas_chpr2(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *Y, OPENBLAS_CONST blasint incY, float *Ap); +void cblas_zhpr2(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *Y, OPENBLAS_CONST blasint incY, double *Ap); + +void cblas_chbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *beta, float *Y, OPENBLAS_CONST blasint incY); +void cblas_zhbmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *beta, double *Y, OPENBLAS_CONST blasint incY); + +void cblas_chpmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, + OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *Ap, OPENBLAS_CONST float *X, 
OPENBLAS_CONST blasint incX, OPENBLAS_CONST float *beta, float *Y, OPENBLAS_CONST blasint incY); +void cblas_zhpmv(OPENBLAS_CONST enum CBLAS_ORDER order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint N, + OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *Ap, OPENBLAS_CONST double *X, OPENBLAS_CONST blasint incX, OPENBLAS_CONST double *beta, double *Y, OPENBLAS_CONST blasint incY); void cblas_sgemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float beta, float *C, OPENBLAS_CONST blasint ldc); void cblas_dgemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double beta, double *C, OPENBLAS_CONST blasint ldc); +void cblas_cgemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float *beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_cgemm3m(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, 
OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float *beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_zgemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double *beta, double *C, OPENBLAS_CONST blasint ldc); +void cblas_zgemm3m(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransB, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double *beta, double *C, OPENBLAS_CONST blasint ldc); + + +void cblas_ssymm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_dsymm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double beta, double *C, OPENBLAS_CONST blasint ldc); +void cblas_csymm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST float *alpha, OPENBLAS_CONST float 
*A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float *beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_zsymm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double *beta, double *C, OPENBLAS_CONST blasint ldc); + +void cblas_ssyrk(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_dsyrk(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double beta, double *C, OPENBLAS_CONST blasint ldc); +void cblas_csyrk(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_zsyrk(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *beta, double *C, OPENBLAS_CONST blasint ldc); + +void cblas_ssyr2k(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum 
CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_dsyr2k(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double beta, double *C, OPENBLAS_CONST blasint ldc); +void cblas_csyr2k(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float *beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_zsyr2k(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, + OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double *beta, double *C, OPENBLAS_CONST blasint ldc); void cblas_strmm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *B, OPENBLAS_CONST blasint ldb); void cblas_dtrmm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum 
CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *B, OPENBLAS_CONST blasint ldb); +void cblas_ctrmm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, + OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *B, OPENBLAS_CONST blasint ldb); +void cblas_ztrmm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, + OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *B, OPENBLAS_CONST blasint ldb); + void cblas_strsm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *B, OPENBLAS_CONST blasint ldb); void cblas_dtrsm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *B, OPENBLAS_CONST blasint ldb); +void cblas_ctrsm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, + 
OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, float *B, OPENBLAS_CONST blasint ldb); +void cblas_ztrsm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE TransA, + OPENBLAS_CONST enum CBLAS_DIAG Diag, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, double *B, OPENBLAS_CONST blasint ldb); + +void cblas_chemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float *beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_zhemm(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_SIDE Side, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST blasint M, OPENBLAS_CONST blasint N, + OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double *beta, double *C, OPENBLAS_CONST blasint ldc); + +void cblas_cherk(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST float alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_zherk(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST double alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, 
OPENBLAS_CONST double beta, double *C, OPENBLAS_CONST blasint ldc); + +void cblas_cher2k(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST float *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST float beta, float *C, OPENBLAS_CONST blasint ldc); +void cblas_zher2k(OPENBLAS_CONST enum CBLAS_ORDER Order, OPENBLAS_CONST enum CBLAS_UPLO Uplo, OPENBLAS_CONST enum CBLAS_TRANSPOSE Trans, OPENBLAS_CONST blasint N, OPENBLAS_CONST blasint K, + OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *A, OPENBLAS_CONST blasint lda, OPENBLAS_CONST double *B, OPENBLAS_CONST blasint ldb, OPENBLAS_CONST double beta, double *C, OPENBLAS_CONST blasint ldc); + +void cblas_xerbla(blasint p, char *rout, char *form, ...); + +/*** BLAS extensions ***/ + +void cblas_saxpby(OPENBLAS_CONST blasint n, OPENBLAS_CONST float alpha, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx,OPENBLAS_CONST float beta, float *y, OPENBLAS_CONST blasint incy); + +void cblas_daxpby(OPENBLAS_CONST blasint n, OPENBLAS_CONST double alpha, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx,OPENBLAS_CONST double beta, double *y, OPENBLAS_CONST blasint incy); + +void cblas_caxpby(OPENBLAS_CONST blasint n, OPENBLAS_CONST float *alpha, OPENBLAS_CONST float *x, OPENBLAS_CONST blasint incx,OPENBLAS_CONST float *beta, float *y, OPENBLAS_CONST blasint incy); + +void cblas_zaxpby(OPENBLAS_CONST blasint n, OPENBLAS_CONST double *alpha, OPENBLAS_CONST double *x, OPENBLAS_CONST blasint incx,OPENBLAS_CONST double *beta, double *y, OPENBLAS_CONST blasint incy); + +void cblas_somatcopy(OPENBLAS_CONST enum CBLAS_ORDER CORDER, OPENBLAS_CONST enum CBLAS_TRANSPOSE CTRANS, OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST float calpha, OPENBLAS_CONST float *a, + OPENBLAS_CONST blasint clda, 
float *b, OPENBLAS_CONST blasint cldb); +void cblas_domatcopy(OPENBLAS_CONST enum CBLAS_ORDER CORDER, OPENBLAS_CONST enum CBLAS_TRANSPOSE CTRANS, OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST double calpha, OPENBLAS_CONST double *a, + OPENBLAS_CONST blasint clda, double *b, OPENBLAS_CONST blasint cldb); +void cblas_comatcopy(OPENBLAS_CONST enum CBLAS_ORDER CORDER, OPENBLAS_CONST enum CBLAS_TRANSPOSE CTRANS, OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST float* calpha, OPENBLAS_CONST float* a, + OPENBLAS_CONST blasint clda, float*b, OPENBLAS_CONST blasint cldb); +void cblas_zomatcopy(OPENBLAS_CONST enum CBLAS_ORDER CORDER, OPENBLAS_CONST enum CBLAS_TRANSPOSE CTRANS, OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST double* calpha, OPENBLAS_CONST double* a, + OPENBLAS_CONST blasint clda, double *b, OPENBLAS_CONST blasint cldb); + +void cblas_simatcopy(OPENBLAS_CONST enum CBLAS_ORDER CORDER, OPENBLAS_CONST enum CBLAS_TRANSPOSE CTRANS, OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST float calpha, float *a, + OPENBLAS_CONST blasint clda, OPENBLAS_CONST blasint cldb); +void cblas_dimatcopy(OPENBLAS_CONST enum CBLAS_ORDER CORDER, OPENBLAS_CONST enum CBLAS_TRANSPOSE CTRANS, OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST double calpha, double *a, + OPENBLAS_CONST blasint clda, OPENBLAS_CONST blasint cldb); +void cblas_cimatcopy(OPENBLAS_CONST enum CBLAS_ORDER CORDER, OPENBLAS_CONST enum CBLAS_TRANSPOSE CTRANS, OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST float* calpha, float* a, + OPENBLAS_CONST blasint clda, OPENBLAS_CONST blasint cldb); +void cblas_zimatcopy(OPENBLAS_CONST enum CBLAS_ORDER CORDER, OPENBLAS_CONST enum CBLAS_TRANSPOSE CTRANS, OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST double* calpha, double* a, + OPENBLAS_CONST blasint clda, OPENBLAS_CONST blasint cldb); + +void 
cblas_sgeadd(OPENBLAS_CONST enum CBLAS_ORDER CORDER,OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST float calpha, float *a, OPENBLAS_CONST blasint clda, OPENBLAS_CONST float cbeta, + float *c, OPENBLAS_CONST blasint cldc); +void cblas_dgeadd(OPENBLAS_CONST enum CBLAS_ORDER CORDER,OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST double calpha, double *a, OPENBLAS_CONST blasint clda, OPENBLAS_CONST double cbeta, + double *c, OPENBLAS_CONST blasint cldc); +void cblas_cgeadd(OPENBLAS_CONST enum CBLAS_ORDER CORDER,OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST float *calpha, float *a, OPENBLAS_CONST blasint clda, OPENBLAS_CONST float *cbeta, + float *c, OPENBLAS_CONST blasint cldc); +void cblas_zgeadd(OPENBLAS_CONST enum CBLAS_ORDER CORDER,OPENBLAS_CONST blasint crows, OPENBLAS_CONST blasint ccols, OPENBLAS_CONST double *calpha, double *a, OPENBLAS_CONST blasint clda, OPENBLAS_CONST double *cbeta, + double *c, OPENBLAS_CONST blasint cldc); + #ifdef __cplusplus } From 4e5ab13edd3afbefd80eeca0e8c462d34fb62fe3 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 6 Sep 2017 10:55:03 +0800 Subject: [PATCH 499/630] travis : set make -j4 and travis_wait * change the number of make jobs to prevent out-of-memory issues * travis_wait is a workaround for https://github.com/JuliaLang/julia/pull/23601 --- .travis.yml | 5 ++++- deps/build.jl | 12 ++++++++++-- 2 files changed, 14 insertions(+), 3 deletions(-) diff --git a/.travis.yml b/.travis.yml index 708b5392fd3e..2f7dee479a68 100644 --- a/.travis.yml +++ b/.travis.yml @@ -35,7 +35,10 @@ notifications: email: false script: - - source $TRAVIS/run_test.sh + # bump the time limit of no ouput + # the `travis_wait` wrapper can be removed once this issue fixed: + # https://github.com/JuliaLang/julia/pull/23601 + - travis_wait 60 $TRAVIS/run_test.sh after_success: - source $TRAVIS/run_coverage.sh diff --git a/deps/build.jl b/deps/build.jl index
c97ccaaec03a..aef054a8e52f 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -53,6 +53,14 @@ else info("Did not find a CUDA installation, using CPU-only version of MXNet.") end +function get_cpucore() + if haskey(ENV, "TRAVIS") # on travis-ci + 4 + else + min(Sys.CPU_CORES, 8) + end +end + using BinDeps @BinDeps.setup if !libmxnet_detected @@ -169,9 +177,9 @@ if !libmxnet_detected ChangeDirectory(_mxdir) `cp ../../cblas.h include/cblas.h` if USE_JULIA_BLAS - `make -j$(min(Sys.CPU_CORES,8)) USE_BLAS=$blas_name $MSHADOW_LDFLAGS` + `make -j$(get_cpucore()) USE_BLAS=$blas_name $MSHADOW_LDFLAGS` else - `make -j$(min(Sys.CPU_CORES,8))` + `make -j$(get_cpucore())` end end FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin From d1bbcc4a821e9862a671817d7f75521638d6a558 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 1 Sep 2017 14:16:02 +0800 Subject: [PATCH 500/630] base/build: using `Libdl.dlext` for searching lib --- deps/build.jl | 11 +++++++---- src/base.jl | 9 +++++---- 2 files changed, 12 insertions(+), 8 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index c97ccaaec03a..03f57bcf0094 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -11,7 +11,8 @@ curr_win = "20170819" if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") info("Trying to load existing libmxnet...") - lib = Libdl.find_library(["libmxnet", "libmxnet.so"], ["$(ENV["MXNET_HOME"])/lib"]) + lib = Libdl.find_library("libmxnet.$(Libdl.dlext)", + ["$(ENV["MXNET_HOME"])/lib"]) if !isempty(lib) info("Existing libmxnet detected at $lib, skip building...") libmxnet_detected = true @@ -130,7 +131,7 @@ if !libmxnet_detected _libdir = joinpath(_prefix, "lib") # We have do eagerly delete the installed libmxnet.so # Otherwise we won't rebuild on an update. 
- run(`rm -f $_libdir/libmxnet.so`) + run(`rm -f $_libdir/libmxnet.$(Libdl.dlext)`) provides(BuildProcess, (@build_steps begin CreateDirectory(_srcdir) @@ -174,8 +175,10 @@ if !libmxnet_detected `make -j$(min(Sys.CPU_CORES,8))` end end - FileRule(joinpath(_libdir, "libmxnet.so"), @build_steps begin - `cp $_mxdir/lib/libmxnet.so $_libdir/` + FileRule(joinpath(_libdir, "libmxnet.$(Libdl.dlext)"), @build_steps begin + # the output file on macos is still in `.so` suffix + # so we rename it + `cp $_mxdir/lib/libmxnet.so $_libdir/libmxnet.$(Libdl.dlext)` end) end end), mxnet, installed_libpath=_libdir) diff --git a/src/base.jl b/src/base.jl index dd816dd41582..4f004f452f28 100644 --- a/src/base.jl +++ b/src/base.jl @@ -16,14 +16,15 @@ const char_pp = Ptr{char_p} ################################################################################ # Initialization and library API entrance ################################################################################ -const MXNET_LIB = Libdl.find_library(["libmxnet.so","libmxnet.dll"], - [joinpath("$(get(ENV,"MXNET_HOME",""))","lib"), - Pkg.dir("MXNet","deps","usr","lib")]) +const MXNET_LIB = Libdl.find_library("libmxnet.$(Libdl.dlext)", + [joinpath(get(ENV, "MXNET_HOME", ""), "lib"), + Pkg.dir("MXNet", "deps", "usr", "lib")]) if isempty(MXNET_LIB) # touch this file, so that after the user properly build libmxnet, the precompiled # MXNet.ji will be re-compiled to get MXNET_LIB properly. touch(@__FILE__) - error("Cannot find or load libmxnet.so. Please see the document on how to build it.") + error("Cannot find or load libmxnet.$(Libdl.dlext). 
" * + "Please see the document on how to build it.") else include_dependency(MXNET_LIB) end From 0d54f4b7cfb4f744bb4a8e3a81539c6abf2f16f2 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 9 Sep 2017 15:50:30 +0800 Subject: [PATCH 501/630] build: force enable LAPACK when Julia's OpenBLAS is available --- deps/build.jl | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/deps/build.jl b/deps/build.jl index c97ccaaec03a..7bf6372acebb 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -105,6 +105,7 @@ if !libmxnet_detected ilp64 = "-DINTERFACE64" end + FORCE_LAPACK = false if blas_vendor == :unknown info("Julia is built with an unkown blas library ($blas_path).") info("Attempting build without reusing the blas library") @@ -115,6 +116,7 @@ if !libmxnet_detected USE_JULIA_BLAS = true else USE_JULIA_BLAS = true + FORCE_LAPACK = true end blas_name = blas_vendor == :openblas64 ? "openblas" : string(blas_vendor) @@ -164,6 +166,11 @@ if !libmxnet_detected `sed -i -s 's/USE_CUDA_PATH = NULL/USE_CUDA_PATH = $(ENV["CUDA_HOME"])/' config.mk` end end + # Force enable LAPACK build + # Julia's OpenBLAS has LAPACK functionality already + if FORCE_LAPACK + `sed -i -s 's/ADD_CFLAGS =\(.*\)/ADD_CFLAGS =\1 -DMXNET_USE_LAPACK/' config.mk` + end end) @build_steps begin ChangeDirectory(_mxdir) From 23866bd640ad39a2e20c596e1557701b0cac52e8 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 11 Sep 2017 22:44:52 +0800 Subject: [PATCH 502/630] build: fix macOS LAPACK build --- deps/build.jl | 3 +++ 1 file changed, 3 insertions(+) diff --git a/deps/build.jl b/deps/build.jl index 558f4f7cbb61..69443c4987e5 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -178,6 +178,9 @@ if !libmxnet_detected # Force enable LAPACK build # Julia's OpenBLAS has LAPACK functionality already if FORCE_LAPACK + if is_apple() + MSHADOW_LDFLAGS *= " -framework Accelerate" + end `sed -i -s 's/ADD_CFLAGS =\(.*\)/ADD_CFLAGS =\1 -DMXNET_USE_LAPACK/' config.mk` end end) From 4e439ed5254bd0ad41f55a4e055477e2950ced00 
Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 11 Sep 2017 02:01:54 +0800 Subject: [PATCH 503/630] build: remove FileRule on config.mk and fix CUDA config * remove FileRule on config.mk; we always override it, because the following workflow is quite common: * the user issues `Pkg.build("MXNet")` * then the build fails because `CUDA_HOME` is not set properly. * if the `FileRule` finds `config.mk`, re-issuing `Pkg.build` will not change `config.mk`. The user needs to delete/modify `config.mk` manually * fix CUDA config * the build_steps were not being unfolded correctly. * consider the following cases: ```julia @build_steps begin if true `1` `2` `3` if true `42` end end end BinDeps.SynchronousStepCollection(Any[`42`], "", "") ``` vs ```julia @build_steps begin if true @build_steps begin `1` `2` `3` if true `42` end end # inner build_steps end # if end BinDeps.SynchronousStepCollection(Any[`1`, `2`, `3`, `42`], "", "") ``` --- deps/build.jl | 25 +++++++++++++++---------- 1 file changed, 15 insertions(+), 10 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index 69443c4987e5..a11758e36f3c 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -159,22 +159,30 @@ if !libmxnet_detected `git submodule update --init --recursive` `git -C mshadow checkout -- make/mshadow.mk` `make clean` + `cp ../../cblas.h include/cblas.h` + `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` - end - FileRule(joinpath(_mxdir, "config.mk"), @build_steps begin - ChangeDirectory(_mxdir) + + # Copy config.mk, always override the file if is_apple() `cp make/osx.mk config.mk` else `cp make/config.mk config.mk` end + + # Configure OpenCV `sed -i -s 's/USE_OPENCV = 1/USE_OPENCV = 0/' config.mk` + + # Configure CUDA if HAS_CUDA - `sed -i -s 's/USE_CUDA = 0/USE_CUDA = 1/' config.mk` - if haskey(ENV, "CUDA_HOME") - `sed -i -s 's/USE_CUDA_PATH = NULL/USE_CUDA_PATH = $(ENV["CUDA_HOME"])/' config.mk` + @build_steps begin + `sed -i -s 's/USE_CUDA = 0/USE_CUDA = 1/'
config.mk` + if haskey(ENV, "CUDA_HOME") + `sed -i -s "s@USE_CUDA_PATH = NONE@USE_CUDA_PATH = $(ENV["CUDA_HOME"])@" config.mk` + end end end + # Force enable LAPACK build # Julia's OpenBLAS has LAPACK functionality already if FORCE_LAPACK @@ -183,10 +191,7 @@ if !libmxnet_detected end `sed -i -s 's/ADD_CFLAGS =\(.*\)/ADD_CFLAGS =\1 -DMXNET_USE_LAPACK/' config.mk` end - end) - @build_steps begin - ChangeDirectory(_mxdir) - `cp ../../cblas.h include/cblas.h` + if USE_JULIA_BLAS `make -j$(get_cpucore()) USE_BLAS=$blas_name $MSHADOW_LDFLAGS` else From 7cc66d1c5186b6afb73c55eebc6cd609b0c01bca Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 13 Sep 2017 00:27:08 +0800 Subject: [PATCH 504/630] executor: fix docstring of `bind` --- src/executor.jl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/executor.jl b/src/executor.jl index 3ae5301a6c92..e340537d7a63 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -65,6 +65,8 @@ function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDA return (args_hdr, args_vec) end +@enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 + """ bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) @@ -81,7 +83,6 @@ Create an `Executor` by binding a `SymbolicNode` to concrete `NDArray`. 
* `aux_states`: * `grad_req`: """ -@enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 function bind(self :: SymbolicNode, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), aux_states :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), From 5d739daccd6d9b2f30845a52688f20cd0ec46852 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 13 Sep 2017 11:58:04 +0800 Subject: [PATCH 505/630] ndarray: implement deepcopy via MXNDArrayGetDataNDArray --- src/ndarray.jl | 15 ++++++++++++++- test/unittest/ndarray.jl | 9 +++++++++ 2 files changed, 23 insertions(+), 1 deletion(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 952c944dfbdd..d74ed07b0c1f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -403,7 +403,8 @@ function getindex(arr :: NDArray, idx::UnitRange{Int}) slice(arr, idx) end -import Base: copy!, copy, convert +import Base: copy!, copy, convert, deepcopy + """ copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) @@ -485,6 +486,18 @@ function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) convert(t, copy(arr)) end +""" + deepcopy(arr::NDArray) + +Get a deep copy of the data blob in the form of an NDArray of default storage +type. This function blocks. Do not use it in performance critical code. 
+""" +function deepcopy(arr::NDArray) + out_ref = Ref{MX_handle}(C_NULL) + @mxcall(:MXNDArrayGetDataNDArray, (MX_handle, Ref{MX_handle}), arr, out_ref) + NDArray(MX_NDArrayHandle(out_ref[])) +end + """ @inplace diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 69599960973f..8c058c1bf97d 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -31,6 +31,15 @@ function test_copy() @test reldiff(tensor, tensor2) < 1e-6 end +function test_deepcopy() + info("NDArray::deepcopy") + + x = mx.zeros(2, 5) + y = deepcopy(x) + x[:] = 42 + @test copy(x) != copy(y) +end + function test_assign() dims = rand_dims() tensor = rand(mx.MX_float, dims) From 16c2c5ac87459eaf8e5d459c6dcdb92a6afcefe1 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 18 Sep 2017 22:21:57 +0800 Subject: [PATCH 506/630] base: update GRAD_REQ enumeration * also, add a `grad_req_map` --- src/base.jl | 12 ++++++++++++ src/executor.jl | 2 -- 2 files changed, 12 insertions(+), 2 deletions(-) diff --git a/src/base.jl b/src/base.jl index 4f004f452f28..2d3ec8f3d053 100644 --- a/src/base.jl +++ b/src/base.jl @@ -13,6 +13,18 @@ const MX_handle = Ptr{Void} const char_p = Ptr{UInt8} const char_pp = Ptr{char_p} +################################################################################ +# Enumeration from MXNet headers +################################################################################ +# OpReqType in include/mxnet/op_attr_types.h +@enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_INPLACE=2 GRAD_ADD=3 +const grad_req_map = Dict{Symbol, GRAD_REQ}( + :nop => GRAD_NOP, # no operation, do not write anything + :write => GRAD_WRITE, # write gradient to provided space + :inplace => GRAD_INPLACE, # perform an inplace write + :add => GRAD_ADD, # add to the provided space +) + ################################################################################ # Initialization and library API entrance ################################################################################ 
diff --git a/src/executor.jl b/src/executor.jl index e340537d7a63..8d10102f5c75 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -65,8 +65,6 @@ function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDA return (args_hdr, args_vec) end -@enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_ADD=3 - """ bind(sym, ctx, args; args_grad=Dict(), aux_states=Dict(), grad_req=GRAD_WRITE) From e3ad29dc63ba0784f6c44ac087942c5a1ea07455 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 19 Sep 2017 10:36:27 +0800 Subject: [PATCH 507/630] travis: bring coverage report back --- .travis.yml | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/.travis.yml b/.travis.yml index 2f7dee479a68..68b1cb1b8b00 100644 --- a/.travis.yml +++ b/.travis.yml @@ -28,8 +28,8 @@ addons: - g++-4.8 before_install: - - export TRAVIS=test/travis - - source $TRAVIS/setup_env.sh + - export TRAVIS_DIR=test/travis + - source ${TRAVIS_DIR}/setup_env.sh notifications: email: false @@ -38,11 +38,10 @@ script: # bump the time limit of no ouput # the `travis_wait` wrapper can be removed once this issue fixed: # https://github.com/JuliaLang/julia/pull/23601 - - travis_wait 60 $TRAVIS/run_test.sh + - travis_wait 60 ${TRAVIS_DIR}/run_test.sh after_success: - - source $TRAVIS/run_coverage.sh + - source ${TRAVIS_DIR}/run_coverage.sh - echo $TRAVIS_JULIA_VERSION - julia -e 'Pkg.add("Documenter")' - julia -e 'cd(Pkg.dir("MXNet")); include(joinpath("docs", "make.jl"))' - From dcba690720b5e46abbe57918d5483f18a8890c87 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 11 Sep 2017 14:30:07 +0800 Subject: [PATCH 508/630] build: CuDNN detection --- deps/build.jl | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) diff --git a/deps/build.jl b/deps/build.jl index a11758e36f3c..b8ea163951c4 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -36,6 +36,8 @@ if is_unix() end HAS_CUDA = false +HAS_CUDNN = false +cudnnver = -1 let cudalib = Libdl.find_library(["libcuda", "nvcuda.dll"], 
CUDAPATHS) HAS_CUDA = !isempty(cudalib) && Libdl.dlopen_e(cudalib) != C_NULL end @@ -48,8 +50,21 @@ if !HAS_CUDA && is_windows() end end +if HAS_CUDA # then check cudnn + let cudnnlib = Libdl.find_library("libcudnn", CUDAPATHS) + HAS_CUDNN = !isempty(cudnnlib) && Libdl.dlopen_e(cudnnlib) != C_NULL + if HAS_CUDNN + # TODO: do more version check? + cudnnver = dec(ccall((:cudnnGetVersion, cudnnlib), Csize_t, ())) + end + end +end + if HAS_CUDA info("Found a CUDA installation.") + if HAS_CUDNN + info("Found a CuDNN installation (version -> $cudnnver).") + end else info("Did not find a CUDA installation, using CPU-only version of MXNet.") end @@ -180,6 +195,9 @@ if !libmxnet_detected if haskey(ENV, "CUDA_HOME") `sed -i -s "s@USE_CUDA_PATH = NONE@USE_CUDA_PATH = $(ENV["CUDA_HOME"])@" config.mk` end + if HAS_CUDNN + `sed -i -s 's/USE_CUDNN = 0/USE_CUDNN = 1/' config.mk` + end end end From 3d4adfb030ce6b78f76d5c4f4dad4cdf59c7aaf0 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 10 Sep 2017 12:04:36 +0800 Subject: [PATCH 509/630] ndarray: `reshape` share the same API with Base * fix #272 * deprecate `Reshape` as well * test cases included --- NEWS.md | 9 +++++++++ src/MXNet.jl | 2 ++ src/deprecated.jl | 3 +++ src/ndarray.jl | 32 +++++++++++++++++++++++++++++--- test/unittest/ndarray.jl | 31 +++++++++++++++++++++++++++---- 5 files changed, 70 insertions(+), 7 deletions(-) create mode 100644 src/deprecated.jl diff --git a/NEWS.md b/NEWS.md index 551985db996c..36f10ee2735d 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,12 @@ +# v0.3.0 (TBD) + +## API Changes + +* `reshape` of NDArray share the same interface with Base (#272). + * `reshape(NDArray, dim; reverse=false)` + * `reshape(NDArray, dim...; reverse=false)` + * `Reshape` deprecated. + # v0.2.2 (2017.05.14) * Updated supported version of MXNet to 0.9.4. * Improved build-system with support for auto-detecting GPU support. 
diff --git a/src/MXNet.jl b/src/MXNet.jl index bcc6296b3fb8..142f1a06d5be 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -50,6 +50,8 @@ include("visualize.jl") include("nn-factory.jl") +include("deprecated.jl") + end # mx end # module MXNet diff --git a/src/deprecated.jl b/src/deprecated.jl new file mode 100644 index 000000000000..4c9345126bde --- /dev/null +++ b/src/deprecated.jl @@ -0,0 +1,3 @@ +# reshape (#272) +@deprecate reshape(arr::NDArray; shape=()) reshape(arr, shape) +@deprecate Reshape(arr::NDArray; shape=()) reshape(arr, shape) diff --git a/src/ndarray.jl b/src/ndarray.jl index 952c944dfbdd..a5d3c97ebb67 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -921,6 +921,31 @@ function save(filename::String, data::Dict{Base.Symbol,NDArray}) filename, length(names), arrays, names) end +import Base: reshape + +""" + reshape(arr::NDArray, dim...; reverse=false) + reshape(arr::NDArray, dim; reverse=false) +""" +reshape{N}(arr::NDArray, dim::NTuple{N, Integer}; reverse::Bool=false) = + _reshape(arr, dim, reverse) +reshape{N}(arr::NDArray, dim::Vararg{Integer, N}; reverse::Bool=false) = + _reshape(arr, dim, reverse) + +@inline function _reshape{N}(arr::NDArray, dim::NTuple{N, Integer}, reverse::Bool) + op_handle = _get_cached_libmx_op_handle("reshape") + n_output = Ref(Cint(0)) + hdls_ref = Ref{Ptr{MX_handle}}(C_NULL) + @mxcall(:MXImperativeInvoke, + (MX_handle, Cint, Ptr{MX_handle}, Ref{Cint}, Ref{Ptr{MX_handle}}, + Cint, char_pp, char_pp), + op_handle, 1, [arr.handle], n_output, hdls_ref, + 2, ["shape", "reverse"], [dump_mx_param(dim), dump_mx_param(!reverse)]) + # not a typo ^^^^^^^^ + @assert n_output[] == 1 + NDArray(MX_NDArrayHandle(unsafe_load(hdls_ref[], 1))) +end + ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -980,7 +1005,6 @@ Upon calling, the output arguments will be 
automatically initialized with empty Those functions always return the output arguments. If there is only one output (the typical situation), that object (`NDArray`) is returned. Otherwise, a tuple containing all the outputs will be returned. """ - function _get_ndarray_function_def(name :: String) func_name = Symbol(name) @@ -1063,7 +1087,9 @@ function _get_ndarray_function_def(name :: String) end macro _import_ndarray_functions() - names = _get_libmx_op_names() + black_list = ["reshape"] # do not import these funcs + names = filter(n -> ∉(lowercase(n), black_list), _get_libmx_op_names()) + func_exprs = map(names) do name op_handle = _get_libmx_op_handle(name) @@ -1073,7 +1099,7 @@ macro _import_ndarray_functions() func_name = Symbol(name) expr = quote # TODO the explicit exclusion of take will no longer be necessary when it is removed from Base - $((isdefined(Base, func_name) && func_name ≠ :take)? :(import Base.$func_name) : :()) + $((isdefined(Base, func_name) && func_name ≠ :take) ? 
:(import Base.$func_name) : :()) $func_def @doc $desc -> $func_def2 diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 69599960973f..b7584104d495 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -109,7 +109,7 @@ function test_plus() scalar_large = 1e8 @test reldiff(t4 + scalar_small, copy(a4 .+ scalar_small)) < thresh @test reldiff(t4 + scalar_large, copy(a4 .+ scalar_large)) < thresh - + t5 = zeros(Float64, dims) a5 = copy(t5, mx.cpu()) scalar_small = 1e-8 @@ -160,7 +160,7 @@ function test_minus() scalar_large = 1e8 @test reldiff(t4 - scalar_small, copy(a4 .- scalar_small)) < thresh @test reldiff(t4 - scalar_large, copy(a4 .- scalar_large)) < thresh - + t5 = zeros(Float64, dims) a5 = copy(t5, mx.cpu()) scalar_small = 1e-8 @@ -204,7 +204,7 @@ function test_mul() scalar_large = 1e8 @test reldiff(t4 * scalar_small, copy(a4 .* scalar_small)) < thresh @test reldiff(t4 * scalar_large, copy(a4 .* scalar_large)) < thresh - + t5, a5 = rand_tensors(Float64, dims) scalar_small = 1e-8 scalar_large = 1e8 @@ -245,7 +245,7 @@ function test_div() scalar_large = 1e8 @test reldiff(t4 / scalar_small, copy(a4 ./ scalar_small)) < thresh @test reldiff(t4 / scalar_large, copy(a4 ./ scalar_large)) < thresh - + t5, a5 = rand_tensors(Float64, dims) scalar_small = 1e-8 scalar_large = 1e8 @@ -382,6 +382,28 @@ function test_eltype() end end +function test_reshape() + info("NDArray::reshape") + A = rand(2, 3, 4) + + B = reshape(mx.NDArray(A), 4, 3, 2) + @test size(B) == (4, 3, 2) + @test copy(B)[3, 1, 1] == A[1, 2, 1] + + C = reshape(mx.NDArray(A), (4, 3, 2)) + @test size(C) == (4, 3, 2) + @test copy(C)[3, 1, 1] == A[1, 2, 1] + + info("NDArray::reshape::reverse") + A = mx.zeros(10, 5, 4) + + B = reshape(A, -1, 0) + @test size(B) == (40, 5) + + C = reshape(A, -1, 0, reverse=true) + @test size(C) == (50, 4) +end + function test_kwargs() info("NDArray::kwargs") dims1 = (2,3,4) @@ -412,6 +434,7 @@ end test_eltype() test_nd_as_jl() test_dot() + 
test_reshape() test_kwargs() end From 0b9bf78c385236787a75f966fd9835f10d3007d7 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 11 Sep 2017 19:10:09 +0800 Subject: [PATCH 510/630] sym-node: support `print` for debugging --- src/symbolic-node.jl | 45 ++++++++++++++++++++++++++++++++++ test/unittest/symbolic-node.jl | 8 ++++++ 2 files changed, 53 insertions(+) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 8a567c2e8003..772ff66e53f7 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -220,6 +220,51 @@ function get_name(self :: mx.SymbolicNode) return Symbol(unsafe_string(name[])) end +import Base: print + +function print(io :: IO, sym :: SymbolicNode) + out = Ref{mx.char_p}(C_NULL) + @mx.mxcall(:MXSymbolPrint, (mx.MX_SymbolHandle, Ref{mx.char_p}), sym.handle, out) + print(io, unsafe_string(out[])) +end + +print(sym :: SymbolicNode) = print(STDOUT, sym) + +""" + print([io :: IO], sym :: SymbolicNode) + +Print the content of symbol, used for debug. + +```julia +julia> layer = @mx.chain mx.Variable(:data) => + mx.FullyConnected(name=:fc1, num_hidden=128) => + mx.Activation(name=:relu1, act_type=:relu) +MXNet.mx.SymbolicNode(MXNet.mx.MX_SymbolHandle(Ptr{Void} @0x000055b29b9c3520)) + +julia> print(layer) +Symbol Outputs: + output[0]=relu1(0) +Variable:data +Variable:fc1_weight +Variable:fc1_bias +-------------------- +Op:FullyConnected, Name=fc1 +Inputs: + arg[0]=data(0) version=0 + arg[1]=fc1_weight(0) version=0 + arg[2]=fc1_bias(0) version=0 +Attrs: + num_hidden=128 +-------------------- +Op:Activation, Name=relu1 +Inputs: + arg[0]=fc1(0) +Attrs: + act_type=relu +``` +""" +print + """ grad(self :: SymbolicNode, wrt :: Vector{SymbolicNode}) diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 5d8d01b608db..534a99140115 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -136,6 +136,13 @@ function test_dot() @test reldiff(ret, 2*ones(100, 200)) < 1e-6 end +function test_print() + 
info("SymbolicNode::print") + io = IOBuffer() + print(io, mx.Variable(:x)) + @test !isempty(String(take!(io))) +end + function test_misc() info("SymbolicNode::Miscellaneous") # Test for #189 @@ -158,6 +165,7 @@ end test_attrs() test_functions() test_dot() + test_print() test_misc() end From 4e89c919b47fad6d79cf9e33a6b5a6f2c168b98d Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 12 Sep 2017 18:18:20 +0800 Subject: [PATCH 511/630] sym-node: extract a utility function _create_atomic_symbol * from _define_atomic_symbol_creator --- src/symbolic-node.jl | 39 ++++++++++++++++++++++++--------------- 1 file changed, 24 insertions(+), 15 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 8a567c2e8003..c81b250f497a 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -614,6 +614,26 @@ end ################################################################################ # Atomic SymbolicNode functions dynamically imported from libmxnet ################################################################################ +@inline function _create_atomic_symbol(creator::MX_handle, keys::Vector{String}, + vals::Vector{String}) + ref_sym_hdr = Ref{MX_handle}(C_NULL) + @mxcall(:MXSymbolCreateAtomicSymbol, + (MX_handle, MX_uint, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}), + creator, length(keys), keys, vals, ref_sym_hdr) + SymbolicNode(MX_SymbolHandle(ref_sym_hdr[])) +end + +@inline function _create_atomic_symbol(creator::MX_handle, keys::Vector{String}, + vals::Vector{String}, + attrs::Dict{Symbol, String}) + node = _create_atomic_symbol(creator, keys, vals) + # set attrs + for (k, v) in attrs + set_attr(node, k, v) + end + node +end + function _define_atomic_symbol_creator(name :: String) handle = _get_libmx_op_handle(name) f_desc, key_narg = _get_libmx_op_description(name, handle) @@ -664,7 +684,7 @@ function _define_atomic_symbol_creator(name :: String) symbol_kws[k] = v elseif k == :attrs if isa(v, Dict) - attrs = convert(Dict{Symbol, 
AbstractString}, v) + attrs = convert(Dict{Symbol, String}, v) else throw(ArgumentError("attrs needs to be a Dictionary")) end @@ -686,24 +706,13 @@ function _define_atomic_symbol_creator(name :: String) end end) - local hdr = _get_cached_libmx_op_handle($name) - - # create the SymbolicNode - ref_sym_hdr = Ref{MX_handle}() - @mxcall(:MXSymbolCreateAtomicSymbol, - (MX_handle, MX_uint, Ptr{char_p}, Ptr{char_p}, Ref{MX_handle}), - hdr, length(param_keys), param_keys, param_vals, ref_sym_hdr) - sym_hdr = ref_sym_hdr[] + local op = _get_cached_libmx_op_handle($name) + node = _create_atomic_symbol(op.value, param_keys, param_vals, attrs) - node = SymbolicNode(MX_SymbolHandle(sym_hdr)) + # generate a new name for the new symbol if user not provided in kwargs hint = lowercase($name) name = get!(DEFAULT_NAME_MANAGER, name, hint) - # set attrs - for (k, v) in attrs - set_attr(node, k, v) - end - if length(symbol_kws) == 0 _compose!(node, name, args...) elseif length(args) == 1 From 63a34ccadaa59f329ca0ec4babd47f25bc35e481 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 12 Sep 2017 22:32:51 +0800 Subject: [PATCH 512/630] sym-node: implement reshape api as Base * copy the docstring from upstream, and convert it into markdown * test cases included --- src/symbolic-node.jl | 83 +++++++++++++++++++++++++++++++++- test/unittest/symbolic-node.jl | 27 +++++++++++ 2 files changed, 108 insertions(+), 2 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index c81b250f497a..620df2ed063d 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -611,6 +611,85 @@ function save(filename :: AbstractString, node :: SymbolicNode) @mxcall(:MXSymbolSaveToFile, (MX_handle, char_p), node, filename) end +import Base: reshape + +reshape{N}(sym::SymbolicNode, dim::NTuple{N, Integer}; kwargs...) = + _reshape(sym, dim, kwargs...) +reshape(sym::SymbolicNode, dim::Integer...; kwargs...) = + _reshape(sym, dim, kwargs...) 
+ +@inline function _reshape{N}(sym::SymbolicNode, dim::NTuple{N, Integer}; + reverse::Bool=false, name::String="") + op = _get_cached_libmx_op_handle("reshape") + node = _create_atomic_symbol(op.value, ["shape"], [dump_mx_param(dim)]) + name = get!(DEFAULT_NAME_MANAGER, name, "reshape") + _compose!(node, name=name, data=sym) +end + +""" + reshape(sym::SymbolicNode, dim; reverse=false, name) + reshape(sym::SymbolicNode, dim...; reverse=false, name) + +Reshape SymbolicNode operator + +Some dimensions of the shape can take special values from the set +{0, -1, -2, -3, -4}. +The significance of each is explained below: + +- `0` copy this dimension from the input to the output shape. + + Example: + + - input shape = (2,3,4), shape = (4,0,2), output shape = (4,3,2) + - input shape = (2,3,4), shape = (2,0,0), output shape = (2,3,4) + +- `-1` infers the dimension of the output shape by using the remainder of the + input dimensions keeping the size of the new array same as that of the input + array. At most one dimension of shape can be -1. + + Example: + + - input shape = (2,3,4), shape = (6,1,-1), output shape = (6,1,4) + - input shape = (2,3,4), shape = (3,-1,8), output shape = (3,1,8) + - input shape = (2,3,4), shape=(-1,), output shape = (24,) + +- `-2` copy all/remainder of the input dimensions to the output shape. + + Example: + + - input shape = (2,3,4), shape = (-2,), output shape = (2,3,4) + - input shape = (2,3,4), shape = (2,-2), output shape = (2,3,4) + - input shape = (2,3,4), shape = (-2,1,1), output shape = (2,3,4,1,1) + +- `-3` use the product of two consecutive dimensions of the input shape as the + output dimension. 
+ + Example: + + - input shape = (2,3,4), shape = (-3,4), output shape = (6,4) + - input shape = (2,3,4,5), shape = (-3,-3), output shape = (6,20) + - input shape = (2,3,4), shape = (0,-3), output shape = (2,12) + - input shape = (2,3,4), shape = (-3,-2), output shape = (6,4) + +- `-4` split one dimension of the input into two dimensions passed subsequent + to -4 in shape (can contain -1). + + Example: + + - input shape = (2,3,4), shape = (-4,1,2,-2), output shape =(1,2,3,4) + - input shape = (2,3,4), shape = (2,-4,-1,3,-2), output shape = (2,1,3,4) + +If the argument `reverse` is set to `1`, then the special values are inferred +from right to left. + + Example: + + - with `reverse=false`, for input shape = (10,5,4), shape = (-1,0), + output shape would be (40,5) + - with `reverse=true`, output shape will be (50,4). +""" +reshape + ################################################################################ # Atomic SymbolicNode functions dynamically imported from libmxnet ################################################################################ @@ -742,11 +821,11 @@ macro _import_atomic_symbol_creators() # XXX: those are operators defined for NDArray, we exclude them here # because the calling convention for the type signature is not strong # enough to disambiguate the method for NDArray and SymbolicNode - const ignored_ops = ["_set_value"] + const ignored_ops = ["_set_value", "reshape"] # in lowercase op_names = _get_libmx_op_names() func_exprs = map(op_names) do name - if name ∉ ignored_ops + if lowercase(name) ∉ ignored_ops expr = _define_atomic_symbol_creator(name) end end diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 5d8d01b608db..26b049e8d63c 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -122,6 +122,32 @@ function test_functions() typeof(mx.sum(data)) == mx.SymbolicNode end +function test_reshape() + info("SymbolicNode::reshape(sym, dim...)") + + A = 
mx.NDArray(collect(1:24)) + x = mx.Variable(:x) + y = mx.reshape(x, 2, 3, 4) + e = mx.bind(y, mx.cpu(), Dict(:x => A)) + mx.forward(e) + out = e.outputs[1] + + @test size(out) == (2, 3, 4) + @test copy(out) == reshape(1:24, 2, 3, 4) + + info("SymbolicNode::reshape(sym, dim)") + + A = mx.NDArray(collect(1:24)) + x = mx.Variable(:x) + y = mx.reshape(x, (2, 3, 4)) + e = mx.bind(y, mx.cpu(), Dict(:x => A)) + mx.forward(e) + out = e.outputs[1] + + @test size(out) == (2, 3, 4) + @test copy(out) == reshape(1:24, 2, 3, 4) +end + function test_dot() info("SymbolicNode::dot") x = mx.Variable(:x) @@ -157,6 +183,7 @@ end test_saveload() test_attrs() test_functions() + test_reshape() test_dot() test_misc() end From 68d6ff7b9e73df93b97238da0451e4ff6deb7bc2 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 25 Sep 2017 15:11:18 +0800 Subject: [PATCH 513/630] sym-node: update deprecation for reshape --- src/deprecated.jl | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/src/deprecated.jl b/src/deprecated.jl index 4c9345126bde..33688d435a8e 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -1,3 +1,7 @@ -# reshape (#272) +# NDArray reshape (#272) @deprecate reshape(arr::NDArray; shape=()) reshape(arr, shape) @deprecate Reshape(arr::NDArray; shape=()) reshape(arr, shape) + +# SymbolicNode reshape (#279) +@deprecate reshape(sym::SymbolicNode; shape=()) reshape(sym, shape) +@deprecate Reshape(sym::SymbolicNode; shape=()) reshape(sym, shape) From a2e270e1fff696b8f869341ccf5d70ed87f994fa Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 25 Sep 2017 15:11:37 +0800 Subject: [PATCH 514/630] sym-node: update NEWS for reshape API --- NEWS.md | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/NEWS.md b/NEWS.md index 36f10ee2735d..913f92eaa719 100644 --- a/NEWS.md +++ b/NEWS.md @@ -7,6 +7,13 @@ * `reshape(NDArray, dim...; reverse=false)` * `Reshape` deprecated. 
+ * `reshape` of SymbolicNode share the same interface with Base + and additional keyword argument (#279). + + * `reshape(SymbolicNode, dim; reverse=false, name)` + * `reshape(SymbolicNode, dim...; reverse=false, name)` + * `Reshape` deprecated. + # v0.2.2 (2017.05.14) * Updated supported version of MXNet to 0.9.4. * Improved build-system with support for auto-detecting GPU support. From 9e0844a069413a267d65fa3afb309b0d85d703b7 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 25 Sep 2017 19:54:49 +0800 Subject: [PATCH 515/630] sym-node: add reverse keyword arg --- src/symbolic-node.jl | 29 ++++++++++++++--------------- 1 file changed, 14 insertions(+), 15 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 620df2ed063d..737d0dc1b610 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -613,19 +613,6 @@ end import Base: reshape -reshape{N}(sym::SymbolicNode, dim::NTuple{N, Integer}; kwargs...) = - _reshape(sym, dim, kwargs...) -reshape(sym::SymbolicNode, dim::Integer...; kwargs...) = - _reshape(sym, dim, kwargs...) - -@inline function _reshape{N}(sym::SymbolicNode, dim::NTuple{N, Integer}; - reverse::Bool=false, name::String="") - op = _get_cached_libmx_op_handle("reshape") - node = _create_atomic_symbol(op.value, ["shape"], [dump_mx_param(dim)]) - name = get!(DEFAULT_NAME_MANAGER, name, "reshape") - _compose!(node, name=name, data=sym) -end - """ reshape(sym::SymbolicNode, dim; reverse=false, name) reshape(sym::SymbolicNode, dim...; reverse=false, name) @@ -676,7 +663,7 @@ The significance of each is explained below: Example: - - input shape = (2,3,4), shape = (-4,1,2,-2), output shape =(1,2,3,4) + - input shape = (2,3,4), shape = (-4,1,2,-2), output shape = (1,2,3,4) - input shape = (2,3,4), shape = (2,-4,-1,3,-2), output shape = (2,1,3,4) If the argument `reverse` is set to `1`, then the special values are inferred @@ -688,7 +675,19 @@ from right to left. 
output shape would be (40,5) - with `reverse=true`, output shape will be (50,4). """ -reshape +reshape{N}(sym::SymbolicNode, dim::NTuple{N, Integer}; kwargs...) = + _reshape(sym, dim; kwargs...) +reshape(sym::SymbolicNode, dim::Integer...; kwargs...) = + _reshape(sym, dim; kwargs...) + +@inline function _reshape{N}(sym::SymbolicNode, dim::NTuple{N, Integer}; + reverse::Bool=false, name::String="") + op = _get_cached_libmx_op_handle("reshape") + node = _create_atomic_symbol(op.value, ["shape", "reverse"], + [dump_mx_param(dim), dump_mx_param(!reverse)]) + name = get!(DEFAULT_NAME_MANAGER, name, "reshape") + _compose!(node, name=name, data=sym) +end ################################################################################ # Atomic SymbolicNode functions dynamically imported from libmxnet From 55ccbfa2adb346ab6c2fd8a2ab63cbae07f796bf Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 25 Sep 2017 19:55:48 +0800 Subject: [PATCH 516/630] sym-node: more test cases for reshape --- test/unittest/symbolic-node.jl | 66 ++++++++++++++++++++++++++++++++++ 1 file changed, 66 insertions(+) diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 26b049e8d63c..44f35142de9d 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -146,6 +146,72 @@ function test_reshape() @test size(out) == (2, 3, 4) @test copy(out) == reshape(1:24, 2, 3, 4) + + info("SymbolicNode::reshape::reverse") + + A = mx.zeros(10, 5, 4) + x = mx.Variable(:x) + y = mx.reshape(x, -1, 0, reverse=true) + e = mx.bind(y, mx.cpu(), Dict(:x => A)) + mx.forward(e) + out = e.outputs[1] + + @test size(out) == (50, 4) + + info("SymbolicNode::reshape::0") + + A = mx.zeros(2, 3, 4) + x = mx.Variable(:x) + y = mx.reshape(x, 4, 0, 2) + e = mx.bind(y, mx.cpu(), Dict(:x => A)) + mx.forward(e) + out = e.outputs[1] + + @test size(out) == (4, 3, 2) + + info("SymbolicNode::reshape::-1") + + A = mx.zeros(2, 3, 4) + x = mx.Variable(:x) + y = mx.reshape(x, 6, 1, -1) + e = 
mx.bind(y, mx.cpu(), Dict(:x => A)) + mx.forward(e) + out = e.outputs[1] + + @test size(out) == (6, 1, 4) + + info("SymbolicNode::reshape::-2") + + A = mx.zeros(2, 3, 4, 2) + x = mx.Variable(:x) + y = mx.reshape(x, 3, 2, -2) + e = mx.bind(y, mx.cpu(), Dict(:x => A)) + mx.forward(e) + out = e.outputs[1] + + @test size(out) == (3, 2, 4, 2) + + info("SymbolicNode::reshape::-3") + + A = mx.zeros(2, 3, 4, 5) + x = mx.Variable(:x) + y = mx.reshape(x, -3, -3) + e = mx.bind(y, mx.cpu(), Dict(:x => A)) + mx.forward(e) + out = e.outputs[1] + + @test size(out) == (6, 20) + + info("SymbolicNode::reshape::-4") + + A = mx.zeros(2, 3, 4) + x = mx.Variable(:x) + y = mx.reshape(x, 0, 0, -4, 2, 2) + e = mx.bind(y, mx.cpu(), Dict(:x => A)) + mx.forward(e) + out = e.outputs[1] + + @test size(out) == (2, 3, 2, 2) end function test_dot() From ff0556b13d92573214f3badc99c31cace5668fe7 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 13 Sep 2017 13:11:52 +0800 Subject: [PATCH 517/630] random: rename srand! to srand make it same as Base --- src/random.jl | 2 +- test/unittest/random.jl | 8 ++++---- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/src/random.jl b/src/random.jl index b5b53def8f54..47801512372e 100644 --- a/src/random.jl +++ b/src/random.jl @@ -22,6 +22,6 @@ function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context) randn!(mean, stdvar, out) end -function srand!(seed_state::Int) +function srand(seed_state::Int) @mxcall(:MXRandomSeed, (Cint,), seed_state) end diff --git a/test/unittest/random.jl b/test/unittest/random.jl index 54d651482cd6..30995ecf79bf 100644 --- a/test/unittest/random.jl +++ b/test/unittest/random.jl @@ -8,10 +8,10 @@ function test_uniform() low = -10; high = 10 seed = 123 - mx.srand!(seed) + mx.srand(seed) ret1 = mx.rand(low, high, dims) - mx.srand!(seed) + mx.srand(seed) ret2 = mx.empty(dims) mx.rand!(low, high, ret2) @@ -25,10 +25,10 @@ function test_gaussian() μ = 10; σ = 2 seed = 456 - mx.srand!(seed) + mx.srand(seed) 
ret1 = mx.randn(μ, σ, dims) - mx.srand!(seed) + mx.srand(seed) ret2 = mx.empty(dims) mx.randn!(μ, σ, ret2) From 5b3c507f1a1ae11c033708d13087ec172c96e8c9 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 25 Sep 2017 23:18:39 +0800 Subject: [PATCH 518/630] random: update NEWS and deprecated.jl - update NEWS for deepcopy on NDArray as well (#273) --- NEWS.md | 10 ++++++++-- src/deprecated.jl | 3 +++ 2 files changed, 11 insertions(+), 2 deletions(-) diff --git a/NEWS.md b/NEWS.md index 913f92eaa719..773c2471c514 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,5 +1,9 @@ # v0.3.0 (TBD) +## New API + +* `deepcopy` for NDArray (#273) + ## API Changes * `reshape` of NDArray share the same interface with Base (#272). @@ -7,13 +11,15 @@ * `reshape(NDArray, dim...; reverse=false)` * `Reshape` deprecated. - * `reshape` of SymbolicNode share the same interface with Base - and additional keyword argument (#279). +* `reshape` of SymbolicNode share the same interface with Base + and additional keyword argument (#279). * `reshape(SymbolicNode, dim; reverse=false, name)` * `reshape(SymbolicNode, dim...; reverse=false, name)` * `Reshape` deprecated. +* `srand!` deprecated, please use `srand` (#282) + # v0.2.2 (2017.05.14) * Updated supported version of MXNet to 0.9.4. * Improved build-system with support for auto-detecting GPU support. 
diff --git a/src/deprecated.jl b/src/deprecated.jl index 33688d435a8e..b2816fad5432 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -5,3 +5,6 @@ # SymbolicNode reshape (#279) @deprecate reshape(sym::SymbolicNode; shape=()) reshape(sym, shape) @deprecate Reshape(sym::SymbolicNode; shape=()) reshape(sym, shape) + +# srand (#282) +@deprecate srand!(seed_state::Int) srand(seed_state) From 251a8b3661b5b5269788bf48d649a7fa35c2ff61 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 4 Oct 2017 15:16:58 +0800 Subject: [PATCH 519/630] random: upstream api change Ref: https://github.com/apache/incubator-mxnet/pull/7939 --- src/random.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/random.jl b/src/random.jl index b5b53def8f54..d031d9c2f2d2 100644 --- a/src/random.jl +++ b/src/random.jl @@ -1,6 +1,6 @@ function rand!(low::Real, high::Real, out::NDArray) # XXX: note we reverse shape because julia and libmx has different dim order - _sample_uniform(NDArray, low=low, high=high, shape=reverse(size(out)), out=out) + _random_uniform(NDArray, low=low, high=high, shape=reverse(size(out)), out=out) end function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}) rand(low, high, shape, cpu()) @@ -12,7 +12,7 @@ end function randn!(mean::Real, stdvar::Real, out::NDArray) # XXX: note we reverse shape because julia and libmx has different dim order - _sample_normal(NDArray, loc=mean, scale=stdvar, shape=reverse(size(out)), out=out) + _random_normal(NDArray, loc=mean, scale=stdvar, shape=reverse(size(out)), out=out) end function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}) randn(mean, stdvar, shape, cpu()) From 077a8cb2119edd6ffc63ef0eae92c2e52da32a57 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 4 Oct 2017 14:17:42 +0800 Subject: [PATCH 520/630] build: improve cuda detection - change ADD_LDFLAGS - https://github.com/apache/incubator-mxnet/pull/7856 - https://github.com/apache/incubator-mxnet/pull/7838 - guessing the CUDA_HOME if 
user not provides it. --- deps/build.jl | 22 ++++++++++++++++------ 1 file changed, 16 insertions(+), 6 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index b8ea163951c4..d6591c22c910 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -37,7 +37,6 @@ end HAS_CUDA = false HAS_CUDNN = false -cudnnver = -1 let cudalib = Libdl.find_library(["libcuda", "nvcuda.dll"], CUDAPATHS) HAS_CUDA = !isempty(cudalib) && Libdl.dlopen_e(cudalib) != C_NULL end @@ -53,9 +52,8 @@ end if HAS_CUDA # then check cudnn let cudnnlib = Libdl.find_library("libcudnn", CUDAPATHS) HAS_CUDNN = !isempty(cudnnlib) && Libdl.dlopen_e(cudnnlib) != C_NULL - if HAS_CUDNN - # TODO: do more version check? - cudnnver = dec(ccall((:cudnnGetVersion, cudnnlib), Csize_t, ())) + if HAS_CUDNN && !haskey(ENV, "CUDA_HOME") # inference `CUDA_HOME` + ENV["CUDA_HOME"] = dirname(dirname(cudnnlib)) end end end @@ -63,8 +61,9 @@ end if HAS_CUDA info("Found a CUDA installation.") if HAS_CUDNN - info("Found a CuDNN installation (version -> $cudnnver).") + info("Found a CuDNN installation.") end + info("CUDA_HOME -> $(ENV["CUDA_HOME"])") else info("Did not find a CUDA installation, using CPU-only version of MXNet.") end @@ -170,7 +169,11 @@ if !libmxnet_detected ChangeDirectory(_mxdir) `git submodule deinit --force .` `git fetch` - `git checkout $libmxnet_curr_ver` + if libmxnet_curr_ver != "master" + `git checkout $libmxnet_curr_ver` + else + `git merge --ff origin/$libmxnet_curr_ver` + end `git submodule update --init --recursive` `git -C mshadow checkout -- make/mshadow.mk` `make clean` @@ -192,9 +195,16 @@ if !libmxnet_detected if HAS_CUDA @build_steps begin `sed -i -s 's/USE_CUDA = 0/USE_CUDA = 1/' config.mk` + # address https://github.com/apache/incubator-mxnet/pull/7856 + `sed -i -s "s/ADD_LDFLAGS =\(.*\)/ADD_LDFLAGS =\1 -lcublas -lcusolver -lcurand -lcudart/" config.mk` if haskey(ENV, "CUDA_HOME") `sed -i -s "s@USE_CUDA_PATH = NONE@USE_CUDA_PATH = $(ENV["CUDA_HOME"])@" config.mk` end + if haskey(ENV, 
"CUDA_HOME") + # address https://github.com/apache/incubator-mxnet/pull/7838 + flag = "-L$(ENV["CUDA_HOME"])/lib64 -L$(ENV["CUDA_HOME"])/lib" + `sed -i -s "s@ADD_LDFLAGS =\(.*\)@ADD_LDFLAGS =\1 $flag@" config.mk` + end if HAS_CUDNN `sed -i -s 's/USE_CUDNN = 0/USE_CUDNN = 1/' config.mk` end From ac7bbd009b7745b5e96cdec934bacfbbce22e56a Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 7 Oct 2017 20:49:26 +0800 Subject: [PATCH 521/630] base: support MXGetVersion - Ref: https://github.com/apache/incubator-mxnet/pull/8013 --- src/base.jl | 11 +++++++++++ test/runtests.jl | 2 ++ 2 files changed, 13 insertions(+) diff --git a/src/base.jl b/src/base.jl index 2d3ec8f3d053..c013f17976ae 100644 --- a/src/base.jl +++ b/src/base.jl @@ -46,6 +46,8 @@ function __init__() _get_libmx_op_names() _populate_iter_creator_cache!() + global const LIB_VERSION = _get_lib_version() + atexit() do # notify libmxnet we are shutting down ccall( ("MXNotifyShutdown", MXNET_LIB), Cint, () ) @@ -74,6 +76,15 @@ macro mxcall(fv, argtypes, args...) 
end end +""" +Get libmxnet version +""" +function _get_lib_version() + ver = Ref{Cint}(0) + @mxcall :MXGetVersion (Ref{Cint},) ver + ver[] +end + ################################################################################ # Handle types ################################################################################ diff --git a/test/runtests.jl b/test/runtests.jl index 823830b54d0d..eb05ff2f5ca4 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -11,6 +11,8 @@ function test_dir(dir) end end +info("libmxnet version => $(mx.LIB_VERSION)") + include(joinpath(dirname(@__FILE__), "common.jl")) @testset "MXNet Test" begin test_dir(joinpath(dirname(@__FILE__), "unittest")) From 904eb20af96ced5363cb92017e985e09d339c498 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 10 Oct 2017 17:13:05 +0800 Subject: [PATCH 522/630] rand: docstring --- src/random.jl | 59 ++++++++++++++++++++++++++++++++++++++++++++------- 1 file changed, 51 insertions(+), 8 deletions(-) diff --git a/src/random.jl b/src/random.jl index b01e2bc184d7..c021ef9a0fe7 100644 --- a/src/random.jl +++ b/src/random.jl @@ -1,27 +1,70 @@ +""" + rand!(low, high, arr::NDArray) + +Draw random samples from a uniform distribution. +Samples are uniformly distributed over the half-open interval [low, high) +(includes low, but excludes high). + +# Examples + +```julia +julia> mx.rand(0, 1, mx.zeros(2, 2)) |> copy +2×2 Array{Float32,2}: + 0.405374 0.321043 + 0.281153 0.713927 +``` +""" function rand!(low::Real, high::Real, out::NDArray) # XXX: note we reverse shape because julia and libmx has different dim order _random_uniform(NDArray, low=low, high=high, shape=reverse(size(out)), out=out) end -function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}) - rand(low, high, shape, cpu()) -end -function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context) + +""" + rand(low, high, shape, context=cpu()) + +Draw random samples from a uniform distribution. 
+Samples are uniformly distributed over the half-open interval [low, high) +(includes low, but excludes high). + +# Examples + +```julia +julia> mx.rand(0, 1, (2, 2)) |> copy +2×2 Array{Float32,2}: + 0.405374 0.321043 + 0.281153 0.713927 +``` +""" +function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context=cpu()) out = empty(shape, ctx) rand!(low, high, out) end +""" + randn!(mean, std, arr::NDArray) + +Draw random samples from a normal (Gaussian) distribution. +""" function randn!(mean::Real, stdvar::Real, out::NDArray) # XXX: note we reverse shape because julia and libmx has different dim order _random_normal(NDArray, loc=mean, scale=stdvar, shape=reverse(size(out)), out=out) end -function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}) - randn(mean, stdvar, shape, cpu()) -end -function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context) + +""" + randn(mean, std, shape, context=cpu()) + +Draw random samples from a normal (Gaussian) distribution. +""" +function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context=cpu()) out = empty(shape, ctx) randn!(mean, stdvar, out) end +""" + srand(seed::Int) + +Set the random seed of libmxnet +""" function srand(seed_state::Int) @mxcall(:MXRandomSeed, (Cint,), seed_state) end From aae016c06c346607e7e7da63ef5eea99b395bafd Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 8 Oct 2017 01:12:23 +0800 Subject: [PATCH 523/630] ndarray: pretty printing MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Leverage `Base.showarray`. e.g. 
```julia julia> mx.rand(0, 1, (5, 20)) 5x20 mx.NDArray{Float32} @ CPU0: 0.628982 0.425452 0.952792 … 0.785153 0.181631 5.53504f-5 0.798047 0.45613 0.984329 0.0639553 0.872651 0.885338 0.687488 0.28173 0.512393 0.31186 0.185636 0.483409 0.703495 0.485628 0.273542 0.679879 0.215508 0.58641 0.580447 ``` - test cases included --- src/ndarray.jl | 34 +++++++++++++++++++++++----------- test/unittest/ndarray.jl | 11 +++++++++++ 2 files changed, 34 insertions(+), 11 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index eba7e2169a7e..7e8ac40f9a03 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -99,7 +99,8 @@ type NDArray end function Base.show(io :: IO, arr :: NDArray) - print(io, "mx.NDArray{$(eltype(arr))}$(size(arr))") + println(io, "$(join(size(arr), "x")) mx.NDArray{$(eltype(arr))} @ $(context(arr)):") + Base.showarray(io, try_get_shared(arr, sync=:read), false, header=false) end function NDArray{T<:Real}(data :: Array{T}) @@ -299,7 +300,7 @@ function eltype{T <: Union{NDArray, MX_NDArrayHandle}}(arr :: T) if dtype_ref[] == -1 # arr->is_none() warn("Eltype of $arr is not defined") - Base.show_backtrace(STDOUT,backtrace()) + Base.show_backtrace(STDOUT, backtrace()) println() return Float32 else @@ -832,24 +833,35 @@ function _wait_to_write(arr :: NDArray) end """ - try_get_shared(arr) + try_get_shared(arr; sync=:nop) Try to create a Julia array by sharing the data with the underlying `NDArray`. # Arguments: + * `arr::NDArray`: the array to be shared. !!! note The returned array does not guarantee to share data with the underlying `NDArray`. In particular, data sharing is possible only when the `NDArray` lives on CPU. + +* `sync::Symbol`: `:nop`,`:write`, `:read` + On CPU, invoke `_wait_to_read` if `:read`; + invoke `_wait_to_write` if `:write`. 
""" -function try_get_shared(arr :: NDArray) +function try_get_shared(arr :: NDArray; sync::Symbol=:nop) if context(arr).device_type == CPU # try to do data sharing - return unsafe_wrap(Array, pointer(arr), size(arr)) + if sync == :read + _wait_to_read(arr) + elseif sync == :write + _wait_to_write(arr) + end + + unsafe_wrap(Array, pointer(arr), size(arr)) else # impossible to share, just copying - return copy(arr) + copy(arr) end end @@ -859,12 +871,12 @@ end Test whether `j_arr` is sharing data with `arr`. # Arguments: -* Array j_arr: the Julia Array. -* NDArray arr: the `NDArray`. + +* `j_arr::Array`: the Julia Array. +* `arr::NDArray`: the `NDArray`. """ -function is_shared(j_arr :: Array, arr :: NDArray) - false -end +is_shared(j_arr :: Array, arr :: NDArray) = false + function is_shared{T<:DType}(j_arr :: Array{T}, arr :: NDArray) if length(j_arr) != length(arr) return false diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 2185d920cc2a..67f395dbf95a 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -425,6 +425,16 @@ function test_kwargs() @test all(copy(tx) .== tA) end +function test_show() + let str = sprint(show, mx.NDArray([1 2 3 4])) + @test contains(str, "1x4") + @test contains(str, "mx.NDArray") + @test contains(str, "Int64") + @test contains(str, "CPU") + @test match(r"1\s+2\s+3\s+4", str) != nothing + end +end + ################################################################################ # Run tests ################################################################################ @@ -445,6 +455,7 @@ end test_dot() test_reshape() test_kwargs() + test_show() end end From 81b134ffa6af292d8c65b2de8d7a66d44b8eab5a Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 25 Oct 2017 05:39:06 +0800 Subject: [PATCH 524/630] ndarray: implement `fill` and `fill!` (#297) It serve as an API corresponds to Python's `mx.nd.full()` --- NEWS.md | 7 +++++++ src/ndarray.jl | 25 +++++++++++++++++++++++++ test/unittest/ndarray.jl 
| 37 +++++++++++++++++++++++++++++++++++++ 3 files changed, 69 insertions(+) diff --git a/NEWS.md b/NEWS.md index 773c2471c514..1ffca376c399 100644 --- a/NEWS.md +++ b/NEWS.md @@ -4,6 +4,13 @@ * `deepcopy` for NDArray (#273) +* `fill` and `fill!` for NDArray (#TBD) + An API correspond to Python's `mx.nd.full()` + + * `fill(x, dims, ctx=cpu())` + * `fill(x, dims...)` + * `fill!(x, arr::NDArray)` + ## API Changes * `reshape` of NDArray share the same interface with Base (#272). diff --git a/src/ndarray.jl b/src/ndarray.jl index 7e8ac40f9a03..5974c82f1972 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -703,6 +703,31 @@ function /(arg0 :: NDArray, arg :: Real) end +""" + fill!(x, arr::NDArray) + +Create an `NDArray` filled with the value `x`, like `Base.fill`. +""" +function fill!(x, arr::NDArray) + arr[:] = x + arr +end + +""" + fill(x, dims, ctx=cpu()) + fill(x, dims...) + +Create an `NDArray` filled with the value `x`, like `Base.fill`. +""" +function fill{N}(x, dims::NTuple{N, Integer}, ctx::Context=cpu()) + arr = empty(typeof(x), dims, ctx) + arr[:] = x + arr +end + +fill(x, dims::Integer...) 
= fill(x, dims) + + """ Manipulating as Julia Arrays ---------------------------- diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 67f395dbf95a..6944e7ed0829 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -413,6 +413,42 @@ function test_reshape() @test size(C) == (50, 4) end +function test_fill() + info("NDArray::fill") + thresh = 1e8 + + let x = mx.fill(42, 2, 3, 4) + @test eltype(x) == Int + @test size(x) == (2, 3, 4) + @test copy(x) == fill(42, 2, 3, 4) + end + + let x = mx.fill(Float32(42), 2, 3, 4) + @test eltype(x) == Float32 + @test size(x) == (2, 3, 4) + @test reldiff(copy(x), fill(Float32(42), 2, 3, 4)) < thresh + end + + let x = mx.fill(42, (2, 3, 4)) + @test eltype(x) == Int + @test size(x) == (2, 3, 4) + @test copy(x) == fill(42, 2, 3, 4) + end + + let x = mx.fill(Float32(42), (2, 3, 4)) + @test eltype(x) == Float32 + @test size(x) == (2, 3, 4) + @test reldiff(copy(x), fill(Float32(42), 2, 3, 4)) < thresh + end + + info("NDArray::fill!::arr") + let x = mx.fill!(42, mx.zeros(2, 3, 4)) + @test eltype(x) == Float32 + @test size(x) == (2, 3, 4) + @test reldiff(copy(x), fill(Float32(42), 2, 3, 4)) < thresh + end +end # function test_fill + function test_kwargs() info("NDArray::kwargs") dims1 = (2,3,4) @@ -454,6 +490,7 @@ end test_nd_as_jl() test_dot() test_reshape() + test_fill() test_kwargs() test_show() end From 71f2d40590bec90bc71583606a67de532e5adc74 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 26 Oct 2017 01:43:16 +0800 Subject: [PATCH 525/630] base: merge _julia_to_mx_param into dump_mx_param (#296) --- src/base.jl | 16 +++++++++------- src/ndarray.jl | 17 ++--------------- src/random.jl | 6 ++---- 3 files changed, 13 insertions(+), 26 deletions(-) diff --git a/src/base.jl b/src/base.jl index c013f17976ae..b078793d75e1 100644 --- a/src/base.jl +++ b/src/base.jl @@ -157,14 +157,16 @@ end # # TODO: find a better solution in case this cause issues in the future. 
################################################################################ -function dump_mx_param(val :: Any) - string(val) -end -function dump_mx_param{N,T<:Integer}(shape :: NTuple{N, T}) - string(tuple(flipdim([shape...],1)...)) -end +dump_mx_param(val::Any) = string(val) +dump_mx_param(val::Float64) = @sprintf("%.16e", val) +dump_mx_param(val::Float32) = @sprintf("%.8e", val) +dump_mx_param(val::Float16) = @sprintf("%.4e", val) +dump_mx_param{N, T<:Integer}(shape::NTuple{N, T}) = + string(tuple(flipdim([shape...], 1)...)) -"""A convenient macro copied from Mocha.jl that could be used to define structs + +""" +A convenient macro copied from Mocha.jl that could be used to define structs with default values and type checks. For example ```julia @defstruct MyStruct Any ( diff --git a/src/ndarray.jl b/src/ndarray.jl index 5974c82f1972..abe5a150d9ff 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1012,19 +1012,6 @@ end ACCEPT_EMPTY_MUTATE_TARGET = (1 << 2) ) -function _julia_to_mx_param(val :: Any) - string(val) -end -function _julia_to_mx_param(val :: Float64) - @sprintf("%.16e", val) -end -function _julia_to_mx_param(val :: Float32) - @sprintf("%.8e", val) -end -function _julia_to_mx_param(val :: Float16) - @sprintf("%.4e", val) -end - # Import corresponding math functions from base so the automatically defined libmxnet # functions can overload them import Base: sqrt @@ -1086,7 +1073,7 @@ function _get_ndarray_function_def(name :: String) # and in libmxnet. # See https://github.com/dmlc/MXNet.jl/pull/123 if $name == "transpose" - kwargs = Any[key != :axes ? (key, arg) : (key, reverse(map(i->length(arg)-i, arg))) for (key, arg) in kwargs] + kwargs = Any[key != :axes ? 
(key, arg) : (key, map(i->length(arg)-i, arg)) for (key, arg) in kwargs] end if length(output_vars) > 0 @@ -1100,7 +1087,7 @@ function _get_ndarray_function_def(name :: String) num_outputs_p = [convert(Cint, num_outputs)] kw_keys_str = String[string(x[1]) for x in kwargs] - kw_vals_str = String[_julia_to_mx_param(x[2]) for x in kwargs] + kw_vals_str = String[dump_mx_param(x[2]) for x in kwargs] #op_handle = _get_cached_libmx_op_handle($(QuoteNode(name))) op_handle = _get_cached_libmx_op_handle($(name)) diff --git a/src/random.jl b/src/random.jl index c021ef9a0fe7..2d594014da1c 100644 --- a/src/random.jl +++ b/src/random.jl @@ -15,8 +15,7 @@ julia> mx.rand(0, 1, mx.zeros(2, 2)) |> copy ``` """ function rand!(low::Real, high::Real, out::NDArray) - # XXX: note we reverse shape because julia and libmx has different dim order - _random_uniform(NDArray, low=low, high=high, shape=reverse(size(out)), out=out) + _random_uniform(NDArray, low=low, high=high, shape=size(out), out=out) end """ @@ -46,8 +45,7 @@ end Draw random samples from a normal (Gaussian) distribution. """ function randn!(mean::Real, stdvar::Real, out::NDArray) - # XXX: note we reverse shape because julia and libmx has different dim order - _random_normal(NDArray, loc=mean, scale=stdvar, shape=reverse(size(out)), out=out) + _random_normal(NDArray, loc=mean, scale=stdvar, shape=size(out), out=out) end """ From 3824df0b33c0a860d1bf9205b41bee5b0b5557b5 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 27 Oct 2017 05:50:01 +0800 Subject: [PATCH 526/630] Fix mx.chain var reference in macro (#299) fix #298 --- src/nn-factory.jl | 2 +- src/symbolic-node.jl | 3 ++- test/unittest/symbolic-node.jl | 13 +++++++++++++ 3 files changed, 16 insertions(+), 2 deletions(-) diff --git a/src/nn-factory.jl b/src/nn-factory.jl index 76babffbe035..ab88d21adf29 100644 --- a/src/nn-factory.jl +++ b/src/nn-factory.jl @@ -21,7 +21,7 @@ fully connected layers. Returns the constructed MLP. 
""" -function MLP(input, spec; hidden_activation::Base.Symbol=:relu, prefix=gensym()) +function MLP(input, spec; hidden_activation::Symbol=:relu, prefix=gensym()) spec = convert(Vector{Union{Int,Tuple}}, spec) n_layer = length(spec) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 4e1ed433bb88..3ae545334953 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -893,7 +893,8 @@ macro chain(layers) return esc(layer) else if @capture(layer, f_(x__)) - return :($f($last_layer, $(x...))) + x′ = esc.(x) + return :($f($last_layer, $(x′...))) else throw(AssertionError("$layer is not a valid function call and cannot be chained.")) end diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 688a010794f7..e81ef52055b1 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -23,6 +23,19 @@ function test_chain() @test mx.list_arguments(model) == [:data,:fc1_weight,:fc1_bias,:fc2_weight,:fc2_bias] @test mx.list_outputs(model) == [:fc2_output] @test mx.list_auxiliary_states(model) == Symbol[] + + let layerconfig = [20, 10, 6] + model = @mx.chain mx.Variable(:data) => + mx.MLP(layerconfig, prefix=:magic_) => + mx.LinearRegressionOutput(mx.Variable(:label)) + + @test mx.list_arguments(model) == [ + :data, + :magic_fc1_weight, :magic_fc1_bias, + :magic_fc2_weight, :magic_fc2_bias, + :magic_fc3_weight, :magic_fc3_bias, + :label] + end end function test_internal() From 41f8f55129676b9eaf0fef76052c0369aa175b3b Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 31 Oct 2017 23:57:18 +0800 Subject: [PATCH 527/630] visualize: fix node_attr on upstream master (#301) Ref: https://github.com/dmlc/nnvm/pull/152/files#diff-8fb4ac5650c04b74642d321b992f8db0R82 --- src/visualize.jl | 9 +++++---- test/unittest/visualize.jl | 2 +- 2 files changed, 6 insertions(+), 5 deletions(-) diff --git a/src/visualize.jl b/src/visualize.jl index ea700b704266..91bbd0c48481 100644 --- a/src/visualize.jl +++ b/src/visualize.jl @@ -51,10 
+51,11 @@ function to_graphviz(network :: SymbolicNode; title="Network Visualization", inp attr = deepcopy(node_attr) label = op - # Up to 0.8 version of mxnet additional info was stored in - # node["param"]. Staring from pre0.9 `param` was changed to `attr`. - if haskey(node, "param") - node_info = node["param"] + # Up to 0.11.0 version of mxnet additional info was stored in + # node["attr"]. Staring from 0.12 `attr` was changed to `attrs`. + # See: https://github.com/dmlc/nnvm/pull/152 + if haskey(node, "attrs") + node_info = node["attrs"] elseif haskey(node, "attr") node_info = node["attr"] end diff --git a/test/unittest/visualize.jl b/test/unittest/visualize.jl index 3bdaa12824d2..f4ccbf0e5a81 100644 --- a/test/unittest/visualize.jl +++ b/test/unittest/visualize.jl @@ -12,7 +12,7 @@ function test_basic() info("Visualize::basic") mlp = mlp2() - + # Order of elements or default color values can change, but length of the output should be more or less stable @test length(mx.to_graphviz(mlp)) == length( """ From 9fcab401182f9212eea0da88b7a55ebcf113c238 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 6 Nov 2017 23:57:00 +0800 Subject: [PATCH 528/630] symbol: add Base.show (#302) --- src/symbolic-node.jl | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 3ae545334953..9312ea5dd7c5 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -220,6 +220,9 @@ function get_name(self :: mx.SymbolicNode) return Symbol(unsafe_string(name[])) end +Base.show(io::IO, sym::SymbolicNode) = + print(io, "$(typeof(sym)) $(get_name(sym))") + import Base: print function print(io :: IO, sym :: SymbolicNode) From 4f182ee42cec55b9dc9aef078fd66c38c42ff266 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 7 Nov 2017 03:35:50 +0800 Subject: [PATCH 529/630] ndarray: more Base-like APIs (#303) * ndarray: make API of `sum` and `mean` be Base-like - also fix the axis value mapping - `mean(arr, axis=0)` is not Julian * ndarray: 
Base-like `maximum` and `minimum` - remove `mx.max`, `mx.min`, `mx.max_axis` and `mx.min_axis` * ndarray: simple doc while remapping with `@_remap` * ndarray: more test cases for dim as tuple * ndarray: remap dot, the elegent way * ndarray: remap `transpose` and add `permutedims` * ndarray: docs of _remap * ndarray: remap `prod` * util: add _sig_checker for discovering non-Julian APIs * travis: add _sig_checker after testing --- .travis.yml | 3 + NEWS.md | 32 ++++++++- src/ndarray.jl | 148 +++++++++++++++++++++++++++++---------- src/util.jl | 25 +++++++ test/unittest/ndarray.jl | 96 ++++++++++++++++++++++--- 5 files changed, 254 insertions(+), 50 deletions(-) diff --git a/.travis.yml b/.travis.yml index 68b1cb1b8b00..aed248bcb23d 100644 --- a/.travis.yml +++ b/.travis.yml @@ -41,6 +41,9 @@ script: - travis_wait 60 ${TRAVIS_DIR}/run_test.sh after_success: + # See https://github.com/dmlc/MXNet.jl/pull/303#issuecomment-341171774 + - julia -e 'using MXNet; mx._sig_checker()' + - source ${TRAVIS_DIR}/run_coverage.sh - echo $TRAVIS_JULIA_VERSION - julia -e 'Pkg.add("Documenter")' diff --git a/NEWS.md b/NEWS.md index 1ffca376c399..b538b7160c3f 100644 --- a/NEWS.md +++ b/NEWS.md @@ -13,12 +13,12 @@ ## API Changes -* `reshape` of NDArray share the same interface with Base (#272). +* `reshape` of NDArray shares the same interface with Base (#272). * `reshape(NDArray, dim; reverse=false)` * `reshape(NDArray, dim...; reverse=false)` * `Reshape` deprecated. -* `reshape` of SymbolicNode share the same interface with Base +* `reshape` of SymbolicNode shares the same interface with Base and additional keyword argument (#279). * `reshape(SymbolicNode, dim; reverse=false, name)` @@ -27,6 +27,34 @@ * `srand!` deprecated, please use `srand` (#282) +* `mean` and `sum` of NDArray share the same interface with Base + and fix the `axis` indexing (#TBD). + + * This is a breaking change; no deprecated warning. 
+ * Before: `mean(arr, axis=0)` + * After: `mean(arr, 1)` + +* `max` and `min` of NDArray renamed to `maximum` and `minimum` and share the + same interface with Base. The `axis` indexing is fixed, also. (#TBD) + + * This is a breaking change; no deprecated warning. + * Before: `mx.max(arr, axis=0)` or `mx.max_axis(arr, axis=0)` + * After: `maximum(arr, 1)` + +* `mx.transpose` for high dimension NDArray has been renamed to `permutedims` + and shares the same interface with Base. (#TBD) + + * This is a breaking changes; no deprecated warning. + * Before: `mx.transpose(A, axis=[2, 1, 3])` + * After: `permutedims(A, [2, 1, 3])` + +* `prod` of `NDArray` shares the same interface with Base and fix + the `axis` indexing. (#TBD). + + * This is a breaking change; no deprecated warning. + * Before: `prod(arr, axis=-1)` + * After: `prod(arr, 1)` + # v0.2.2 (2017.05.14) * Updated supported version of MXNet to 0.9.4. * Improved build-system with support for auto-detecting GPU support. diff --git a/src/ndarray.jl b/src/ndarray.jl index abe5a150d9ff..458c67f5745c 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -99,7 +99,7 @@ type NDArray end function Base.show(io :: IO, arr :: NDArray) - println(io, "$(join(size(arr), "x")) mx.NDArray{$(eltype(arr))} @ $(context(arr)):") + println(io, "$(join(size(arr), "×")) mx.NDArray{$(eltype(arr))} @ $(context(arr)):") Base.showarray(io, try_get_shared(arr, sync=:read), false, header=false) end @@ -971,31 +971,106 @@ function save(filename::String, data::Dict{Base.Symbol,NDArray}) filename, length(names), arrays, names) end -import Base: reshape +################################################################################ +# Mapping NDArray functions to Base-like API +################################################################################ -""" - reshape(arr::NDArray, dim...; reverse=false) - reshape(arr::NDArray, dim; reverse=false) -""" -reshape{N}(arr::NDArray, dim::NTuple{N, Integer}; reverse::Bool=false) = - _reshape(arr, 
dim, reverse) -reshape{N}(arr::NDArray, dim::Vararg{Integer, N}; reverse::Bool=false) = - _reshape(arr, dim, reverse) +const _mxsig = Dict{Symbol,Expr}() + +function _autoimport(name::Symbol) + if isdefined(Base, name) + :(import Base: $name) + else + :() + end +end + +macro _remap(sig::Expr, imp::Expr) + fname = sig.args[1] + opname = string(imp.args[1]) -@inline function _reshape{N}(arr::NDArray, dim::NTuple{N, Integer}, reverse::Bool) - op_handle = _get_cached_libmx_op_handle("reshape") - n_output = Ref(Cint(0)) - hdls_ref = Ref{Ptr{MX_handle}}(C_NULL) - @mxcall(:MXImperativeInvoke, - (MX_handle, Cint, Ptr{MX_handle}, Ref{Cint}, Ref{Ptr{MX_handle}}, - Cint, char_pp, char_pp), - op_handle, 1, [arr.handle], n_output, hdls_ref, - 2, ["shape", "reverse"], [dump_mx_param(dim), dump_mx_param(!reverse)]) - # not a typo ^^^^^^^^ - @assert n_output[] == 1 - NDArray(MX_NDArrayHandle(unsafe_load(hdls_ref[], 1))) + import_expr = _autoimport(fname) + + if isa(imp.args[2], Expr) && imp.args[2].head == :parameters + ndin = imp.args[3:end] + mxargs = imp.args[2].args + else # no keyword arguments + ndin = imp.args[2:end] + mxargs = [] + end + + mxkeys = map(x -> string(x.args[1]), mxargs) + mxvals = Expr(:vect, map(x -> :(dump_mx_param($(x.args[2]))), mxargs)...) + ndhlds = Expr(:vect, map(x -> :($(x).handle), ndin)...) 
+ + func_body = quote + op_handle = _get_cached_libmx_op_handle($opname) + n_output = Ref(Cint(0)) + hdls_ref = Ref{Ptr{MX_handle}}(C_NULL) + @mxcall(:MXImperativeInvoke, + (MX_handle, + Cint, + Ptr{MX_handle}, + Ref{Cint}, + Ref{Ptr{MX_handle}}, + Cint, + char_pp, + char_pp), + op_handle, + $(length(ndin)), + $(ndhlds), + n_output, + hdls_ref, + $(length(mxargs)), + $mxkeys, + $mxvals) + NDArray(MX_NDArrayHandle(unsafe_load(hdls_ref[], 1))) + end + + docstr = " $sig" + func_def = Expr(:function, sig, func_body) + + esc(quote + $import_expr + @doc $docstr -> + $func_def + end) end +macro _remap(sig::Expr, imp::Symbol) + imp = _mxsig[imp] + + esc(quote + @_remap($sig, $imp) + end) +end + +_mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) +@_remap reshape(arr::NDArray, dim...; reverse = false) reshape +@_remap reshape(arr::NDArray, dim; reverse = false) reshape + +@_remap mean(arr::NDArray) mean(arr) +@_remap mean(arr::NDArray, region) mean(arr; axis = 0 .- region, keepdims = true) + +@_remap sum(arr::NDArray) sum(arr) +@_remap sum(arr::NDArray, dims) sum(arr; axis = 0 .- dims, keepdims = true) + +@_remap maximum(arr::NDArray) max(arr) +@_remap maximum(arr::NDArray, dims) max(arr; axis = 0 .- dims, keepdims = true) + +@_remap minimum(arr::NDArray) min(arr) +@_remap minimum(arr::NDArray, dims) min(arr; axis = 0 .- dims, keepdims = true) + +# See https://github.com/dmlc/MXNet.jl/issues/55 +@_remap dot(x::NDArray, y::NDArray) dot(y, x) + +# See https://github.com/dmlc/MXNet.jl/pull/123 +@_remap transpose(arr::NDArray) transpose(_only2d(arr)) +@_remap permutedims(arr::NDArray, axes) transpose(arr; axes = length(axes) .- tuple(axes...)) + +@_remap prod(arr::NDArray) prod(arr) +@_remap prod(arr::NDArray, dims) prod(arr; axis = 0 .- dims, keepdims = true) + ################################################################################ # NDArray functions dynamically imported from libmxnet 
################################################################################ @@ -1063,19 +1138,6 @@ function _get_ndarray_function_def(name :: String) args = MX_handle[] end - # XXX: hacky way of solving the problem that the arguments of `dot` should be swapped - # See https://github.com/dmlc/MXNet.jl/issues/55 - if $name == "dot" - args = reverse(args) - end - - # XXX: hacky way of solving the semantic difference of the axes parameter in Julia - # and in libmxnet. - # See https://github.com/dmlc/MXNet.jl/pull/123 - if $name == "transpose" - kwargs = Any[key != :axes ? (key, arg) : (key, map(i->length(arg)-i, arg)) for (key, arg) in kwargs] - end - if length(output_vars) > 0 output_handles = map((x) -> Base.cconvert(MX_handle, x), output_vars) # XXX: Julia 0.4 has bug: [Array{MX_handle}] == Array{MX_handle} @@ -1123,9 +1185,21 @@ function _get_ndarray_function_def(name :: String) return func_def, func_def2 end +const _op_import_bl = [ # import black list; do not import these funcs + "mean", + "reshape", + "sum", + "max", + "max_axis", + "min", + "min_axis", + "dot", + "transpose", + "prod", +] + macro _import_ndarray_functions() - black_list = ["reshape"] # do not import these funcs - names = filter(n -> ∉(lowercase(n), black_list), _get_libmx_op_names()) + names = filter(n -> ∉(lowercase(n), _op_import_bl), _get_libmx_op_names()) func_exprs = map(names) do name op_handle = _get_libmx_op_handle(name) diff --git a/src/util.jl b/src/util.jl index 6f7dc1ba73ac..54a633fbb73a 100644 --- a/src/util.jl +++ b/src/util.jl @@ -163,3 +163,28 @@ function _format_signature(narg::Int, arg_names::Ref{char_pp}) return join([unsafe_string(name) for name in arg_names] , ", ") end +@inline function _only2d(x) + @assert ndims(x) == 2 + x +end + +""" +libmxnet operators signature checker. 
+""" +function _sig_checker() + names = filter(n -> ∉(lowercase(n), _op_import_bl), _get_libmx_op_names()) + foreach(names) do name + op_handle = _get_libmx_op_handle(name) + + desc, key_narg = _get_libmx_op_description(name, op_handle) + _sig = desc |> s -> split(s, '\n') |> first |> strip + _m = match(r"(axis|axes|keepdims|shape)", _sig) + + if _m === nothing + return + end + + warn(_sig) + + end +end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 6944e7ed0829..61161f2c7fd8 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -413,6 +413,71 @@ function test_reshape() @test size(C) == (50, 4) end +function test_sum() + info("NDArray::sum") + + let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + @test copy(sum(X))[] == sum(A) + @test copy(sum(X, 1)) == sum(A, 1) + @test copy(sum(X, 2)) == sum(A, 2) + @test copy(sum(X, 3)) == sum(A, 3) + @test copy(sum(X, [1, 2])) == sum(A, [1, 2]) + @test copy(sum(X, (1, 2))) == sum(A, (1, 2)) + end +end + +function test_mean() + info("NDArray::mean") + + let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + @test copy(mean(X))[] == mean(A) + @test copy(mean(X, 1)) == mean(A, 1) + @test copy(mean(X, 2)) == mean(A, 2) + @test copy(mean(X, 3)) == mean(A, 3) + @test copy(mean(X, [1, 2])) == mean(A, [1, 2]) + @test copy(mean(X, (1, 2))) == mean(A, (1, 2)) + end +end + +function test_maximum() + info("NDArray::maximum") + + let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + @test copy(maximum(X))[] == maximum(A) + @test copy(maximum(X, 1)) == maximum(A, 1) + @test copy(maximum(X, 2)) == maximum(A, 2) + @test copy(maximum(X, 3)) == maximum(A, 3) + @test copy(maximum(X, [1, 2])) == maximum(A, [1, 2]) + @test copy(maximum(X, (1, 2))) == maximum(A, (1, 2)) + end +end + +function test_minimum() + info("NDArray::minimum") + + let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + @test copy(minimum(X))[] == minimum(A) + @test copy(minimum(X, 1)) == 
minimum(A, 1) + @test copy(minimum(X, 2)) == minimum(A, 2) + @test copy(minimum(X, 3)) == minimum(A, 3) + @test copy(minimum(X, [1, 2])) == minimum(A, [1, 2]) + @test copy(minimum(X, (1, 2))) == minimum(A, (1, 2)) + end +end + +function test_prod() + info("NDArray::prod") + + let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + @test copy(prod(X))[] == prod(A) + @test copy(prod(X, 1)) == prod(A, 1) + @test copy(prod(X, 2)) == prod(A, 2) + @test copy(prod(X, 3)) == prod(A, 3) + @test copy(prod(X, [1, 2])) == prod(A, [1, 2]) + @test copy(prod(X, (1, 2))) == prod(A, (1, 2)) + end +end + function test_fill() info("NDArray::fill") thresh = 1e8 @@ -449,21 +514,25 @@ function test_fill() end end # function test_fill -function test_kwargs() - info("NDArray::kwargs") - dims1 = (2,3,4) +function test_transpose() + info("NDArray::transpose") + let A = rand(Float32, 2, 3), x = mx.NDArray(A) + @test size(x) == (2, 3) + @test size(x') == (3, 2) + end - A = rand(Float32, dims1) - x = mx.NDArray(A) - tx = mx.transpose(x, axes=(2,1,3)) - tA = permutedims(A, [2,1,3]) - @test size(tx) == size(tA) - @test all(copy(tx) .== tA) + info("NDArray::permutedims") + let A = collect(Float32, reshape(1.0:24, 2, 3, 4)), x = mx.NDArray(A) + A′ = permutedims(A, [2, 1, 3]) + x′ = permutedims(x, [2, 1, 3]) + @test size(A′) == size(x′) + @test A′ == copy(x′) + end end function test_show() let str = sprint(show, mx.NDArray([1 2 3 4])) - @test contains(str, "1x4") + @test contains(str, "1×4") @test contains(str, "mx.NDArray") @test contains(str, "Int64") @test contains(str, "CPU") @@ -490,8 +559,13 @@ end test_nd_as_jl() test_dot() test_reshape() + test_sum() + test_mean() + test_maximum() + test_minimum() + test_prod() test_fill() - test_kwargs() + test_transpose() test_show() end From a3317f13dff102ffd2a113811d5ee77ea51ab72d Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 7 Nov 2017 03:39:48 +0800 Subject: [PATCH 530/630] ndarray: implement rdiv (#292) * ndarray: implement rdiv e.g. 
```julia 1 ./ mx.NDArray(Float32[1 2; 3 4]) ``` * typo --- NEWS.md | 2 +- src/ndarray.jl | 31 ++++++++++++++++++++++++------- test/unittest/ndarray.jl | 40 ++++++++++++++++++++++++++++++++++++++++ 3 files changed, 65 insertions(+), 8 deletions(-) diff --git a/NEWS.md b/NEWS.md index b538b7160c3f..9840cc52ce6c 100644 --- a/NEWS.md +++ b/NEWS.md @@ -3,7 +3,7 @@ ## New API * `deepcopy` for NDArray (#273) - +* `scalar ./ NDArray` is available now. (#292) * `fill` and `fill!` for NDArray (#TBD) An API correspond to Python's `mx.nd.full()` diff --git a/src/ndarray.jl b/src/ndarray.jl index 458c67f5745c..1a1a3b9f347c 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -682,25 +682,42 @@ function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) end end +""" +Elementwise division of NDArray +""" +div(x::NDArray, y::NDArray) = _div(x, y) +div(x::NDArray, s::Real) = _div_scalar(x, scalar=s) +div(s::Real, x::NDArray) = _rdiv_scalar(x, scalar=s) + import Base: / """ ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) Elementwise dividing an `NDArray` by a scalar or another `NDArray` of the same shape. """ -@compatdot function Base.broadcast(::typeof(/), arg0 :: NDArray, arg :: Union{Real, NDArray}) - ret = copy(arg0, context(arg0)) - div_from!(ret, arg) +@compatdot function Base.broadcast(::typeof(/), arg0 :: NDArray, + arg :: Union{Real, NDArray}) + div(arg0, arg) +end + +@compatdot function Base.broadcast(::typeof(/), arg0 :: Real, arg :: NDArray) + div(arg0, arg) end """ /(arg0 :: NDArray, arg :: Real) -Divide an `NDArray` by a scalar. Matrix division (solving linear systems) is not implemented yet. +Divide an `NDArray` by a scalar. +Matrix division (solving linear systems) is not implemented yet. """ -function /(arg0 :: NDArray, arg :: Real) - arg0 ./ arg -end +/(arg0 :: NDArray, arg :: Real) = div(arg0, arg) + +""" + /(arg0 :: Real, arg :: NDArray) + +Elementwise divide a scalar by an `NDArray`. 
+""" +/(arg0 :: Real, arg :: NDArray) = div(arg0, arg) """ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 61161f2c7fd8..2b731f6beded 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -264,8 +264,47 @@ function test_div() t6, a6 = rand_tensors(Float16, dims) scalar_large = 1e4 @test reldiff(t6 / scalar_large, copy(a6 ./ scalar_large)) < 1e-1 + + let x = mx.NDArray([1 2; 3 4]) + @test eltype(x) == Int + @test copy(x / 2) == [0 1; 1 2] + @test copy(x / 2.5) == [0 1; 1 2] + @test copy(x / 2.9) == [0 1; 1 2] + end end + +function test_rdiv() + info("NDarray::rdiv") + + info("NDarray::rdiv::Inf16") + let x = 1 ./ mx.zeros(Float16, 4) + @test copy(x) == [Inf16, Inf16, Inf16, Inf16] + end + + info("NDarray::rdiv::Inf32") + let x = 1 ./ mx.zeros(Float32, 4) + @test copy(x) == [Inf32, Inf32, Inf32, Inf32] + end + + info("NDarray::rdiv::Inf64") + let x = 1 ./ mx.zeros(Float64, 4) + @test copy(x) == [Inf64, Inf64, Inf64, Inf64] + end + + info("NDarray::rdiv::Int") + let x = 1 ./ mx.NDArray([1 2; 3 4]) + @test copy(x) == [1 0; 0 0] + end + + info("NDarray::rdiv::Float32") + let x = 1 ./ mx.NDArray(Float32[1 2; 3 4]) + y = 1 ./ Float32[1 2; 3 4] + @test reldiff(copy(x), y) < 1e8 + end +end # function test_rdiv + + function test_gd() dims = rand_dims() tw, aw = rand_tensors(dims) @@ -551,6 +590,7 @@ end test_minus() test_mul() test_div() + test_rdiv() test_gd() test_saveload() test_clip() From 8cc5c1c44864d10e9475e80aa6c01700cdbaa60a Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 7 Nov 2017 13:27:29 +0800 Subject: [PATCH 531/630] util: docstring of _sig_checker (#305) --- src/util.jl | 14 ++++++++++++++ 1 file changed, 14 insertions(+) diff --git a/src/util.jl b/src/util.jl index 54a633fbb73a..6877200d87b8 100644 --- a/src/util.jl +++ b/src/util.jl @@ -170,6 +170,20 @@ end """ libmxnet operators signature checker. + +C/Python have different convernsion of accessing array. 
Those languages +handle arrays in row-major order with zero-based indexing, which differs from Julia's +column-major order and 1-based indexing. + +This function scans the docstrings of NDArray's APIs, +and selects the signatures which contain `axis`, `axes`, `keepdims` or `shape` +as a function argument. + +We invoke this checker in the Travis CI build and emit a warning message +if such a function has not been manually mapped +(which implies its dimension referencing may look weird). + +If you find any such warning in the Travis CI build, please open an issue on GitHub. """ function _sig_checker() names = filter(n -> ∉(lowercase(n), _op_import_bl), _get_libmx_op_names()) From a488d7a564418bc1eae288d664fb16cc9f512226 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 7 Nov 2017 23:25:02 +0800 Subject: [PATCH 532/630] ndarray: intro TakingBroadcastSeriously and broadcast unfusing (#300) * ndarray: TakingBroadcastSeriously and broadcast unfusing * ndarray: test cases for elementwise mul close #253 * Drop 0.5 support * fixup! ndarray: TakingBroadcastSeriously and broadcast unfusing --- .travis.yml | 3 +- NEWS.md | 15 +++++ REQUIRE | 3 +- appveyor.yml | 1 - docs/make.jl | 2 +- docs/mkdocs.yml | 2 +- src/MXNet.jl | 2 + src/ndarray.jl | 137 +++++++++++++++------------------------ test/unittest/ndarray.jl | 31 +++++---- 9 files changed, 93 insertions(+), 103 deletions(-) diff --git a/.travis.yml b/.travis.yml index aed248bcb23d..734de9e1eff9 100644 --- a/.travis.yml +++ b/.travis.yml @@ -6,7 +6,6 @@ os: - osx osx_image: xcode8 julia: - - 0.5 - 0.6 # - nightly 0.6 supports depends on #170 @@ -38,7 +37,7 @@ script: # bump the time limit of no ouput # the `travis_wait` wrapper can be removed once this issue fixed: # https://github.com/JuliaLang/julia/pull/23601 - - travis_wait 60 ${TRAVIS_DIR}/run_test.sh + - ${TRAVIS_DIR}/run_test.sh after_success: # See https://github.com/dmlc/MXNet.jl/pull/303#issuecomment-341171774 diff --git a/NEWS.md b/NEWS.md index 9840cc52ce6c..a848a72c9b02 100644 --- a/NEWS.md +++ b/NEWS.md 
@@ -1,5 +1,7 @@ # v0.3.0 (TBD) +* Drop 0.5 support. (#TBD) + ## New API * `deepcopy` for NDArray (#273) @@ -11,6 +13,19 @@ * `fill(x, dims...)` * `fill!(x, arr::NDArray)` +* Matrix (2D NDArray) multiplication is available now. (#TBD) + + ```julia + julia> x + 1x2 mx.NDArray{Float64} @ CPU0: + 1.0 2.0 + + julia> x' * x + 2x2 mx.NDArray{Float64} @ CPU0: + 1.0 2.0 + 2.0 4.0 + ``` + ## API Changes * `reshape` of NDArray shares the same interface with Base (#272). diff --git a/REQUIRE b/REQUIRE index ca30ebc84ff9..8c07e3f8b273 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,6 +1,7 @@ -julia 0.5.2 +julia 0.6 Compat 0.25.2 Formatting BinDeps JSON MacroTools +TakingBroadcastSeriously diff --git a/appveyor.yml b/appveyor.yml index e3d1984f4732..449465246eff 100644 --- a/appveyor.yml +++ b/appveyor.yml @@ -1,6 +1,5 @@ environment: matrix: - - JULIA_URL: "https://julialang-s3.julialang.org/bin/winnt/x64/0.5/julia-0.5-latest-win64.exe" - JULIA_URL: "https://julialang-s3.julialang.org/bin/winnt/x64/0.6/julia-0.6-latest-win64.exe" branches: diff --git a/docs/make.jl b/docs/make.jl index a84f680711a5..0a2b01d25cc8 100644 --- a/docs/make.jl +++ b/docs/make.jl @@ -8,5 +8,5 @@ makedocs( deploydocs( deps = Deps.pip("pygments", "mkdocs", "mkdocs-material", "python-markdown-math"), repo = "github.com/dmlc/MXNet.jl.git", - julia = "0.5", + julia = "0.6", ) diff --git a/docs/mkdocs.yml b/docs/mkdocs.yml index ed18e479ae37..e636a194196d 100644 --- a/docs/mkdocs.yml +++ b/docs/mkdocs.yml @@ -33,7 +33,7 @@ pages: - Installation Guide: user-guide/install.md - Overview: user-guide/overview.md - FAQ: user-guide/faq.md - - API Documentation: + - API Documentation: - Context: api/context.md - Models: api/model.md - Initializers: api/initializer.md diff --git a/src/MXNet.jl b/src/MXNet.jl index 142f1a06d5be..a527eb6ec4c2 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -17,6 +17,8 @@ end using Formatting using MacroTools +using TakingBroadcastSeriously: @unfuse +import TakingBroadcastSeriously: 
broadcast_ # Functions from base that we can safely extend and that are defined by libmxnet. import Base: round, ceil, floor, cos, sin, abs, sign, exp, sqrt, exp, log, norm, diff --git a/src/ndarray.jl b/src/ndarray.jl index 1a1a3b9f347c..c3d80fb43914 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -98,6 +98,10 @@ type NDArray end end +const NDArrayOrReal = Union{NDArray, Real} + +@unfuse NDArray + function Base.show(io :: IO, arr :: NDArray) println(io, "$(join(size(arr), "×")) mx.NDArray{$(eltype(arr))} @ $(context(arr)):") Base.showarray(io, try_get_shared(arr, sync=:read), false, header=false) @@ -553,7 +557,6 @@ function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) return dst end -import Base.broadcast import Base: + """ @@ -561,23 +564,13 @@ import Base: + .+(args...) Summation. Multiple arguments of either scalar or `NDArray` could be -added together. Note at least the first or second argument needs to be an `NDArray` to -avoid ambiguity of built-in summation. +added together. Note at least the first or second argument needs to be an +`NDArray` to avoid ambiguity of built-in summation. """ -function +(arg0 :: NDArray, args :: Union{Real, NDArray}...) - ret = copy(arg0, context(arg0)) - add_to!(ret, args...) -end -@compatdot function Base.broadcast(::typeof(+), arg0 :: NDArray, args :: Union{Real, NDArray}...) - +(arg0, args...) -end -function +(arg0 :: Real, arg1 :: NDArray, args :: Union{Real, NDArray}...) - +(arg1, arg0, args...) -end -@compatdot function Base.broadcast(::typeof(+), arg0 :: Real, arg1 :: NDArray, - args :: Union{Real, NDArray}...) - broadcast(+, arg1, arg0, args...) -end ++(x::NDArray, ys::NDArrayOrReal...) = add_to!(copy(x, context(x)), ys...) + +broadcast_(::typeof(+), x::NDArray, y::NDArrayOrReal) = x + y +broadcast_(::typeof(+), x::Real, y::NDArray) = x + y """ sub_from!(dst :: NDArray, args :: Union{Real, NDArray}...) 
@@ -596,32 +589,19 @@ end import Base: - """ - -(arg0, arg1) - -(arg0) - .-(arg0, arg1) + -(x::NDArray) + -(x, y) + .-(x, y) -Subtraction `arg0 - arg1`, of scalar types or `NDArray`. Or create -the negative of `arg0`. +Subtraction `x - y`, of scalar types or `NDArray`. +Or create the negative of `x`. """ -function -(arg0 :: NDArray, arg1 :: Union{Real, NDArray}) - ret = copy(arg0, context(arg0)) - sub_from!(ret, arg1) -end -@compatdot function Base.broadcast(::typeof(-), arg0 :: NDArray, arg1 :: Union{Real, NDArray}) - -(arg0, arg1) -end -function -(arg0 :: Real, arg1 :: NDArray) - ret = -arg1 - add_to!(ret, arg0) - return ret -end -@compatdot function Base.broadcast(::typeof(-), arg0 :: Real, arg1 :: NDArray) - -(arg0, arg1) -end +-(x::NDArray) = _mul_scalar(x, scalar=-one(eltype(x))) +-(x::NDArray, y::NDArrayOrReal) = sub_from!(copy(x, context(x)), y) +-(x::Real, y::NDArray) = -y .+ x -function -(arg0 :: NDArray) - _mul_scalar(arg0, scalar=-one(eltype(arg0))) -end +broadcast_(::typeof(-), x::NDArray, y::NDArrayOrReal) = x - y +broadcast_(::typeof(-), x::Real, y::NDArray) = x - y """ mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) @@ -636,36 +616,31 @@ function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) else _mul(dst, arg, out=dst) end - return dst end import Base: * """ - .*(arg0, arg1) + .*(x, y) -Elementwise multiplication of `arg0` and `arg`, could be either scalar or `NDArray`. +Currently only multiplication a scalar with an `NDArray` is implemented. 
""" -@compatdot function Base.broadcast(::typeof(*), arg0 :: NDArray, arg :: Union{Real, NDArray}) - ret = copy(arg0, context(arg0)) - mul_to!(ret, arg) -end -@compatdot function Base.broadcast(::typeof(*), arg0 :: Real, arg :: NDArray) - arg .* arg0 -end +*(x:: NDArray, y::Real) = x .* y +*(x::Real, y::NDArray) = y .* x + +broadcast_(::typeof(*), x::NDArray, y::NDArrayOrReal) = + mul_to!(copy(x, context(x)), y) +broadcast_(::typeof(*), x::Real, y::NDArray) = y .* x """ - *(arg0, arg1) + *(A::NDArray, B::NDArray) -Currently only multiplication a scalar with an `NDArray` is implemented. Matrix multiplication -is to be added soon. +Matrix (2D NDArray) multiplication. """ -function *(arg0 :: NDArray, arg :: Real) - ret = copy(arg0, context(arg0)) - mul_to!(ret, arg) -end -function *(arg0 :: Real, arg :: NDArray) - *(arg, arg0) +function *(x::NDArray, y::NDArray) + @assert ndims(x) == 2 + @assert ndims(y) == 2 + dot(x, y) end """ @@ -683,42 +658,36 @@ function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) end """ -Elementwise division of NDArray -""" -div(x::NDArray, y::NDArray) = _div(x, y) -div(x::NDArray, s::Real) = _div_scalar(x, scalar=s) -div(s::Real, x::NDArray) = _rdiv_scalar(x, scalar=s) + rdiv_from!(x:: Real, y::NDArray) -import Base: / +Elementwise divide a scalar by an `NDArray`. Inplace updating. """ - ./(arg0 :: NDArray, arg :: Union{Real, NDArray}) - -Elementwise dividing an `NDArray` by a scalar or another `NDArray` of the same shape. -""" -@compatdot function Base.broadcast(::typeof(/), arg0 :: NDArray, - arg :: Union{Real, NDArray}) - div(arg0, arg) +function rdiv_from!(x::Real, y::NDArray) + @assert y.writable + _rdiv_scalar(y, scalar=convert(eltype(y), x), out=y) end -@compatdot function Base.broadcast(::typeof(/), arg0 :: Real, arg :: NDArray) - div(arg0, arg) -end +import Base: / """ - /(arg0 :: NDArray, arg :: Real) + ./(x::NDArray, y::NDArray) + ./(x::NDArray, y::Real) + ./(x:: Real, y::NDArray) -Divide an `NDArray` by a scalar. 
-Matrix division (solving linear systems) is not implemented yet. -""" -/(arg0 :: NDArray, arg :: Real) = div(arg0, arg) +* Elementwise dividing an `NDArray` by a scalar or another `NDArray` +of the same shape. -""" - /(arg0 :: Real, arg :: NDArray) +* Elementwise divide a scalar by an `NDArray`. -Elementwise divide a scalar by an `NDArray`. +* Matrix division (solving linear systems) is not implemented yet. """ -/(arg0 :: Real, arg :: NDArray) = div(arg0, arg) +/(x::NDArray, y::Real) = x ./ y + +broadcast_(::typeof(/), x::NDArray, y::NDArrayOrReal) = + div_from!(copy(x, context(x)), y) +broadcast_(::typeof(/), x::Real, y::NDArray) = + rdiv_from!(x, copy(y, context(y))) """ fill!(x, arr::NDArray) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 2b731f6beded..a15291f8b3fe 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -223,6 +223,18 @@ function test_mul() t6, a6 = rand_tensors(Float16, dims) scalar_small = Float16(1e-5) @test reldiff(t6 * scalar_small, copy(a6 .* scalar_small)) < 1e-1 + + info("NDArray::mul::matrix multiplication") + let x = mx.NDArray([1. 2]) + y = x' * x + @test copy(y) == [1. 2; 2 4] + end + + info("NDArray::mul::elementwise::issue 253") + let x = mx.NDArray([1. 2]) + y = x .* x + @test copy(y) == [1. 4.] 
+ end end function test_div() @@ -246,31 +258,24 @@ function test_div() # test scalar scalar = rand() + 2 - @test reldiff(t2./scalar, copy(a2./scalar)) < thresh + @test reldiff(t2 ./ scalar, copy(a2 ./ scalar)) < thresh # test small and large scalar t4, a4 = rand_tensors(Float32, dims) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t4 / scalar_small, copy(a4 ./ scalar_small)) < thresh - @test reldiff(t4 / scalar_large, copy(a4 ./ scalar_large)) < thresh + @test reldiff(t4 ./ scalar_small, copy(a4 ./ scalar_small)) < thresh + @test reldiff(t4 ./ scalar_large, copy(a4 ./ scalar_large)) < thresh t5, a5 = rand_tensors(Float64, dims) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t5 / scalar_small, copy(a5 ./ scalar_small)) < thresh - @test reldiff(t5 / scalar_large, copy(a5 ./ scalar_large)) < thresh + @test reldiff(t5 ./ scalar_small, copy(a5 ./ scalar_small)) < thresh + @test reldiff(t5 ./ scalar_large, copy(a5 ./ scalar_large)) < thresh t6, a6 = rand_tensors(Float16, dims) scalar_large = 1e4 - @test reldiff(t6 / scalar_large, copy(a6 ./ scalar_large)) < 1e-1 - - let x = mx.NDArray([1 2; 3 4]) - @test eltype(x) == Int - @test copy(x / 2) == [0 1; 1 2] - @test copy(x / 2.5) == [0 1; 1 2] - @test copy(x / 2.9) == [0 1; 1 2] - end + @test reldiff(t6 ./ scalar_large, copy(a6 ./ scalar_large)) < 1e-1 end From 57cc677c5403fee9f7244fae8b18e1e0d63f1e5d Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 9 Nov 2017 00:55:46 +0800 Subject: [PATCH 533/630] ndarray: elementwise power (#293) * ndarray: elementwise power ```julia x.^2 2.^x x.^y ``` * ndarray: elementwise power unfusion * Update NEWS --- NEWS.md | 6 ++++ src/ndarray.jl | 16 ++++++++- test/unittest/ndarray.jl | 72 ++++++++++++++++++++++++++++++++++++++++ 3 files changed, 93 insertions(+), 1 deletion(-) diff --git a/NEWS.md b/NEWS.md index a848a72c9b02..77ef0b766f16 100644 --- a/NEWS.md +++ b/NEWS.md @@ -26,6 +26,12 @@ 2.0 4.0 ``` +* Elementwise power of `NDArray`. 
(#293) + * `x.^2` + * `2.^x` + * `x.^y` + * where `x` and `y` are `NDArray`s. + ## API Changes * `reshape` of NDArray shares the same interface with Base (#272). diff --git a/src/ndarray.jl b/src/ndarray.jl index c3d80fb43914..d8b13e96cfe8 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -689,6 +689,21 @@ broadcast_(::typeof(/), x::NDArray, y::NDArrayOrReal) = broadcast_(::typeof(/), x::Real, y::NDArray) = rdiv_from!(x, copy(y, context(y))) +import Base: ^ + +""" + .^(x::NDArray, y::NDArray) + .^(x::NDArray, s::Real) + .^(s::Real, x::NDArray) + +Elementwise power of NDArray. +""" +^ + +broadcast_(::typeof(^), x::NDArray, y::NDArray) = _power(x, y) +broadcast_(::typeof(^), x::NDArray, s::Real) = _power_scalar(x, scalar=s) +broadcast_(::typeof(^), s::Real, x::NDArray) = _rpower_scalar(x, scalar=s) + """ fill!(x, arr::NDArray) @@ -713,7 +728,6 @@ end fill(x, dims::Integer...) = fill(x, dims) - """ Manipulating as Julia Arrays ---------------------------- diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index a15291f8b3fe..4552b79b6bcf 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -380,6 +380,77 @@ function test_clip() @test all(clip_down .<= copy(clipped) .<= clip_up) end +function test_power() + info("NDArray::power") + thresh = 1e8 + + info("NDArray::power::Int::x.^n") + let x = mx.NDArray([1 2; 3 4]) + @test eltype(x) == Int + @test copy(x.^-1) == [1 0; 0 0] + @test copy(x.^0) == [1 1; 1 1] + @test copy(x.^1) == [1 2; 3 4] + @test copy(x.^1.1) == [1 2; 3 4] + @test copy(x.^2) == [1 4; 9 16] + @test copy(x.^2.9) == [1 4; 9 16] + @test copy(x.^3) == [1 8; 27 64] + end + + info("NDArray::power::Int::n.^x") + let x = mx.NDArray([1 2; 3 4]) + @test eltype(x) == Int + @test copy(0.^x) == [0 0; 0 0] + @test copy(1.^x) == [1 1; 1 1] + @test copy(1.1.^x) == [1 1; 1 1] + @test copy(2.^x) == [2 4; 8 16] + @test copy(2.9.^x) == [2 4; 8 16] + @test copy(3.^x) == [3 9; 27 81] + end + + info("NDArray::power::Int::x.^y") + let x = 
mx.NDArray([1 2; 3 4]), y = mx.NDArray([2 2; 2 2]) + @test eltype(x) == Int + @test eltype(y) == Int + @test copy(x.^y) == [1 4; 9 16] + @test copy(y.^x) == [2 4; 8 16] + end + + info("NDArray::power::Float32::x.^n") + let x = mx.NDArray(Float32[1 2; 3 4]), A = Float32[1 2; 3 4] + @test eltype(x) == Float32 + @test copy(x.^0) == Float32[1 1; 1 1] + @test copy(x.^1) == Float32[1 2; 3 4] + @test copy(x.^2) == Float32[1 4; 9 16] + @test copy(x.^3) == Float32[1 8; 27 64] + + @test reldiff(copy(x.^-1), A.^-1) < thresh + @test reldiff(copy(x.^1.1), A.^1.1) < thresh + @test reldiff(copy(x.^2.9), A.^2.9) < thresh + end + + info("NDArray::power::Float32::n.^x") + let x = mx.NDArray(Float32[1 2; 3 4]), A = Float32[1 2; 3 4] + @test eltype(x) == Float32 + @test copy(0.^x) == Float32[0 0; 0 0] + @test copy(1.^x) == Float32[1 1; 1 1] + @test copy(2.^x) == Float32[2 4; 8 16] + @test copy(3.^x) == Float32[3 9; 27 81] + + @test reldiff(copy(1.1.^x), 1.1.^A) < thresh + @test reldiff(copy(2.9.^x), 2.9.^A) < thresh + end + + info("NDArray::power::Float32::x.^y") + let x = mx.NDArray(Float32[1 2; 3 4]), y = mx.NDArray(Float32[2 2; 2 2]) + @test eltype(x) == Float32 + @test eltype(y) == Float32 + @test copy(x.^y) == Float32[1 4; 9 16] + @test copy(y.^x) == Float32[2 4; 8 16] + end + + # TODO: Float64: wait for https://github.com/apache/incubator-mxnet/pull/8012 +end # function test_power + function test_sqrt() dims = rand_dims() info("NDArray::sqrt::dims = $dims") @@ -599,6 +670,7 @@ end test_gd() test_saveload() test_clip() + test_power() test_sqrt() test_eltype() test_nd_as_jl() From eea128af54b0eb82fef03bae139f5cc81af7b7af Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 9 Nov 2017 01:18:24 +0800 Subject: [PATCH 534/630] ndarray: fix `add` broadcasting and more tests (#308) --- src/ndarray.jl | 19 ++++++++++--------- test/unittest/ndarray.jl | 6 ++++++ 2 files changed, 16 insertions(+), 9 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index d8b13e96cfe8..56b8869b1758 
100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -541,11 +541,11 @@ macro inplace(stmt) end """ - add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) + add_to!(dst::NDArray, args::NDArrayOrReal...) Add a bunch of arguments into `dst`. Inplace updating. """ -function add_to!(dst :: NDArray, args :: Union{Real, NDArray}...) +function add_to!(dst::NDArray, args::NDArrayOrReal...) @assert dst.writable for arg in args if isa(arg, Real) @@ -567,17 +567,18 @@ Summation. Multiple arguments of either scalar or `NDArray` could be added together. Note at least the first or second argument needs to be an `NDArray` to avoid ambiguity of built-in summation. """ -+(x::NDArray, ys::NDArrayOrReal...) = add_to!(copy(x, context(x)), ys...) ++(x::NDArray, ys::NDArrayOrReal...) = add_to!(copy(x, context(x)), ys...) ++(x::Real, y::NDArray, zs::NDArrayOrReal...) = add_to!(copy(y, context(y)), x, zs...) broadcast_(::typeof(+), x::NDArray, y::NDArrayOrReal) = x + y broadcast_(::typeof(+), x::Real, y::NDArray) = x + y """ - sub_from!(dst :: NDArray, args :: Union{Real, NDArray}...) + sub_from!(dst::NDArray, args::NDArrayOrReal...) Subtract a bunch of arguments from `dst`. Inplace updating. """ -function sub_from!(dst :: NDArray, arg :: Union{Real, NDArray}) +function sub_from!(dst::NDArray, arg::NDArrayOrReal) @assert dst.writable if isa(arg, Real) _minus_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) @@ -604,12 +605,12 @@ broadcast_(::typeof(-), x::NDArray, y::NDArrayOrReal) = x - y broadcast_(::typeof(-), x::Real, y::NDArray) = x - y """ - mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) + mul_to!(dst::NDArray, arg::NDArrayOrReal) Elementwise multiplication into `dst` of either a scalar or an `NDArray` of the same shape. Inplace updating. 
""" -function mul_to!(dst :: NDArray, arg :: Union{Real, NDArray}) +function mul_to!(dst::NDArray, arg::NDArrayOrReal) @assert dst.writable if isa(arg, Real) _mul_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) @@ -644,11 +645,11 @@ function *(x::NDArray, y::NDArray) end """ - div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) + div_from!(dst::NDArray, arg::NDArrayOrReal) Elementwise divide a scalar or an `NDArray` of the same shape from `dst`. Inplace updating. """ -function div_from!(dst :: NDArray, arg :: Union{Real, NDArray}) +function div_from!(dst::NDArray, arg::NDArrayOrReal) @assert dst.writable if isa(arg, Real) _div_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 4552b79b6bcf..0b9c7cf6dd09 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -132,6 +132,12 @@ function test_plus() scalar_large = Float16(1e4) @test reldiff(t6 + scalar_small, copy(a6 .+ scalar_small)) < 1e-1 @test reldiff(t6 + scalar_large, copy(a6 .+ scalar_large)) < 1e-1 + + let x = mx.NDArray([1 2; 3 4]), y = mx.NDArray([1 1; 1 1]) + @test copy(42 .+ x) == [43 44; 45 46] + @test copy(x .+ 42) == [43 44; 45 46] + @test copy(0 .+ x .+ y .+ 41) == [43 44; 45 46] + end end function test_minus() From f839be1fecef0356cced6e6227c74bfbc69ff38e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 9 Nov 2017 01:22:30 +0800 Subject: [PATCH 535/630] Fix deprecations (#307) --- deps/build.jl | 6 +--- examples/char-lstm/lstm.jl | 6 ++-- examples/char-lstm/seq-data.jl | 2 +- plugins/io/svmlight.jl | 2 +- src/MXNet.jl | 4 +-- src/base.jl | 12 +++---- src/callback.jl | 12 +++---- src/compat.jl | 13 ++----- src/context.jl | 2 +- src/executor.jl | 2 +- src/initializer.jl | 10 +++--- src/io.jl | 26 +++++++------- src/kvstore.jl | 2 +- src/metric.jl | 28 +++++++-------- src/model.jl | 10 +++--- src/name.jl | 6 ++-- src/ndarray.jl | 62 +++++++++++++++++----------------- src/optimizer.jl | 22 ++++++------ 
src/optimizers/adadelta.jl | 4 +-- src/optimizers/adagrad.jl | 2 +- src/optimizers/adam.jl | 4 +-- src/optimizers/adamax.jl | 4 +-- src/optimizers/nadam.jl | 4 +-- src/optimizers/rmsprop.jl | 2 +- src/optimizers/sgd.jl | 2 +- src/random.jl | 4 +-- src/symbolic-node.jl | 8 ++--- test/unittest/bind.jl | 2 +- test/unittest/metric.jl | 8 ++--- test/unittest/ndarray.jl | 4 +-- 30 files changed, 128 insertions(+), 147 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index d6591c22c910..86d6a9839287 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -117,11 +117,7 @@ if !libmxnet_detected blas_path = Libdl.dlpath(Libdl.dlopen(Base.libblas_name)) - if VERSION >= v"0.5.0-dev+4338" - blas_vendor = Base.BLAS.vendor() - else - blas_vendor = Base.blas_vendor() - end + blas_vendor = Base.BLAS.vendor() ilp64 = "" if blas_vendor == :openblas64 diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index dcd1e6ddb60c..d930240ba1a2 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -2,14 +2,14 @@ using MXNet #--LSTMState -immutable LSTMState +struct LSTMState c :: mx.SymbolicNode h :: mx.SymbolicNode end #--/LSTMState #--LSTMParam -immutable LSTMParam +struct LSTMParam i2h_W :: mx.SymbolicNode h2h_W :: mx.SymbolicNode i2h_b :: mx.SymbolicNode @@ -116,7 +116,7 @@ end # Negative Log-likelihood -type NLL <: mx.AbstractEvalMetric +mutable struct NLL <: mx.AbstractEvalMetric nll_sum :: Float64 n_sample :: Int diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl index fb7c8378a5f1..0aac5609dac5 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -32,7 +32,7 @@ function build_vocabulary(corpus_fn::AbstractString, vocab_fn::AbstractString; m end #--CharSeqProvider -type CharSeqProvider <: mx.AbstractDataProvider +mutable struct CharSeqProvider <: mx.AbstractDataProvider text :: AbstractString batch_size :: Int seq_len :: Int diff --git a/plugins/io/svmlight.jl b/plugins/io/svmlight.jl index 
500c040394ee..46b79743b87f 100644 --- a/plugins/io/svmlight.jl +++ b/plugins/io/svmlight.jl @@ -5,7 +5,7 @@ datasets in this format could be found at http://www.csie.ntu.edu.tw/~cjlin/libs using MXNet using SVMLightLoader -type SVMLightProvider <: mx.AbstractDataProvider +mutable struct SVMLightProvider <: mx.AbstractDataProvider filename :: AbstractString batch_size :: Int fea_dim :: Int diff --git a/src/MXNet.jl b/src/MXNet.jl index a527eb6ec4c2..85991473d14c 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -11,9 +11,7 @@ using Compat import Compat.String import Compat.view -if VERSION >= v"0.6.0-dev.1024" - import Base.Iterators: filter -end +import Base.Iterators: filter using Formatting using MacroTools diff --git a/src/base.jl b/src/base.jl index b078793d75e1..5df0de509eec 100644 --- a/src/base.jl +++ b/src/base.jl @@ -1,5 +1,5 @@ "Exception thrown when an error occurred calling MXNet API." -immutable MXError <: Exception +struct MXError <: Exception msg :: AbstractString end @@ -91,7 +91,7 @@ end macro mx_define_handle_t(name, destructor) name = esc(name) quote - type $name + mutable struct $name value :: MX_handle function $name(value = C_NULL) @@ -161,7 +161,7 @@ dump_mx_param(val::Any) = string(val) dump_mx_param(val::Float64) = @sprintf("%.16e", val) dump_mx_param(val::Float32) = @sprintf("%.8e", val) dump_mx_param(val::Float16) = @sprintf("%.4e", val) -dump_mx_param{N, T<:Integer}(shape::NTuple{N, T}) = +dump_mx_param(shape::NTuple{N, T}) where {N, T<:Integer} = string(tuple(flipdim([shape...], 1)...)) @@ -203,7 +203,7 @@ end """Internal use only, this value is used to indicate a required value is not specified. 
""" -immutable __Undefined +struct __Undefined end function _defstruct_impl(is_immutable, name, fields) @@ -285,7 +285,7 @@ function _defstruct_impl(is_immutable, name, fields) if is_immutable quote - immutable $(name) <: $(super_name) + struct $(name) <: $(super_name) $type_body end @@ -293,7 +293,7 @@ function _defstruct_impl(is_immutable, name, fields) end else quote - type $(name) <: $(super_name) + mutable struct $(name) <: $(super_name) $type_body end diff --git a/src/callback.jl b/src/callback.jl index 780869daf9f0..289fdd066aa9 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -3,23 +3,23 @@ Abstract type of callback functions used in training. """ -@compat abstract type AbstractCallback end +abstract type AbstractCallback end """ AbstractBatchCallback Abstract type of callbacks to be called every mini-batch. """ -@compat abstract type AbstractBatchCallback <: AbstractCallback end +abstract type AbstractBatchCallback <: AbstractCallback end """ AbstractEpochCallback Abstract type of callbacks to be called every epoch. """ -@compat abstract type AbstractEpochCallback <: AbstractCallback end +abstract type AbstractEpochCallback <: AbstractCallback end -type BatchCallback <: AbstractBatchCallback +mutable struct BatchCallback <: AbstractBatchCallback frequency :: Int call_on_0 :: Bool callback :: Function @@ -86,7 +86,7 @@ function speedometer(;frequency::Int=50) end -type EpochCallback <: AbstractEpochCallback +mutable struct EpochCallback <: AbstractEpochCallback frequency :: Int call_on_0 :: Bool callback :: Function @@ -107,7 +107,7 @@ See also [`every_n_batch`](@ref). 
function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) EpochCallback(n, call_on_0, callback) end -function (cb :: EpochCallback){T<:Real}(model :: Any, state :: OptimizationState, metric :: Vector{Tuple{Base.Symbol, T}}) +function (cb :: EpochCallback)(model :: Any, state :: OptimizationState, metric :: Vector{Tuple{Base.Symbol, T}}) where T<:Real if state.curr_epoch == 0 if cb.call_on_0 cb.callback(model, state, metric) diff --git a/src/compat.jl b/src/compat.jl index 7357632174e5..257f1c2863ed 100644 --- a/src/compat.jl +++ b/src/compat.jl @@ -1,17 +1,12 @@ # this file contains code used for enabling backward compatibility with 0.5 # have to import base dotted operators if in 0.5 -if VERSION < v"0.6.0-dev" - import Base: .+, .-, .*, ./, .^ -end # this is for declaring broadcasted functions in 0.5 # TODO this macro should be removed when 0.5 support is dropped macro compatdot(fblock) - if VERSION ≥ v"0.6.0-dev" - return esc(fblock) - end + return esc(fblock) @capture(fblock, function Base.broadcast(::typeof(op_), args__) body_ end) @@ -24,9 +19,5 @@ macro compatdot(fblock) end macro compatmul(expr1, expr2) - if VERSION ≥ v"0.6.0-dev" - esc(:(broadcast(*, $expr1, $expr2))) - else - esc(:($expr1 .* $expr2)) - end + esc(:(broadcast(*, $expr1, $expr2))) end diff --git a/src/context.jl b/src/context.jl index 410a80ca8b4c..d627e7b5e7f7 100644 --- a/src/context.jl +++ b/src/context.jl @@ -5,7 +5,7 @@ A context describes the device type and id on which computation should be carried on. """ -immutable Context +struct Context device_type :: CONTEXT_TYPE device_id :: Int end diff --git a/src/executor.jl b/src/executor.jl index 8d10102f5c75..38f3925293c1 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -5,7 +5,7 @@ An executor is a realization of a symbolic architecture defined by a `SymbolicNo The actual forward and backward computation specified by the network architecture can be carried out with an executor. 
""" -type Executor +mutable struct Executor handle :: MX_ExecutorHandle symbol :: SymbolicNode arg_arrays :: Vector{NDArray} diff --git a/src/initializer.jl b/src/initializer.jl index 80e6026d1bf4..f741d3e5a279 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -15,9 +15,9 @@ Or, if full behavior customization is needed, override the following function init(self :: AbstractInitializer, name :: Base.Symbol, array :: NDArray) """ -@compat abstract type AbstractInitializer end +abstract type AbstractInitializer end -function init{T<:AbstractInitializer}(self :: T, name :: Base.Symbol, array :: NDArray) +function init(self :: T, name :: Base.Symbol, array :: NDArray) where T<:AbstractInitializer strname = string(name) if startswith(strname,"upsampling") _init_bilinear(self,name, array) @@ -94,7 +94,7 @@ end Initialize weights according to a uniform distribution within the provided scale. """ -immutable UniformInitializer <: AbstractInitializer +struct UniformInitializer <: AbstractInitializer scale :: AbstractFloat end """ @@ -113,7 +113,7 @@ end Initialize weights according to a univariate Gaussian distribution. """ -immutable NormalInitializer <: AbstractInitializer +struct NormalInitializer <: AbstractInitializer μ :: AbstractFloat σ :: AbstractFloat end @@ -150,7 +150,7 @@ used by various libraries. 
@enum XavierDistribution xv_uniform xv_normal @enum XavierRegularization xv_avg xv_in xv_out -immutable XavierInitializer <: AbstractInitializer +struct XavierInitializer <: AbstractInitializer distribution :: XavierDistribution regularization :: XavierRegularization magnitude :: Float64 diff --git a/src/io.jl b/src/io.jl index 242a9ad98d1a..2ba0bf78a584 100644 --- a/src/io.jl +++ b/src/io.jl @@ -15,7 +15,7 @@ Normally this involves defining: * `Base.done(provider, state) -> Bool` * `Base.next(provider, state) -> (AbstractDataBatch, AbstractDataProvider)` """ -@compat abstract type AbstractDataProvider end +abstract type AbstractDataProvider end """ get_batch_size(provider) -> Int @@ -53,7 +53,7 @@ function provide_label end Base type for data provider states. """ -@compat abstract type AbstractDataProviderState end +abstract type AbstractDataProviderState end """ AbstractDataBatch @@ -70,7 +70,7 @@ The following utility functions will be automatically defined: * [`load_data!`](@ref) * [`load_label!`](@ref) """ -@compat abstract type AbstractDataBatch end +abstract type AbstractDataBatch end """ count_samples(provider, batch) -> Int @@ -113,14 +113,14 @@ function get_label end A basic subclass of `AbstractDataBatch`, that implement the interface by accessing member fields. """ -type DataBatch <: AbstractDataBatch +mutable struct DataBatch <: AbstractDataBatch data :: Vector{NDArray} label :: Vector{NDArray} count :: Int end count_samples(batch :: DataBatch) = batch.count -get_data{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batch.data -get_label{Provider<:AbstractDataProvider}(::Provider, batch :: DataBatch) = batch.label +get_data(::Provider, batch :: DataBatch) where {Provider<:AbstractDataProvider} = batch.data +get_label(::Provider, batch :: DataBatch) where {Provider<:AbstractDataProvider} = batch.label """ SlicedNDArray @@ -252,7 +252,7 @@ Construct a data provider from `NDArray` or Julia Arrays. 
TODO: remove `data_padding` and `label_padding`, and implement rollover that copies the last or first several training samples to feed the padding. """ -type ArrayDataProvider <: AbstractDataProvider +mutable struct ArrayDataProvider <: AbstractDataProvider data_arrays :: Vector{Array} data_names :: Vector{Base.Symbol} label_arrays :: Vector{Array} @@ -277,7 +277,7 @@ function ArrayDataProvider(data::Any; batch_size::Int=0, shuffle::Bool=false, da ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle, data_padding=data_padding, label_padding=label_padding) end function ArrayDataProvider(data::Any, label::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) - asarr{T}(arr :: Array{T}) = convert(Array{MX_float}, arr) + asarr(arr :: Array{T}) where {T} = convert(Array{MX_float}, arr) asarr(arr :: NDArray) = copy(arr) if isa(data, Union{NDArray, Array}) && eltype(data) <: Real @@ -362,7 +362,7 @@ end get_batch_size(provider::ArrayDataProvider) = provider.batch_size -immutable ArrayDataProviderState <: AbstractDataProviderState +struct ArrayDataProviderState <: AbstractDataProviderState curr_idx :: Int end @@ -385,7 +385,7 @@ function Base.done(provider::ArrayDataProvider, state :: ArrayDataProviderState) return state.curr_idx > provider.sample_count end -immutable ArrayDataBatch <: AbstractDataBatch +struct ArrayDataBatch <: AbstractDataBatch idx :: UnitRange{Int} end function Base.next(provider :: ArrayDataProvider, state :: ArrayDataProviderState) @@ -423,7 +423,7 @@ end A data provider that wrap built-in data iterators from libmxnet. See below for a list of built-in data iterators. 
""" -type MXDataProvider <: AbstractDataProvider +mutable struct MXDataProvider <: AbstractDataProvider handle :: MX_DataIterHandle data_shape :: Vector{Tuple{Base.Symbol, Tuple}} label_shape:: Vector{Tuple{Base.Symbol, Tuple}} @@ -474,10 +474,10 @@ provide_data(provider::MXDataProvider) = provider.data_shape provide_label(provider::MXDataProvider) = provider.label_shape get_batch_size(provider::MXDataProvider) = provider.batch_size -type MXDataProviderState <: AbstractDataProviderState +mutable struct MXDataProviderState <: AbstractDataProviderState has_next :: Bool end -immutable MXDataBatch <: AbstractDataBatch +struct MXDataBatch <: AbstractDataBatch end function Base.eltype(provider :: MXDataProvider) diff --git a/src/kvstore.jl b/src/kvstore.jl index a1d835f8a6c2..1ac56260b401 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -1,4 +1,4 @@ -type KVStore +mutable struct KVStore handle :: MX_KVStoreHandle updater_c :: Ptr{Void} updater :: Function diff --git a/src/metric.jl b/src/metric.jl index b39309f6275c..db38060c933e 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -8,7 +8,7 @@ interfaces: * [`reset!`](@ref) * [`get`](@ref) """ -@compat abstract type AbstractEvalMetric end +abstract type AbstractEvalMetric end """ hasNDArraySupport(metric) -> Val{true/false} @@ -30,11 +30,11 @@ Update and accumulate metrics. * `labels::Vector{NDArray}`: the labels from the data provider. * `preds::Vector{NDArray}`: the outputs (predictions) of the network. 
""" -function update!{T <: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}) +function update!(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}) where T <: AbstractEvalMetric _update!(metric, labels, preds, hasNDArraySupport(metric)) end -function _update!{T<: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}, :: Val{true}) +function _update!(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}, :: Val{true}) where T<: AbstractEvalMetric if length(labels) != length(preds) Base.warn_once( "The number of labels ($(length(labels))) does not correspond to the\ @@ -45,7 +45,7 @@ function _update!{T<: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray} end end -function _update!{T<: AbstractEvalMetric}(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}, :: Val{false}) +function _update!(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}, :: Val{false}) where T<: AbstractEvalMetric if length(labels) != length(preds) Base.warn_once( "The number of labels ($(length(labels))) does not correspond to the\ @@ -88,7 +88,7 @@ end A metric that calculates nothing. Can be used to ignore an output during training. 
""" -type NullMetric <: mx.AbstractEvalMetric +mutable struct NullMetric <: mx.AbstractEvalMetric end function update!(metric :: NullMetric, labels :: Vector{NDArray}, preds :: Vector{NDArray}) @@ -114,7 +114,7 @@ To calculate both mean-squared error [`Accuracy`](@ref) and log-loss [`ACE`](@re mx.fit(..., eval_metric = mx.MultiMetric([mx.Accuracy(), mx.ACE()])) ``` """ -type MultiMetric <: mx.AbstractEvalMetric +mutable struct MultiMetric <: mx.AbstractEvalMetric metrics :: Vector{mx.AbstractEvalMetric} end @@ -146,7 +146,7 @@ and log-loss [`ACE`](@ref) for the second output: mx.fit(..., eval_metric = mx.SeqMetric([mx.Accuracy(), mx.ACE()])) ``` """ -type SeqMetric <: mx.AbstractEvalMetric +mutable struct SeqMetric <: mx.AbstractEvalMetric metrics :: Vector{mx.AbstractEvalMetric} end @@ -176,7 +176,7 @@ Multiclass classification accuracy. Calculates the mean accuracy per sample for softmax in one dimension. For a multi-dimensional softmax the mean accuracy over all dimensions is calculated. """ -type Accuracy <: AbstractEvalMetric +mutable struct Accuracy <: AbstractEvalMetric acc_sum :: Float64 n_sample :: Int @@ -235,7 +235,7 @@ Calculates the mean squared error regression loss. Requires that label and prediction have the same shape. """ -type MSE <: AbstractEvalMetric +mutable struct MSE <: AbstractEvalMetric mse_sum :: Vector{NDArray} n_sample :: Int @@ -310,7 +310,7 @@ For more discussion about normalized MSE, please see [#211](https://github.com/dmlc/MXNet.jl/pull/211) also. """ -type NMSE <: AbstractEvalMetric +mutable struct NMSE <: AbstractEvalMetric nmse_sum :: Float64 n_sample :: Int @@ -349,7 +349,7 @@ Calculates the averaged cross-entropy (logloss) for classification. # Arguments: * `eps::Float64`: Prevents returning `Inf` if `p = 0`. 
""" -type ACE <: AbstractEvalMetric +mutable struct ACE <: AbstractEvalMetric ace_sum :: Float64 n_sample :: Int eps :: Float64 @@ -368,7 +368,7 @@ end hasNDArraySupport(::ACE) = Val{false}() -function _update_single_output{T}(metric :: ACE, label :: Array{T}, pred :: Array{T}) +function _update_single_output(metric :: ACE, label :: Array{T}, pred :: Array{T}) where T eps = convert(T, metric.eps) # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) @@ -411,7 +411,7 @@ end Calculates the averaged cross-entropy per class and overall (see [`ACE`](@ref)). This can be used to quantify the influence of different classes on the overall loss. """ -type MultiACE <: AbstractEvalMetric +mutable struct MultiACE <: AbstractEvalMetric aces :: Vector{Float64} counts :: Vector{Int} eps :: Float64 @@ -432,7 +432,7 @@ end hasNDArraySupport(::MultiACE) = Val{false}() -function _update_single_output{T}(metric :: MultiACE, label :: Array{T}, pred :: Array{T}) +function _update_single_output(metric :: MultiACE, label :: Array{T}, pred :: Array{T}) where T eps = convert(T, metric.eps) # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) diff --git a/src/model.jl b/src/model.jl index a592b500e9cb..df15e4cace0a 100644 --- a/src/model.jl +++ b/src/model.jl @@ -3,7 +3,7 @@ The abstract super type of all models in MXNet.jl. """ -@compat abstract type AbstractModel end +abstract type AbstractModel end """ FeedForward @@ -14,7 +14,7 @@ explicitly handling of *time index*, but it is relatively easy to implement unrolled RNN / LSTM under this framework (*TODO*: add example). For models that handles sequential data explicitly, please use *TODO*... 
""" -type FeedForward <: AbstractModel +mutable struct FeedForward <: AbstractModel arch :: SymbolicNode ctx :: Vector{Context} @@ -292,9 +292,9 @@ end verbosity :: Int = 3 ) -function _invoke_callbacks{T<:Real}(self::FeedForward, callbacks::Vector{AbstractCallback}, - state::OptimizationState, type_filter::Type; - metric::Vector{Tuple{Base.Symbol, T}} = Vector{Tuple{Base.Symbol, Real}}()) +function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, + state::OptimizationState, type_filter::Type; + metric::Vector{Tuple{Base.Symbol, T}} = Vector{Tuple{Base.Symbol, Real}}()) where T<:Real map(callbacks) do cb if isa(cb, type_filter) if type_filter == AbstractEpochCallback diff --git a/src/name.jl b/src/name.jl index 8ba0f707ff1a..d281770eb357 100644 --- a/src/name.jl +++ b/src/name.jl @@ -1,4 +1,4 @@ -@compat abstract type AbstractNameManager end +abstract type AbstractNameManager end const NameType = Union{Base.Symbol, AbstractString} const NameCounter = Dict{Base.Symbol, Int} @@ -21,7 +21,7 @@ function _default_get_name!(counter :: NameCounter, name :: NameType, hint :: Na return name end -type BasicNameManager <: AbstractNameManager +mutable struct BasicNameManager <: AbstractNameManager counter :: NameCounter end BasicNameManager() = BasicNameManager(NameCounter()) @@ -30,7 +30,7 @@ function get!(manager :: BasicNameManager, name :: NameType, hint :: NameType) _default_get_name!(manager.counter, name, hint) end -type PrefixNameManager <: AbstractNameManager +mutable struct PrefixNameManager <: AbstractNameManager prefix :: Base.Symbol counter :: NameCounter end diff --git a/src/ndarray.jl b/src/ndarray.jl index 56b8869b1758..3e7625e3fdf6 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -3,7 +3,7 @@ const DType = Union{Float32, Float64, Float16, UInt8, Int32, Int8, Int64} @enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 kInt8 kInt64 const DEFAULT_DTYPE = Float32 # MSHADOW_DEFAULT_DTYPE -function toTypeFlag{T <: DType}(:: Type{T}) 
+function toTypeFlag(:: Type{T}) where T <: DType if T == Float32 return kFloat32 elseif T == Float64 @@ -44,7 +44,7 @@ function fromTypeFlag(T :: TypeFlag) end # create a NDArray handle of specific shape -function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) +function _ndarray_alloc(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) where N h_ref = Ref{MX_handle}(0) shape = flipdim(MX_uint[shape...],1) @mxcall(:MXNDArrayCreate, (Ptr{MX_uint}, MX_uint, Cint, Cint, Cint, Ref{MX_handle}), @@ -54,7 +54,7 @@ function _ndarray_alloc{N}(shape :: NTuple{N, Int}, ctx :: Context, delay_alloc end # create a NDArray handle of specific shape type -function _ndarray_alloc{T <: DType,N}(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) +function _ndarray_alloc(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context, delay_alloc :: Bool) where {T <: DType,N} h_ref = Ref{MX_handle}(0) shape = flipdim(MX_uint[shape...],1) dtype = toTypeFlag(T) @@ -89,7 +89,7 @@ of tensor-based computation. C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory have shape (28,28,1,100). """ -type NDArray +mutable struct NDArray handle :: MX_NDArrayHandle writable :: Bool @@ -107,7 +107,7 @@ function Base.show(io :: IO, arr :: NDArray) Base.showarray(io, try_get_shared(arr, sync=:read), false, header=false) end -function NDArray{T<:Real}(data :: Array{T}) +function NDArray(data :: Array{T}) where T<:Real copy(data, cpu()) end @@ -141,13 +141,13 @@ end Allocate memory for an uninitialized `NDArray` with a specified type. 
""" -function empty{N,T<:DType}(::Type{T}, shape :: NTuple{N, Int}) +function empty(::Type{T}, shape :: NTuple{N, Int}) where {N,T<:DType} empty(T, shape, cpu()) end -function empty{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) +function empty(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) where {N,T<:DType} NDArray(_ndarray_alloc(T, shape, ctx, false)) end -function empty{T<:DType}(:: Type{T}, shape :: Int...) +function empty(:: Type{T}, shape :: Int...) where T<:DType empty(T, shape) end @@ -158,10 +158,10 @@ end Allocate memory for an uninitialized `NDArray` with specific shape of type Float32. """ -function empty{N}(shape :: NTuple{N, Int}) +function empty(shape :: NTuple{N, Int}) where N empty(shape, cpu()) end -function empty{N}(shape :: NTuple{N, Int}, ctx :: Context) +function empty(shape :: NTuple{N, Int}, ctx :: Context) where N NDArray(_ndarray_alloc(shape, ctx, false)) end function empty(shape :: Int...) @@ -186,15 +186,15 @@ end Create zero-ed `NDArray` with specific shape and type """ -function zeros{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}) +function zeros(:: Type{T}, shape :: NTuple{N, Int}) where {N,T<:DType} zeros(T, shape, cpu()) end -function zeros{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) +function zeros(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) where {N,T<:DType} arr = empty(T, shape, ctx) arr[:] = zero(T) return arr end -function zeros{T<:DType}(:: Type{T}, shape :: Int...) +function zeros(:: Type{T}, shape :: Int...) where T<:DType zeros(T, shape) end @@ -205,10 +205,10 @@ end Create zero-ed `NDArray` with specific shape. 
""" -function zeros{N}(shape :: NTuple{N, Int}) +function zeros(shape :: NTuple{N, Int}) where N zeros(shape, cpu()) end -function zeros{N}(shape :: NTuple{N, Int}, ctx :: Context) +function zeros(shape :: NTuple{N, Int}, ctx :: Context) where N arr = empty(shape, ctx) arr[:] = 0 return arr @@ -224,15 +224,15 @@ end Create an `NDArray` with specific shape & type, and initialize with 1. """ -function ones{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}) +function ones(:: Type{T}, shape :: NTuple{N, Int}) where {N,T<:DType} ones(T, shape, cpu()) end -function ones{N,T<:DType}(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) +function ones(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) where {N,T<:DType} arr = empty(T, shape, ctx) arr[:] = one(T) return arr end -function ones{T<:DType}(:: Type{T}, shape :: Int...) +function ones(:: Type{T}, shape :: Int...) where T<:DType ones(T, shape) end @@ -243,10 +243,10 @@ end Create an `NDArray` with specific shape and initialize with 1. """ -function ones{N}(shape :: NTuple{N, Int}) +function ones(shape :: NTuple{N, Int}) where N ones(shape, cpu()) end -function ones{N}(shape :: NTuple{N, Int}, ctx :: Context) +function ones(shape :: NTuple{N, Int}, ctx :: Context) where N arr = empty(shape, ctx) arr[:] = 1 return arr @@ -298,7 +298,7 @@ end Get the element type of an `NDArray`. 
""" -function eltype{T <: Union{NDArray, MX_NDArrayHandle}}(arr :: T) +function eltype(arr :: T) where T <: Union{NDArray, MX_NDArrayHandle} dtype_ref = Ref{Cint}(0) @mxcall(:MXNDArrayGetDType, (MX_handle, Ptr{Cint}), arr, dtype_ref) @@ -359,13 +359,13 @@ function setindex!(arr :: NDArray, val :: Real, ::Colon) _set_value(out=arr, src=convert(eltype(arr), val)) return arr end -function setindex!{T<:Real}(arr :: NDArray, val :: Array{T}, ::Colon) +function setindex!(arr :: NDArray, val :: Array{T}, ::Colon) where T<:Real copy!(arr, val) end function setindex!(arr :: NDArray, val :: NDArray, ::Colon) copy!(arr, val) end -function setindex!{T<:Real}(arr :: NDArray, val :: Union{T,Array{T},NDArray}, idx::UnitRange{Int}) +function setindex!(arr :: NDArray, val :: Union{T,Array{T},NDArray}, idx::UnitRange{Int}) where T<:Real setindex!(slice(arr, idx), val, Colon()) end @@ -426,18 +426,18 @@ function copy!(dst :: NDArray, src :: NDArray) return dst end -function copy!{T<:DType}(dst :: Array{T}, src :: NDArray) +function copy!(dst :: Array{T}, src :: NDArray) where T<:DType @assert T == eltype(src) @assert size(dst) == size(src) @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{Void}, Csize_t), src, pointer(dst), length(dst)) return dst end -function copy!{T<:Real}(dst :: Array{T}, src :: NDArray) +function copy!(dst :: Array{T}, src :: NDArray) where T<:Real copy!(dst, copy(src)) end -function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) +function copy!(dst :: NDArray, src :: Array{T}) where T<:Real @assert dst.writable @assert size(dst) == size(src) src = convert(Array{eltype(dst)}, src) # this might involve copying @@ -446,7 +446,7 @@ function copy!{T<:Real}(dst :: NDArray, src :: Array{T}) return dst end -function copy_ignore_shape!{T<:Real}(dst :: NDArray, src :: Array{T}) +function copy_ignore_shape!(dst :: NDArray, src :: Array{T}) where T<:Real @assert dst.writable @assert length(dst) == length(src) src = convert(Array{eltype(dst)}, src) # this might involve 
copying @@ -477,7 +477,7 @@ function copy(arr :: NDArray, ctx :: Context) end # Create copy: Julia Array -> NDArray in a given context -function copy{T<:DType}(arr :: Array{T}, ctx :: Context) +function copy(arr :: Array{T}, ctx :: Context) where T<:DType dst = empty(T, size(arr), ctx) copy!(dst, arr) end @@ -487,7 +487,7 @@ end Convert an `NDArray` into a Julia `Array` of specific type. Data will be copied. """ -function convert{T<:Real}(t::Type{Array{T}}, arr :: NDArray) +function convert(t::Type{Array{T}}, arr :: NDArray) where T<:Real convert(t, copy(arr)) end @@ -721,7 +721,7 @@ end Create an `NDArray` filled with the value `x`, like `Base.fill`. """ -function fill{N}(x, dims::NTuple{N, Integer}, ctx::Context=cpu()) +function fill(x, dims::NTuple{N, Integer}, ctx::Context=cpu()) where N arr = empty(typeof(x), dims, ctx) arr[:] = x arr @@ -903,7 +903,7 @@ Test whether `j_arr` is sharing data with `arr`. """ is_shared(j_arr :: Array, arr :: NDArray) = false -function is_shared{T<:DType}(j_arr :: Array{T}, arr :: NDArray) +function is_shared(j_arr :: Array{T}, arr :: NDArray) where T<:DType if length(j_arr) != length(arr) return false end diff --git a/src/optimizer.jl b/src/optimizer.jl index 11508bf22035..89df56ba7050 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -3,21 +3,21 @@ Base type for all optimizers. """ -@compat abstract type AbstractOptimizer end +abstract type AbstractOptimizer end """ AbstractLearningRateScheduler Base type for all learning rate scheduler. """ -@compat abstract type AbstractLearningRateScheduler end +abstract type AbstractLearningRateScheduler end """ AbstractMomentumScheduler Base type for all momentum scheduler. """ -@compat abstract type AbstractMomentumScheduler end +abstract type AbstractMomentumScheduler end @@ -39,7 +39,7 @@ Base type for all momentum scheduler. but unlike the mini-batch count, the iteration count does **not** reset in each epoch. So it track the *total* number of mini-batches seen so far. 
""" -type OptimizationState +mutable struct OptimizationState batch_size :: Int curr_epoch :: Int curr_batch :: Int @@ -70,7 +70,7 @@ import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate Fixed learning rate scheduler always return the same learning rate. """ -type Fixed <: AbstractLearningRateScheduler +mutable struct Fixed <: AbstractLearningRateScheduler learning_rate :: Float64 end get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rate @@ -81,7 +81,7 @@ get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rat ``\eta_t = \eta_0\gamma^t``. Here ``t`` is the epoch count, or the iteration count if `decay_on_iteration` is set to true. """ -type Exp <: AbstractLearningRateScheduler +mutable struct Exp <: AbstractLearningRateScheduler learning_rate :: Float64 gamma :: Float64 on_iteration :: Bool @@ -99,7 +99,7 @@ get_learning_rate(self :: Exp, state :: OptimizationState) = Here ``t`` is the epoch count, or the iteration count if `decay_on_iteration` is set to true. """ -type Inv <: AbstractLearningRateScheduler +mutable struct Inv <: AbstractLearningRateScheduler learning_rate :: Float64 gamma :: Float64 power :: Float64 @@ -147,7 +147,7 @@ import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum The null momentum scheduler always returns 0 for momentum. It is also used to explicitly indicate momentum should not be used. """ -immutable Null <: AbstractMomentumScheduler +struct Null <: AbstractMomentumScheduler end get_momentum(self :: Null, state :: OptimizationState) = 0.0 @@ -156,7 +156,7 @@ get_momentum(self :: Null, state :: OptimizationState) = 0.0 Fixed momentum scheduler always returns the same value. 
""" -type Fixed <: AbstractMomentumScheduler +mutable struct Fixed <: AbstractMomentumScheduler momentum :: Float64 end get_momentum(self :: Fixed, state :: OptimizationState) = self.momentum @@ -178,7 +178,7 @@ Here * ``\alpha``: default `0.96` * ``\mu_0``: default `0.99` """ -type NadamScheduler <: AbstractMomentumScheduler +mutable struct NadamScheduler <: AbstractMomentumScheduler mu0 :: Float64 delta :: Float64 gamma :: Float64 @@ -242,7 +242,7 @@ end Base class for all optimizer options. """ -@compat abstract type AbstractOptimizerOptions end +abstract type AbstractOptimizerOptions end """ normalized_gradient(opts, state, weight, grad) diff --git a/src/optimizers/adadelta.jl b/src/optimizers/adadelta.jl index aec81445fbb2..f15ff93c7beb 100644 --- a/src/optimizers/adadelta.jl +++ b/src/optimizers/adadelta.jl @@ -49,7 +49,7 @@ s_t &= \rho s_{t-1} + (1-\rho)*(\eta_t*g)^2`` ADADELTA: An Adaptive Learning Rate Method. arXiv Preprint arXiv:1212.5701. """ -type AdaDelta <: AbstractOptimizer +mutable struct AdaDelta <: AbstractOptimizer opts :: AdaDeltaOptions state :: OptimizationState @@ -61,7 +61,7 @@ type AdaDelta <: AbstractOptimizer end end -type AdaDeltaState +mutable struct AdaDeltaState acc :: NDArray delta_acc :: NDArray end diff --git a/src/optimizers/adagrad.jl b/src/optimizers/adagrad.jl index 2df3c07efd44..d12ca43d15b2 100644 --- a/src/optimizers/adagrad.jl +++ b/src/optimizers/adagrad.jl @@ -40,7 +40,7 @@ Epsilon is not included in the typical formula, see [2]. (http://www.ark.cs.cmu.edu/cdyer/adagrad.pdf) """ -type AdaGrad <: AbstractOptimizer +mutable struct AdaGrad <: AbstractOptimizer opts :: AdaGradOptions state :: OptimizationState diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index a6b5c69eefc3..b8a6e9d385c0 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -28,7 +28,7 @@ Stochastic Optimization*. arXiv:1412.6980 [cs.LG]. 
* `weight_decay::Real`: default `0.00001`, weight decay is equivalent to adding a global l2 regularizer for all the parameters. """ -type ADAM <: AbstractOptimizer +mutable struct ADAM <: AbstractOptimizer opts :: ADAMOptions state :: OptimizationState @@ -40,7 +40,7 @@ type ADAM <: AbstractOptimizer end end -type ADAMState +mutable struct ADAMState current_lr :: Float64 # current learning rate mt :: NDArray vt :: NDArray diff --git a/src/optimizers/adamax.jl b/src/optimizers/adamax.jl index 838264360e1b..adcdb78bf255 100644 --- a/src/optimizers/adamax.jl +++ b/src/optimizers/adamax.jl @@ -37,7 +37,7 @@ See [1] for further description. (http://arxiv.org/abs/1412.6980v8). """ -type AdaMax <: AbstractOptimizer +mutable struct AdaMax <: AbstractOptimizer opts :: AdaMaxOptions state :: OptimizationState @@ -49,7 +49,7 @@ type AdaMax <: AbstractOptimizer end end -type AdaMaxState +mutable struct AdaMaxState mt :: NDArray ut :: NDArray beta1Power :: Float64 diff --git a/src/optimizers/nadam.jl b/src/optimizers/nadam.jl index b90b7a106984..3b39c0aaefbe 100644 --- a/src/optimizers/nadam.jl +++ b/src/optimizers/nadam.jl @@ -47,7 +47,7 @@ at their default values. 
[http://www.cs.toronto.edu/~fritz/absps/momentum.pdf] (http://www.cs.toronto.edu/~fritz/absps/momentum.pdf) """ -type Nadam <: AbstractOptimizer +mutable struct Nadam <: AbstractOptimizer opts :: NadamOptions state :: OptimizationState @@ -61,7 +61,7 @@ type Nadam <: AbstractOptimizer end end -type NadamState +mutable struct NadamState mt :: NDArray nt :: NDArray momentum :: Float64 diff --git a/src/optimizers/rmsprop.jl b/src/optimizers/rmsprop.jl index 0c6c2d45a753..274e510f6cfe 100644 --- a/src/optimizers/rmsprop.jl +++ b/src/optimizers/rmsprop.jl @@ -43,7 +43,7 @@ learning rate ``\eta_t`` is calculated as: (http://www.youtube.com/watch?v=O3sxAc4hxZU) (formula @5:20) """ -type RMSProp <: AbstractOptimizer +mutable struct RMSProp <: AbstractOptimizer opts :: RMSPropOptions state :: OptimizationState diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index cd0b998fbed0..6e8ab34f1409 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -28,7 +28,7 @@ Stochastic gradient descent optimizer. * `weight_decay::Real`: default `0.0001`, weight decay is equivalent to adding a global l2 regularizer to the parameters. """ -type SGD <: AbstractOptimizer +mutable struct SGD <: AbstractOptimizer opts :: SGDOptions state :: OptimizationState diff --git a/src/random.jl b/src/random.jl index 2d594014da1c..3c5f1dcb564b 100644 --- a/src/random.jl +++ b/src/random.jl @@ -34,7 +34,7 @@ julia> mx.rand(0, 1, (2, 2)) |> copy 0.281153 0.713927 ``` """ -function rand{N}(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context=cpu()) +function rand(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context=cpu()) where N out = empty(shape, ctx) rand!(low, high, out) end @@ -53,7 +53,7 @@ end Draw random samples from a normal (Gaussian) distribution. 
""" -function randn{N}(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context=cpu()) +function randn(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context=cpu()) where N out = empty(shape, ctx) randn!(mean, stdvar, out) end diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 9312ea5dd7c5..80daae1f53de 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -9,7 +9,7 @@ SymbolicNode is the basic building block of the symbolic graph in MXNet.jl. Make a new node by composing `self` with `args`. Or the arguments can be specified using keyword arguments. """ -type SymbolicNode +mutable struct SymbolicNode handle :: MX_SymbolHandle end function Base.unsafe_convert(::Type{MX_handle}, obj::SymbolicNode) @@ -723,13 +723,13 @@ from right to left. output shape would be (40,5) - with `reverse=true`, output shape will be (50,4). """ -reshape{N}(sym::SymbolicNode, dim::NTuple{N, Integer}; kwargs...) = +reshape(sym::SymbolicNode, dim::NTuple{N, Integer}; kwargs...) where {N} = _reshape(sym, dim; kwargs...) reshape(sym::SymbolicNode, dim::Integer...; kwargs...) = _reshape(sym, dim; kwargs...) 
-@inline function _reshape{N}(sym::SymbolicNode, dim::NTuple{N, Integer}; - reverse::Bool=false, name::String="") +@inline function _reshape(sym::SymbolicNode, dim::NTuple{N, Integer}; + reverse::Bool=false, name::String="") where N op = _get_cached_libmx_op_handle("reshape") node = _create_atomic_symbol(op.value, ["shape", "reverse"], [dump_mx_param(dim), dump_mx_param(!reverse)]) diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index 0e32446b9e0f..77be97745926 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -7,7 +7,7 @@ using ..Main: rand_dims, reldiff ################################################################################ # Test Implementations ################################################################################ -function test_arithmetic{T <: mx.DType}(::Type{T}, uf, gf) +function test_arithmetic(::Type{T}, uf, gf) where T <: mx.DType shape = rand_dims() info("Bind::arithmetic::$T::$uf::dims = $shape") diff --git a/test/unittest/metric.jl b/test/unittest/metric.jl index 5b5632a87c76..ca51f83671d9 100644 --- a/test/unittest/metric.jl +++ b/test/unittest/metric.jl @@ -26,7 +26,7 @@ function generate_probs(n, m) end -function loglikelihood{T <: AbstractFloat}(labels::Vector{T}, probs::Array{T, 2}) +function loglikelihood(labels::Vector{T}, probs::Array{T, 2}) where T <: AbstractFloat LL = 0.0 eps = convert(T, 1.0e-8) for i = 1:size(labels, 1) @@ -50,11 +50,7 @@ function test_ace() metric = mx.ACE() # For categorical variables, ACE == -LL mx._update_single_output(metric, labels, probs) LL_v2 = metric.ace_sum / metric.n_sample - @static if VERSION >= v"0.6.0-dev.2075" - @test LL ≈ LL_v2 atol=1e-12 - else - @test_approx_eq_eps LL LL_v2 1e-12 - end + @test LL ≈ LL_v2 atol=1e-12 end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 0b9c7cf6dd09..2299e04836bd 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -7,8 +7,8 @@ using ..Main: rand_dims, reldiff 
################################################################################ # Test Implementations ################################################################################ -rand_tensors{N}(dims::NTuple{N, Int}) = rand_tensors(mx.MX_float, dims) -function rand_tensors{N, T}(::Type{T}, dims::NTuple{N, Int}) +rand_tensors(dims::NTuple{N, Int}) where {N} = rand_tensors(mx.MX_float, dims) +function rand_tensors(::Type{T}, dims::NTuple{N, Int}) where {N, T} tensor = rand(T, dims) array = copy(tensor, mx.cpu()) return (tensor, array) From 4919273ed2e4ed8704b0e5c1d70aa26c86d69d37 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 9 Nov 2017 23:01:41 +0800 Subject: [PATCH 536/630] ndarray: getindex/setindex! linear indexing (#294) * ndarray: getindex/setindex! linear indexing ```julia x = mx.zeros(2, 5) x[5] = 42 ``` * ndarray: implement first --- NEWS.md | 19 ++++++++++ src/ndarray.jl | 77 ++++++++++++++++++++++++++++++++-------- test/unittest/ndarray.jl | 64 +++++++++++++++++++++++++++++++++ 3 files changed, 146 insertions(+), 14 deletions(-) diff --git a/NEWS.md b/NEWS.md index 77ef0b766f16..fc998538f580 100644 --- a/NEWS.md +++ b/NEWS.md @@ -26,6 +26,25 @@ 2.0 4.0 ``` +* `NDArray` `getindex`/`setindex!` linear indexing support and `first` for extracting scalar value. (#TBD) + + ```julia + julia> x = mx.zeros(2, 5) + + julia> x[5] = 42 # do synchronization and set the value + ``` + + ```julia + julia> y = x[5] # actually, getindex won't do synchronization, but REPL's showing did it for you + 1 mx.NDArray{Float32} @ CPU0: + 42.0 + + julia> first(y) # do sync and get the value + 42.0f0 + + julia> y[] # this is available, also + 42.0f0 + ``` * Elementwise power of `NDArray`. 
(#293) * `x.^2` * `2.^x` diff --git a/src/ndarray.jl b/src/ndarray.jl index 3e7625e3fdf6..fb495af34ff1 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -312,6 +312,9 @@ function eltype(arr :: T) where T <: Union{NDArray, MX_NDArrayHandle} end end +@inline _first(arr::NDArray) = try_get_shared(arr, sync = :read) |> first + +Base.first(arr::NDArray) = _first(arr) """ slice(arr :: NDArray, start:stop) @@ -341,37 +344,58 @@ function slice(arr :: NDArray, slice::UnitRange{Int}) return NDArray(MX_NDArrayHandle(hdr_ref[]), arr.writable) end +function _at(handle::Union{MX_NDArrayHandle, MX_handle}, idx::Integer) + h_ref = Ref{MX_handle}(C_NULL) + @mxcall(:MXNDArrayAt, (MX_handle, MX_uint, Ref{MX_handle}), + handle, idx, h_ref) + h_ref[] +end + import Base: setindex! """ - setindex!(arr :: NDArray, val, idx) + setindex!(arr::NDArray, val, idx) -Assign values to an `NDArray`. Elementwise assignment is not implemented, only the following -scenarios are supported +Assign values to an `NDArray`. +The following scenarios are supported + +* single value assignment via linear indexing: `arr[42] = 24` * `arr[:] = val`: whole array assignment, `val` could be a scalar or an array (Julia `Array` or `NDArray`) of the same shape. * `arr[start:stop] = val`: assignment to a *slice*, `val` could be a scalar or an array of the same shape to the slice. See also [`slice`](@ref). 
""" -function setindex!(arr :: NDArray, val :: Real, ::Colon) - @assert(arr.writable) +function setindex!(arr::NDArray, val::Real, idx::Integer) + # linear indexing + @assert arr.writable + _set_value(out=arr[idx], src=val) +end + +function setindex!(arr::NDArray, val::Real, ::Colon) + @assert arr.writable _set_value(out=arr, src=convert(eltype(arr), val)) - return arr end -function setindex!(arr :: NDArray, val :: Array{T}, ::Colon) where T<:Real + +function setindex!(arr::NDArray, val::Array{T}, ::Colon) where T<:Real + @assert arr.writable copy!(arr, val) end -function setindex!(arr :: NDArray, val :: NDArray, ::Colon) + +function setindex!(arr::NDArray, val::NDArray, ::Colon) + @assert arr.writable copy!(arr, val) end -function setindex!(arr :: NDArray, val :: Union{T,Array{T},NDArray}, idx::UnitRange{Int}) where T<:Real + +function setindex!(arr::NDArray, val::Union{T,Array{T},NDArray}, + idx::UnitRange{Int}) where T<:Real + @assert arr.writable setindex!(slice(arr, idx), val, Colon()) end import Base: getindex """ - getindex(arr :: NDArray, idx) + getindex(arr::NDArray, idx) Shortcut for [`slice`](@ref). A typical use is to write @@ -396,18 +420,43 @@ which furthur translates into create a **copy** of the sub-array for Julia `Array`, while for `NDArray`, this is a *slice* that shares the memory. """ -function getindex(arr :: NDArray, ::Colon) +function getindex(arr::NDArray, ::Colon) return arr end """ -Shortcut for [`slice`](@ref). **NOTE** the behavior for Julia's built-in index slicing is to create a -copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. +Shortcut for [`slice`](@ref). +**NOTE** the behavior for Julia's built-in index slicing is to create a +copy of the sub-array, while here we simply call `slice`, +which shares the underlying memory. 
""" -function getindex(arr :: NDArray, idx::UnitRange{Int}) +function getindex(arr::NDArray, idx::UnitRange{Int}) slice(arr, idx) end +getindex(arr::NDArray) = _first(arr) + +function getindex(arr::NDArray, idx::Integer) + # linear indexing + len = length(arr) + size_ = size(arr) + + if idx <= 0 || idx > len + throw(BoundsError( + "attempt to access $(join(size_, 'x')) NDArray at index $(idx)")) + end + + idx -= 1 + offsets = size_[1:end-1] |> reverse ∘ cumprod ∘ collect + handle = arr.handle + for offset ∈ offsets + handle = _at(handle, idx ÷ offset) + idx %= offset + end + + _at(handle, idx) |> MX_NDArrayHandle |> x -> NDArray(x, arr.writable) +end + import Base: copy!, copy, convert, deepcopy """ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 2299e04836bd..ac9090e3ca33 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -85,6 +85,68 @@ function test_slice() @test copy(mx.slice(array, 2:3)) == [1 1; 1 1] end +function test_linear_idx() + info("NDArray::getindex::linear indexing") + let A = reshape(collect(1:30), 3, 10) + x = mx.NDArray(A) + + @test copy(x) == A + @test copy(x[1]) == [1] + @test copy(x[2]) == [2] + @test copy(x[3]) == [3] + @test copy(x[12]) == [12] + @test copy(x[13]) == [13] + @test copy(x[14]) == [14] + + @test_throws BoundsError x[-1] + @test_throws BoundsError x[0] + @test_throws BoundsError x[31] + @test_throws BoundsError x[42] + end + + let A = reshape(collect(1:24), 3, 2, 4) + x = mx.NDArray(A) + + @test copy(x) == A + @test copy(x[1]) == [1] + @test copy(x[2]) == [2] + @test copy(x[3]) == [3] + @test copy(x[11]) == [11] + @test copy(x[12]) == [12] + @test copy(x[13]) == [13] + @test copy(x[14]) == [14] + end + + info("NDArray::setindex!::linear indexing") + let A = reshape(collect(1:24), 3, 2, 4) + x = mx.NDArray(A) + + @test copy(x) == A + + x[4] = -4 + @test copy(x[4]) == [-4] + + x[11] = -11 + @test copy(x[11]) == [-11] + + x[24] = 42 + @test copy(x[24]) == [42] + end +end # function 
test_linear_idx + +function test_first() + info("NDArray::first") + let A = reshape(collect(1:30), 3, 10) + x = mx.NDArray(A) + + @test x[] == 1 + @test x[5][] == 5 + + @test first(x) == 1 + @test first(x[5]) == 5 + end +end # function test_first + function test_plus() dims = rand_dims() t1, a1 = rand_tensors(dims) @@ -668,6 +730,8 @@ end test_assign() test_copy() test_slice() + test_linear_idx() + test_first() test_plus() test_minus() test_mul() From 1fc03f2721f7407f5375f12cb97bcfe79a337543 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 9 Nov 2017 23:03:31 +0800 Subject: [PATCH 537/630] ndarray: elementwise power for irrational (#310) --- NEWS.md | 5 +++++ src/base.jl | 11 ++++++----- src/ndarray.jl | 4 ++++ test/unittest/ndarray.jl | 16 ++++++++++++++++ 4 files changed, 31 insertions(+), 5 deletions(-) diff --git a/NEWS.md b/NEWS.md index fc998538f580..d5eed516db95 100644 --- a/NEWS.md +++ b/NEWS.md @@ -51,6 +51,11 @@ * `x.^y` * where `x` and `y` are `NDArray`s. +* Elementwise power of irrational and `NDArray` (#TBD) + * `e.^x` + * `x.^e` + * `π.^x` + ## API Changes * `reshape` of NDArray shares the same interface with Base (#272). diff --git a/src/base.jl b/src/base.jl index 5df0de509eec..e75dc3b6ac65 100644 --- a/src/base.jl +++ b/src/base.jl @@ -157,11 +157,12 @@ end # # TODO: find a better solution in case this cause issues in the future. 
################################################################################ -dump_mx_param(val::Any) = string(val) -dump_mx_param(val::Float64) = @sprintf("%.16e", val) -dump_mx_param(val::Float32) = @sprintf("%.8e", val) -dump_mx_param(val::Float16) = @sprintf("%.4e", val) -dump_mx_param(shape::NTuple{N, T}) where {N, T<:Integer} = +dump_mx_param(val::Any) = string(val) +dump_mx_param(val::Float64) = @sprintf("%.16e", val) +dump_mx_param(val::Float32) = @sprintf("%.8e", val) +dump_mx_param(val::Float16) = @sprintf("%.4e", val) +dump_mx_param(val::Irrational) = @sprintf("%.16e", val) +dump_mx_param(shape::NTuple{N, <:Integer}) where N = string(tuple(flipdim([shape...], 1)...)) diff --git a/src/ndarray.jl b/src/ndarray.jl index fb495af34ff1..98f7dddc6fa1 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -754,6 +754,10 @@ broadcast_(::typeof(^), x::NDArray, y::NDArray) = _power(x, y) broadcast_(::typeof(^), x::NDArray, s::Real) = _power_scalar(x, scalar=s) broadcast_(::typeof(^), s::Real, x::NDArray) = _rpower_scalar(x, scalar=s) +broadcast_(::typeof(^), ::Irrational{:e}, x::NDArray) = exp(x) +broadcast_(::typeof(^), x::NDArray, s::Irrational) = _power_scalar(x, scalar=s) +broadcast_(::typeof(^), s::Irrational, x::NDArray) = _rpower_scalar(x, scalar=s) + """ fill!(x, arr::NDArray) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index ac9090e3ca33..26d40463adb4 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -516,6 +516,22 @@ function test_power() @test copy(y.^x) == Float32[2 4; 8 16] end + info("NDArray::power::e.^x::x.^e") + let x = mx.zeros(2, 3), A = [1 1 1; 1 1 1] + @test copy(e.^x) ≈ A + end + + let A = Float32[1 2; 3 4], x = mx.NDArray(A) + @test copy(e.^x) ≈ e.^A + @test copy(x.^e) ≈ A.^e + end + + info("NDArray::power::π.^x::x.^π") + let A = Float32[1 2; 3 4], x = mx.NDArray(A) + @test copy(π.^x) ≈ π.^A + @test copy(x.^π) ≈ A.^π + end + # TODO: Float64: wait for 
https://github.com/apache/incubator-mxnet/pull/8012 end # function test_power From 00d61d237319277b042e1235c8524ef40029a141 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 9 Nov 2017 23:07:23 +0800 Subject: [PATCH 538/630] executor: return `outputs` on forward (#312) --- src/executor.jl | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/executor.jl b/src/executor.jl index 38f3925293c1..036c5743b7c0 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -156,7 +156,7 @@ function simple_bind(self :: SymbolicNode, ctx :: Context; end -function forward(self :: Executor; is_train::Bool=false, kwargs...) +function forward(self::Executor; is_train::Bool = false, kwargs...) for (k,v) in kwargs @assert(k ∈ self.arg_dict, "Unknown argument $k") @assert(isa(v, NDArray), "Keyword argument $k must be an NDArray") @@ -164,6 +164,8 @@ function forward(self :: Executor; is_train::Bool=false, kwargs...) end @mxcall(:MXExecutorForward, (MX_handle, Cint), self, is_train) + + self.outputs end function backward(self :: Executor) From 3f93ffc42cf159381b8b5e1459d8f0523bd60ba5 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 9 Nov 2017 23:08:40 +0800 Subject: [PATCH 539/630] git: union merge policy for NEWS.md (#309) --- .gitattributes | 1 + 1 file changed, 1 insertion(+) create mode 100644 .gitattributes diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 000000000000..4b76ca8606cb --- /dev/null +++ b/.gitattributes @@ -0,0 +1 @@ +NEWS.md merge=union From 678b49e433f6c8f69255461301858cf12101114a Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 9 Nov 2017 23:41:05 +0800 Subject: [PATCH 540/630] ndarray: regularize fill! 
API (#311) In Base, it's fill!(A, x) --- NEWS.md | 2 +- src/ndarray.jl | 6 +++--- test/unittest/ndarray.jl | 4 ++-- 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/NEWS.md b/NEWS.md index d5eed516db95..fcd48dc3f81e 100644 --- a/NEWS.md +++ b/NEWS.md @@ -11,7 +11,7 @@ * `fill(x, dims, ctx=cpu())` * `fill(x, dims...)` - * `fill!(x, arr::NDArray)` + * `fill!(arr::NDArray, x)` * Matrix (2D NDArray) multiplication is available now. (#TBD) diff --git a/src/ndarray.jl b/src/ndarray.jl index 98f7dddc6fa1..18db4f38b9ea 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -759,11 +759,11 @@ broadcast_(::typeof(^), x::NDArray, s::Irrational) = _power_scalar(x, scalar=s) broadcast_(::typeof(^), s::Irrational, x::NDArray) = _rpower_scalar(x, scalar=s) """ - fill!(x, arr::NDArray) + fill!(arr::NDArray, x) -Create an `NDArray` filled with the value `x`, like `Base.fill`. +Create an `NDArray` filled with the value `x`, like `Base.fill!`. """ -function fill!(x, arr::NDArray) +function Base.fill!(arr::NDArray, x) arr[:] = x arr end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 26d40463adb4..81093376ad2d 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -706,10 +706,10 @@ function test_fill() end info("NDArray::fill!::arr") - let x = mx.fill!(42, mx.zeros(2, 3, 4)) + let x = fill!(mx.zeros(2, 3, 4), 42) @test eltype(x) == Float32 @test size(x) == (2, 3, 4) - @test reldiff(copy(x), fill(Float32(42), 2, 3, 4)) < thresh + @test copy(x) ≈ fill(Float32(42), 2, 3, 4) end end # function test_fill From e083e5f295d35daa4820a21bd50d296ba230942f Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 11 Nov 2017 00:19:42 +0800 Subject: [PATCH 541/630] doc: cleanup useless enc file (#315) --- docs/.documenter.enc | Bin 1680 -> 0 bytes 1 file changed, 0 insertions(+), 0 deletions(-) delete mode 100644 docs/.documenter.enc diff --git a/docs/.documenter.enc b/docs/.documenter.enc deleted file mode 100644 index 
48bd92bc4742234f2364e62fe899efdf64a1f5d8..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 1680 zcmV;B25rWS<*O0{K{-TA^4}R}MY#~pBnC~nXf)$xi`VgJ=(}CLo z99B@ySk*kZH{=OD%kZt*$@gI0bE~V&8IFr)?w5O6@f*MXO1rRL!8xs5b~i-YSaAz8 z?Oa!ONEJ)LuTIWymjXYs=Oi>jHonzG$sc;Z*bK0{asSaCl)K8Dt9hwefjeLh>CozO zqh;;QUGT7%|V}q;lmM@=0X9JJ!pB?v8#q`2cOu+ zU@YKi4jzn?`JhZiTmUfQFk4;S}Pw~t=F}U z$%Rz&t@nw^pFcHC2L-yI$Y*cB3#7Rxc^W0K%)Ks79+Uzgm`KXYOBtz%nbUK)6W{GD z6vGFcsUm(_XRIWEX3zin!FjO}Sz?&zh2<}q#6!7T#mDR*Upz5b8j3x4wws>0y8d2U zgr4|K1?&yV3gZfVwYp8Mk)r^>44lPXYH~*@OrgnM4=fOdZBZK!f2-)hDy5ti9w|to z3b(Q=|AHjoLA#w>fJ(S+W#2{r*t{_IpAvCG#Dzda4Y6A710Z2cBun5P^+T7Tm*oQd z1GpiOufpgUcuJQvxFw|HHB`nA_*$k*K{RRaP4)YfMu!gzCr!upY4?3CSKuLt4nsHk z7GV%hH^^e+!1|r&n~=xskC>gi03^36$z|~i_qZ2JUcTV%POTl65g}~L$K<+;J@wUSt;2vLL4Ojd?W zBFdaPoa|QQmU>G641cN1B)OdmcaScG-0Zu4 zafkd|kBaQySh0;{(bK&+u)17jYVSCTLTJ3Yud0x;nOIIGq{LUyoxoez_PJcAA=DK< znsoy=qR64tOErR%#{xT9UVX&!%X)SR<|qo_MO@5o2!lje^^fxFuyLo!EM`7@P9Z(`Iqdg=4#^%Q8z=!DfcOz&iz zHt+S7=xTE<>f>P?R*4NHpCz5FiKsVp^Ld zd5$9(3lZ3}iDb`iIty37map_wc;xQPUfE59I#tt(Kp2#wv?ea~%%2gdJ4%Mt(%~9d zRHCY}3szlG0?5myNXNw9CBbPl_uoPVNqr%~LyW*k;fnaIS6ZXp9i@{Y}u8$kaBHuAgSBe z29Hcga%%BupHsJhkLpmccg5yF!GveSFS*-xYBpnpNO-TiIzIo+%#)oUKoVD`UI~HO z$TkJN-PR>vZr&d{r9ca1?@0Y3U{V?O`WSuiW!9;0Uh2#KbU_q{C38*|0zxhApkC&X zeUx~}r7VL8qdBHi48~Lh&rPXZviPvjgScMatjU&#pKvk^C8E`Wu{OUd>%v70GDn2S aF;ziPu#v|oq3fM$n|LCvE&l?FaMg<7X*&S` From 09b9718952582bea5d9e149025024568461c9bb3 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 13 Nov 2017 10:47:58 +0800 Subject: [PATCH 542/630] build: prevent CUDA_HOME KeyError (#316) address: https://github.com/dmlc/MXNet.jl/issues/316#issuecomment-343660751 --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 86d6a9839287..c1463da5c04f 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -63,7 +63,7 @@ if HAS_CUDA if HAS_CUDNN info("Found a CuDNN installation.") end - info("CUDA_HOME -> 
$(ENV["CUDA_HOME"])") + info("CUDA_HOME -> $(get(ENV, "CUDA_HOME", nothing))") else info("Did not find a CUDA installation, using CPU-only version of MXNet.") end From 9304e6e36a36488209ecc5a37f20ddaa7a8c4ebb Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 13 Nov 2017 11:51:23 +0800 Subject: [PATCH 543/630] sym: broadcast unfusion (#314) * sym: broadcast unfusion for `add` * sym: broadcast unfusion for `minus` * sym: broadcast unfusion for `multiplication` * sym: broadcast unfusion for `div` * sym: broadcast unfusion for `power` * sym: broadcast unfusion for `power` with irrational --- src/ndarray.jl | 4 +- src/symbolic-node.jl | 173 ++++++++++++------------ test/common.jl | 12 ++ test/unittest/symbolic-node.jl | 233 ++++++++++++++++++++++++++++++++- 4 files changed, 338 insertions(+), 84 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 18db4f38b9ea..3e4cff5591d5 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -722,7 +722,7 @@ import Base: / """ ./(x::NDArray, y::NDArray) ./(x::NDArray, y::Real) - ./(x:: Real, y::NDArray) + ./(x::Real, y::NDArray) * Elementwise dividing an `NDArray` by a scalar or another `NDArray` of the same shape. @@ -746,7 +746,7 @@ import Base: ^ .^(x::NDArray, s::Real) .^(s::Real, x::NDArray) -Elementwise power of NDArray. +Elementwise power of `NDArray`. """ ^ diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 80daae1f53de..72eb60b3a8c0 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -10,11 +10,15 @@ Make a new node by composing `self` with `args`. Or the arguments can be specified using keyword arguments. 
""" mutable struct SymbolicNode - handle :: MX_SymbolHandle + handle::MX_SymbolHandle end -function Base.unsafe_convert(::Type{MX_handle}, obj::SymbolicNode) + +const SymbolicNodeOrReal = Union{SymbolicNode, Real} + +@unfuse SymbolicNode # for broadcasting + +Base.unsafe_convert(::Type{MX_handle}, obj::SymbolicNode) = Base.unsafe_convert(MX_handle, obj.handle) -end Base.convert(t::Type{MX_handle}, obj::SymbolicNode) = Base.unsafe_convert(t, obj) Base.cconvert(t::Type{MX_handle}, obj::SymbolicNode) = Base.unsafe_convert(t, obj) @@ -483,105 +487,112 @@ function Base.getindex(self :: SymbolicNode, idx :: Int) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end -import Base.broadcast import Base: + -function +(self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) - ret = self - for arg in args - if isa(arg, SymbolicNode) - ret = _Plus(ret, arg) + +""" + +(args...) + .+(args...) + +Elementwise summation of `SymbolicNode`. +""" +function +(x::SymbolicNode, ys::SymbolicNodeOrReal...) + ret = x + for y ∈ ys + if y isa SymbolicNode + ret = _plus(ret, y) else - ret = _PlusScalar(ret, scalar=MX_float(arg)) + ret = _plus_scalar(ret, scalar=MX_float(y)) end end ret end -@compatdot function Base.broadcast(::typeof(+), self::SymbolicNode, args::Union{SymbolicNode,Real}...) - +(self, args...) -end -function +(s1 :: Real, self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) - +(self, s1, args...) -end -@compatdot function Base.broadcast(::typeof(+), s1::Real, self::SymbolicNode, - args::Union{SymbolicNode,Real}...) - +(self, s1, args...) -end + ++(s::Real, x::SymbolicNode, ys::SymbolicNodeOrReal...) = +(x + s, ys...) + +broadcast_(::typeof(+), x::SymbolicNode, ys::SymbolicNodeOrReal...) = +(x, ys...) +broadcast_(::typeof(+), s::Real, x::SymbolicNode, ys::SymbolicNodeOrReal...) = +(x + s, ys...) 
import Base: - -function -(self :: SymbolicNode, arg :: SymbolicNode) - _Minus(self, arg) -end -@compatdot function Base.broadcast(::typeof(-), self :: SymbolicNode, arg :: SymbolicNode) - -(self, arg) -end -function -(self :: SymbolicNode, arg :: Real) - _MinusScalar(self, scalar=MX_float(arg)) -end -@compatdot function Base.broadcast(::typeof(-), self :: SymbolicNode, arg :: Real) - -(self, arg) -end -function -(arg :: Real, self :: SymbolicNode) - _RMinusScalar(self, scalar=arg) -end -@compatdot function Base.broadcast(::typeof(-), arg :: Real, self :: SymbolicNode) - -(arg, self) -end +""" + -(x, y) + .-(x, y) -function -(self :: SymbolicNode) - -(0, self) -end +Elementwise substraction of `SymbolicNode`. +Operating with `Real` is available. +""" +x::SymbolicNode - y::SymbolicNode = _minus(x, y) +x::SymbolicNode - s::Real = _minus_scalar(x, scalar=MX_float(s)) +s::Real - x::SymbolicNode = _rminus_scalar(x, scalar=MX_float(s)) + +-(x::SymbolicNode) = 0 - x + +broadcast_(::typeof(-), x::SymbolicNode, y::SymbolicNodeOrReal) = x - y +broadcast_(::typeof(-), s::Real, x::SymbolicNode) = s - x import Base: * -@compatdot function Base.broadcast(::typeof(*), self :: SymbolicNode, args :: Union{SymbolicNode,Real}...) - ret = self - for arg in args - if isa(arg, SymbolicNode) - ret = _Mul(ret, arg) + +""" + .*(x, y) + +Elementwise multiplication of `SymbolicNode`. +""" +x::SymbolicNode * s::Real = _mul_scalar(x, scalar=MX_float(s)) +s::Real * x::SymbolicNode = _mul_scalar(x, scalar=MX_float(s)) + +function broadcast_(::typeof(*), x::SymbolicNode, ys::SymbolicNodeOrReal...) + ret = x + for y in ys + if y isa SymbolicNode + ret = _mul(ret, y) else - ret = _MulScalar(ret, scalar=MX_float(arg)) + ret = _mul_scalar(ret, scalar=MX_float(y)) end end ret end -@compatdot function Base.broadcast(::typeof(*), arg :: Real, self :: SymbolicNode, - args :: Union{SymbolicNode,Real}...) - broadcast(*, self, arg, args...) 
-end -function *(arg :: Real, self :: SymbolicNode) - _MulScalar(self, scalar=arg) -end -function *(self :: SymbolicNode, arg :: Real) - *(arg, self) -end + +broadcast_(::typeof(*), s::Real, x::SymbolicNode, ys::SymbolicNodeOrReal...) = + broadcast_(*, x * s, ys...) import Base: / -@compatdot function Base.broadcast(::typeof(/), self :: SymbolicNode, arg :: SymbolicNode) - _Div(self, arg) -end -@compatdot function Base.broadcast(::typeof(/), self :: SymbolicNode, arg :: Real) - _DivScalar(self, scalar=MX_float(arg)) -end -function /(self :: SymbolicNode, arg :: Real) - self ./ arg -end -function /(arg :: Real, self :: SymbolicNode) - _RDivScalar(self, scalar=arg) -end -@compatdot function Base.broadcast(::typeof(/), arg :: Real, self :: SymbolicNode) - _RDivScalar(self, scalar=arg) -end + +""" + ./(x, y) + +* Elementwise dividing a `SymbolicNode` by a scalar or another `SymbolicNode` +of the same shape. + +* Elementwise divide a scalar by an `SymbolicNode`. + +* Matrix division (solving linear systems) is not implemented yet. +""" +x::SymbolicNode / s::Real = _DivScalar(x, scalar=MX_float(s)) + +broadcast_(::typeof(/), x::SymbolicNode, y::SymbolicNode) = _div(x, y) +broadcast_(::typeof(/), x::SymbolicNode, s::Real) = _div_scalar(x, scalar=MX_float(s)) +broadcast_(::typeof(/), s::Real, x::SymbolicNode) = _rdiv_scalar(x, scalar=MX_float(s)) + import Base: ^ -@compatdot function Base.broadcast(::typeof(^), self :: SymbolicNode, pow :: SymbolicNode) - _Power(self, pow) -end -@compatdot function Base.broadcast(::typeof(^), self :: SymbolicNode, pow :: AbstractFloat) - _PowerScalar(self, scalar=pow) -end -function ^(self :: SymbolicNode, pow :: AbstractFloat) - self .^ pow -end + +""" + .^(x, y) + +Elementwise power of `SymbolicNode`. +Operating with `Real` is available. 
+""" +^ + +broadcast_(::typeof(^), x::SymbolicNode, y::SymbolicNode) = _power(x, y) +broadcast_(::typeof(^), x::SymbolicNode, s::Real) = _power_scalar(x, scalar=MX_float(s)) +broadcast_(::typeof(^), s::Real, x::SymbolicNode) = _rpower_scalar(x, scalar=MX_float(s)) + +broadcast_(::typeof(^), ::Irrational{:e}, x::SymbolicNode) = exp(x) +broadcast_(::typeof(^), x::SymbolicNode, s::Irrational) = + _power_scalar(x, scalar=MX_float(s)) +broadcast_(::typeof(^), s::Irrational, x::SymbolicNode) = + _rpower_scalar(x, scalar=MX_float(s)) function _compose!(node :: SymbolicNode; kwargs...) name = char_p(0) diff --git a/test/common.jl b/test/common.jl index 035650e74f72..53c9c251ef06 100644 --- a/test/common.jl +++ b/test/common.jl @@ -25,3 +25,15 @@ function mlpchain() mx.Activation(act_type=:relu) => mx.FullyConnected(name=:fc2, num_hidden=10) end + +""" +execution helper of SymbolicNode +""" +function exec(x::mx.SymbolicNode; feed...) + ks, vs = zip(feed...) + vs′ = mx.NDArray.(vs) + + e = mx.bind(x, context = mx.cpu(), args = Dict(zip(ks, vs′))) + mx.forward(e) + e.outputs +end diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index e81ef52055b1..39eda86b1bb2 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -2,7 +2,7 @@ module TestSymbolicNode using MXNet using Base.Test -using ..Main: mlp2, mlpchain, reldiff +using ..Main: mlp2, mlpchain, reldiff, exec ################################################################################ # Test Implementations @@ -256,6 +256,232 @@ function test_misc() symb = mx.ElementWiseSum(a,b) end +function test_add() + info("SymbolicNode::elementwise add") + let x = mx.Variable(:x), A = Float32[1 2; 3 4] + let y = exec(x .+ 42; :x => A)[] + @test size(y) == size(A) + @test copy(y) == A .+ 42 + end + + let y = exec(42 .+ x; :x => A)[] + @test size(y) == size(A) + @test copy(y) == 42 .+ A + end + + let y = exec(-1 .+ x .+ 42; :x => A)[] + @test size(y) == size(A) + @test copy(y) 
== -1 .+ A .+ 42 + end + end + + let A = Float32[1 2; 3 4], B = Float32[2 4; 6 8] + x = mx.Variable(:x) + y = mx.Variable(:y) + + let z = x .+ y + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) == A .+ B + end + + let z = y .+ x + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) == B .+ A + end + end +end # function test_add + +function test_minus() + info("SymbolicNode::elementwise minus") + let x = mx.Variable(:x), A = Float32[1 2; 3 4] + let y = exec(x .- 42; :x => A)[] + @test size(y) == size(A) + @test copy(y) == A .- 42 + end + + let y = exec(42 .- x; :x => A)[] + @test size(y) == size(A) + @test copy(y) == 42 .- A + end + + let y = exec(-1 .- x .- 42; :x => A)[] + @test size(y) == size(A) + @test copy(y) == -1 .- A .- 42 + end + + let y = exec(-x; :x => A)[] + @test size(y) == size(A) + @test copy(y) == -A + end + end + + let A = Float32[1 2; 3 4], B = Float32[2 4; 6 8] + x = mx.Variable(:x) + y = mx.Variable(:y) + + let z = x .- y + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) == A .- B + end + + let z = y .- x + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) == B .- A + end + end +end # function test_minus + +function test_mul() + info("SymoblicNode::elementwise mul") + let x = mx.Variable(:x), A = Float32[1 2; 3 4] + let y = exec(x .* 42; :x => A)[] + @test size(y) == size(A) + @test copy(y) == A .* 42 + end + + let y = exec(42 .* x; :x => A)[] + @test size(y) == size(A) + @test copy(y) == 42 .* A + end + + let y = exec(-1 .* x .* 42; :x => A)[] + @test size(y) == size(A) + @test copy(y) == -1 .* A .* 42 + end + end + + let A = Float32[1 2; 3 4], B = Float32[2 4; 6 8] + x = mx.Variable(:x) + y = mx.Variable(:y) + + let z = x .* y + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) == A .* B + end + + let z = y .* x + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) == B .* A + end + 
end +end # function test_mul + +function test_div() + info("SymoblicNode::elementwise div") + let x = mx.Variable(:x), A = Float32[1 2; 3 4] + let y = exec(x ./ 42; :x => A)[] + @test size(y) == size(A) + @test copy(y) ≈ A ./ 42 + end + + let y = exec(42 ./ x; :x => A)[] + @test size(y) == size(A) + @test copy(y) ≈ 42 ./ A + end + + let y = exec(-1 ./ x ./ 42; :x => A)[] + @test size(y) == size(A) + @test copy(y) ≈ -1 ./ A ./ 42 + end + end + + let A = Float32[1 2; 3 4], B = Float32[2 4; 6 8] + x = mx.Variable(:x) + y = mx.Variable(:y) + + let z = x ./ y + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) ≈ A ./ B + end + + let z = y ./ x + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) ≈ B ./ A + end + end +end # function test_div + +function test_power() + info("SymoblicNode::elementwise power") + let x = mx.Variable(:x), A = Float32[1 2; 3 4] + let y = exec(x.^42; :x => A)[] + @test size(y) == size(A) + @test copy(y) ≈ A.^42 + end + + let y = exec(42.^x; :x => A)[] + @test size(y) == size(A) + @test copy(y) ≈ 42.^A + end + end + + let A = Float32[1 2; 3 4], B = Float32[2 4; 6 8] + x = mx.Variable(:x) + y = mx.Variable(:y) + + let z = x.^y + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) ≈ A.^B + end + + let z = y.^x + z = exec(z; :x => A, :y => B)[] + + @test size(z) == size(A) + @test copy(z) ≈ B.^A + end + end + + info("NDArray::power::e.^x::x.^e") + let x = mx.Variable(:x), A = [0 0 0; 0 0 0] + y = exec(e.^x; :x => A)[] + @test copy(y) ≈ ones(A) + end + + let x = mx.Variable(:x), A = Float32[1 2; 3 4] + let y = e.^x + z = exec(y; :x => A)[] + @test copy(z) ≈ e.^A + end + + let y = x.^e + z = exec(y; :x => A)[] + @test copy(z) ≈ A.^e + end + end + + info("NDArray::power::π.^x::x.^π") + let x = mx.Variable(:x), A = Float32[1 2; 3 4] + let y = π.^x + z = exec(y; :x => A)[] + @test copy(z) ≈ π.^A + end + + let y = x.^π + z = exec(y; :x => A)[] + @test copy(z) ≈ A.^π + end + end 
+end # function test_power + ################################################################################ # Run tests ################################################################################ @@ -273,6 +499,11 @@ end test_dot() test_print() test_misc() + test_add() + test_minus() + test_mul() + test_div() + test_power() end end From f8e1938e5096c9522e84f523f4bd2e43db11446e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 13 Nov 2017 13:34:29 +0800 Subject: [PATCH 544/630] Remove Compat and src/compat.jl (#318) --- REQUIRE | 1 - src/MXNet.jl | 2 -- src/compat.jl | 23 ----------------------- src/optimizers/adadelta.jl | 6 +++--- src/optimizers/adagrad.jl | 2 +- src/optimizers/adam.jl | 4 ++-- src/optimizers/nadam.jl | 2 +- src/optimizers/rmsprop.jl | 2 +- 8 files changed, 8 insertions(+), 34 deletions(-) delete mode 100644 src/compat.jl diff --git a/REQUIRE b/REQUIRE index 8c07e3f8b273..22caea9072b7 100644 --- a/REQUIRE +++ b/REQUIRE @@ -1,5 +1,4 @@ julia 0.6 -Compat 0.25.2 Formatting BinDeps JSON diff --git a/src/MXNet.jl b/src/MXNet.jl index 85991473d14c..d80bbd3d3cdd 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -24,8 +24,6 @@ import Base: round, ceil, floor, cos, sin, abs, sign, exp, sqrt, exp, log, norm, include("base.jl") -include("compat.jl") - include("context.jl") include("util.jl") diff --git a/src/compat.jl b/src/compat.jl deleted file mode 100644 index 257f1c2863ed..000000000000 --- a/src/compat.jl +++ /dev/null @@ -1,23 +0,0 @@ -# this file contains code used for enabling backward compatibility with 0.5 - -# have to import base dotted operators if in 0.5 - - -# this is for declaring broadcasted functions in 0.5 -# TODO this macro should be removed when 0.5 support is dropped -macro compatdot(fblock) - return esc(fblock) - @capture(fblock, function Base.broadcast(::typeof(op_), args__) - body_ - end) - opdot = Symbol(string('.',op)) - esc(quote - function $opdot($(args...)) - $body - end - end) -end - -macro compatmul(expr1, expr2) - 
esc(:(broadcast(*, $expr1, $expr2))) -end diff --git a/src/optimizers/adadelta.jl b/src/optimizers/adadelta.jl index f15ff93c7beb..3915d036496a 100644 --- a/src/optimizers/adadelta.jl +++ b/src/optimizers/adadelta.jl @@ -78,14 +78,14 @@ function update(self :: AdaDelta, index :: Int, weight :: NDArray, # Update state.acc as in RMSProp @inplace state.acc .*= self.opts.rho - @inplace state.acc .+= (1 - self.opts.rho) * @compatmul(grad, grad) + @inplace state.acc .+= (1 - self.opts.rho) * grad .* grad # Compute update using the "old" state.delta_acc - update = @compatmul(grad, sqrt(state.delta_acc + self.opts.epsilon)) ./ + update = grad .* sqrt(state.delta_acc + self.opts.epsilon) ./ (sqrt(state.acc + self.opts.epsilon)) @inplace weight .+= -lr * update # update state.delta_acc using update @inplace state.delta_acc .*= self.opts.rho - @inplace state.delta_acc .+= (1 - self.opts.rho) * @compatmul(update, update) + @inplace state.delta_acc .+= (1 - self.opts.rho) * update .* update end diff --git a/src/optimizers/adagrad.jl b/src/optimizers/adagrad.jl index d12ca43d15b2..a5eee0bbd102 100644 --- a/src/optimizers/adagrad.jl +++ b/src/optimizers/adagrad.jl @@ -61,6 +61,6 @@ function update(self :: AdaGrad, index :: Int, weight :: NDArray, lr = get_learning_rate(self.opts.lr_scheduler, self.state) grad = normalized_gradient(self.opts, self.state, weight, grad) - @inplace state .+= @compatmul(grad, grad) + @inplace state .+= grad .* grad @inplace weight .+= -lr * grad ./ (sqrt(state + self.opts.epsilon)) end diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index b8a6e9d385c0..aa1bc90f9f78 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -60,8 +60,8 @@ function update(self :: ADAM, index :: Int, weight :: NDArray, grad :: NDArray, lr = state.current_lr grad = normalized_gradient(self.opts, self.state, weight, grad) - state.mt = self.opts.beta1 * state.mt + (1 - self.opts.beta1) * grad - state.vt = self.opts.beta2 * state.vt + (1 - 
self.opts.beta2) * @compatmul(grad, grad) + state.mt = self.opts.beta1 * state.mt + (1 - self.opts.beta1) .* grad + state.vt = self.opts.beta2 * state.vt + (1 - self.opts.beta2) .* grad .* grad at = sqrt(1.0 - state.beta2Power)/(1.0 - state.beta1Power) diff --git a/src/optimizers/nadam.jl b/src/optimizers/nadam.jl index 3b39c0aaefbe..c3ac18dcc11a 100644 --- a/src/optimizers/nadam.jl +++ b/src/optimizers/nadam.jl @@ -91,7 +91,7 @@ function update(self :: Nadam, index :: Int, weight :: NDArray, mt = state.mt / (1.0 - momentum_next) @inplace state.nt .*= self.opts.beta2 - @inplace state.nt .+= (1.0 - self.opts.beta2) * @compatmul(grad, grad) + @inplace state.nt .+= (1.0 - self.opts.beta2) .* grad .* grad nt = state.nt / (1.0 - state.beta2Power) state.beta2Power *= self.opts.beta2 diff --git a/src/optimizers/rmsprop.jl b/src/optimizers/rmsprop.jl index 274e510f6cfe..8afed0adc81d 100644 --- a/src/optimizers/rmsprop.jl +++ b/src/optimizers/rmsprop.jl @@ -65,7 +65,7 @@ function update(self :: RMSProp, index :: Int, weight :: NDArray, grad = normalized_gradient(self.opts, self.state, weight, grad) @inplace state .*= self.opts.rho - @inplace state .+= (1 - self.opts.rho) * @compatmul(grad, grad) + @inplace state .+= (1 - self.opts.rho) * grad .* grad @inplace weight .+= -lr * grad ./ (sqrt(state + self.opts.epsilon)) end From a19fc93859b17882615e45b7d23d02fc579cd688 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 14 Nov 2017 01:15:16 +0800 Subject: [PATCH 545/630] test: replace `reldiff` with `isapprox` (#321) * test/ndarray: replace `reldiff` with `isapprox` * test/symbolic-node: replace `reldiff` with `isapprox` * test/operator: replace `reldiff` with `isapprox` * test/io: replace `reldiff` with `isapprox` * test: remove `reldiff` --- test/common.jl | 6 -- test/unittest/bind.jl | 2 +- test/unittest/io.jl | 14 +-- test/unittest/ndarray.jl | 169 ++++++++++++++++----------------- test/unittest/operator.jl | 7 +- test/unittest/symbolic-node.jl | 15 +-- 6 files changed, 
104 insertions(+), 109 deletions(-) diff --git a/test/common.jl b/test/common.jl index 53c9c251ef06..5854fc6659d0 100644 --- a/test/common.jl +++ b/test/common.jl @@ -1,12 +1,6 @@ ################################################################################ # Common models used in testing ################################################################################ -function reldiff(a, b) - diff = sum(abs.(a .- b)) - norm = sum(abs.(a)) - return diff / (norm + 1e-10) -end - function rand_dims(max_ndim=6) tuple(rand(1:10, rand(1:max_ndim))...) end diff --git a/test/unittest/bind.jl b/test/unittest/bind.jl index 77be97745926..3bac43f2345c 100644 --- a/test/unittest/bind.jl +++ b/test/unittest/bind.jl @@ -2,7 +2,7 @@ module TestBind using MXNet using Base.Test -using ..Main: rand_dims, reldiff +using ..Main: rand_dims ################################################################################ # Test Implementations diff --git a/test/unittest/io.jl b/test/unittest/io.jl index 88d77bd3c16b..f8e558613c99 100644 --- a/test/unittest/io.jl +++ b/test/unittest/io.jl @@ -1,8 +1,9 @@ module TestIO + using MXNet using Base.Test -using ..Main: rand_dims, reldiff +using ..Main: rand_dims function test_mnist() info("IO::MNIST") @@ -64,7 +65,7 @@ function test_arrays_impl(data::Vector, label::Vector, provider::mx.ArrayDataPro data_get = mx.get_data(provider, batch) for (d_real, d_get) in zip(data_batch, data_get) - @test reldiff(d_real, copy(d_get)[[1:n for n in size(d_real)]...]) < 1e-6 + @test d_real ≈ copy(d_get)[[1:n for n in size(d_real)]...] 
@test mx.count_samples(provider, batch) == size(d_real)[end] end end @@ -97,7 +98,7 @@ function test_arrays_shuffle() sample_count = 15 batch_size = 4 - data = rand(1, sample_count) + data = rand(mx.MX_float, 1, sample_count) label = collect(1:sample_count) provider = mx.ArrayDataProvider(data, :index => label, batch_size=batch_size, shuffle=true) @@ -107,14 +108,15 @@ function test_arrays_shuffle() for (idx, batch) in zip(idx_all, provider) data_batch = mx.get(provider, batch, :data) label_batch = mx.get(provider, batch, :index) - ns_batch = mx.count_samples(provider, batch) - data_got[idx:idx+ns_batch-1] = copy(data_batch)[1:ns_batch] + ns_batch = mx.count_samples(provider, batch) + data_got[idx:idx+ns_batch-1] = copy(data_batch)[1:ns_batch] label_got[idx:idx+ns_batch-1] = copy(label_batch)[1:ns_batch] end @test label_got != label @test sort(label_got) == label - @test reldiff(data_got, data[:,Int[label_got...]]) < 1e-6 + @test size(data_got) == size(data[:, Int[label_got...]]) + @test data_got ≈ data[:, Int[label_got...]] end @testset "IO Test" begin diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 81093376ad2d..0e1837bdd5a3 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -1,8 +1,9 @@ module TestNDArray + using MXNet using Base.Test -using ..Main: rand_dims, reldiff +using ..Main: rand_dims ################################################################################ # Test Implementations @@ -23,12 +24,12 @@ function test_copy() # copy to NDArray and back array = copy(tensor, mx.cpu()) tensor2 = copy(array) - @test reldiff(tensor, tensor2) < 1e-6 + @test tensor ≈ tensor2 # copy between NDArray array2 = copy(array, mx.cpu()) tensor2 = copy(array2) - @test reldiff(tensor, tensor2) < 1e-6 + @test tensor ≈ tensor2 end function test_deepcopy() @@ -43,44 +44,43 @@ end function test_assign() dims = rand_dims() tensor = rand(mx.MX_float, dims) - thresh = 1e-3 info("NDArray::assign::dims = $dims") # Julia Array -> NDArray 
assignment array = mx.empty(size(tensor)) array[:]= tensor - @test reldiff(tensor, copy(array)) < thresh + @test tensor ≈ copy(array) array2 = mx.zeros(size(tensor)) - @test reldiff(zeros(size(tensor)), copy(array2)) < thresh + @test zeros(size(tensor)) ≈ copy(array2) array3 = mx.zeros(Float16, size(tensor)) - @test reldiff(zeros(Float16, size(tensor)), copy(array2)) < thresh + @test zeros(Float16, size(tensor)) ≈ copy(array2) # scalar -> NDArray assignment scalar = rand() array2[:] = scalar - @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < thresh + @test zeros(size(tensor)) + scalar ≈ copy(array2) scalar = rand(Float16) array2[:] = scalar - @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < thresh + @test zeros(size(tensor)) + scalar ≈ copy(array2) scalar = rand(Float64) array2[:] = scalar array3[:] = scalar - @test reldiff(zeros(size(tensor))+scalar, copy(array2)) < thresh - @test reldiff(zeros(Float16,size(tensor))+scalar, copy(array3)) < thresh + @test zeros(size(tensor)) + scalar ≈ copy(array2) + @test zeros(Float16, size(tensor)) + scalar ≈ copy(array3) # NDArray -> NDArray assignment array[:] = array2 - @test reldiff(zeros(size(tensor))+scalar, copy(array)) < thresh + @test zeros(size(tensor)) + scalar ≈ copy(array) end function test_slice() - array = mx.zeros((2,4)) - array[2:3] = ones(2,2) + array = mx.zeros((2, 4)) + array[2:3] = ones(2, 2) @test copy(array) == [0 1 1 0; 0 1 1 0] @test copy(mx.slice(array, 2:3)) == [1 1; 1 1] end @@ -152,48 +152,47 @@ function test_plus() t1, a1 = rand_tensors(dims) t2, a2 = rand_tensors(dims) t3, a3 = rand_tensors(dims) - thresh = 1e-6 info("NDArray::plus::dims = $dims") - @test reldiff(t1+t2, copy(a1+a2)) < thresh - @test reldiff(t1.+t2, copy(a1.+a2)) < thresh + @test t1 + t2 ≈ copy(a1 + a2) + @test t1 .+ t2 ≈ copy(a1 .+ a2) - @test reldiff(t1+t2+t3, copy(a1+a2+a3)) < thresh + @test t1 + t2 + t3 ≈ copy(a1 + a2 + a3) # test inplace += operation a0 = a1 # keep a reference to a1 @mx.inplace a1 += a2 # 
perform inplace += @test a0 == a1 # make sure they are still the same object - @test reldiff(copy(a0), copy(a1)) < thresh - @test reldiff(copy(a1), t1+t2) < thresh + @test copy(a0) ≈ copy(a1) + @test copy(a1) ≈ t1 + t2 # test scalar scalar = rand() - @test reldiff(t3 + scalar, copy(a3 + scalar)) < thresh - @test reldiff(t2+scalar+t3, copy(a2+scalar+a3)) < thresh + @test t3 + scalar ≈ copy(a3 + scalar) + @test t2 + scalar + t3 ≈ copy(a2 + scalar + a3) # test small and large scalar t4 = zeros(Float32, dims) a4 = copy(t4, mx.cpu()) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t4 + scalar_small, copy(a4 .+ scalar_small)) < thresh - @test reldiff(t4 + scalar_large, copy(a4 .+ scalar_large)) < thresh + @test t4 + scalar_small ≈ copy(a4 .+ scalar_small) + @test t4 + scalar_large ≈ copy(a4 .+ scalar_large) t5 = zeros(Float64, dims) a5 = copy(t5, mx.cpu()) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t5 + scalar_small, copy(a5 .+ scalar_small)) < thresh - @test reldiff(t5 + scalar_large, copy(a5 .+ scalar_large)) < thresh + @test t5 + scalar_small ≈ copy(a5 .+ scalar_small) + @test t5 + scalar_large ≈ copy(a5 .+ scalar_large) t6 = zeros(Float16, dims) a6 = copy(t6, mx.cpu()) scalar_small = Float16(1e-5) scalar_large = Float16(1e4) - @test reldiff(t6 + scalar_small, copy(a6 .+ scalar_small)) < 1e-1 - @test reldiff(t6 + scalar_large, copy(a6 .+ scalar_large)) < 1e-1 + @test t6 + scalar_small ≈ copy(a6 .+ scalar_small) + @test t6 + scalar_large ≈ copy(a6 .+ scalar_large) let x = mx.NDArray([1 2; 3 4]), y = mx.NDArray([1 1; 1 1]) @test copy(42 .+ x) == [43 44; 45 46] @@ -206,51 +205,51 @@ function test_minus() dims = rand_dims() t1, a1 = rand_tensors(dims) t2, a2 = rand_tensors(dims) - thresh = 1e-6 info("NDArray::minus::dims = $dims") - @test reldiff(t1-t2, copy(a1-a2)) < thresh - @test reldiff(t1.-t2, copy(a1.-a2)) < thresh + @test t1 - t2 ≈ copy(a1 - a2) + @test t1 .- t2 ≈ copy(a1 .- a2) - @test reldiff(-t1, copy(-a1)) < thresh + @test -t1 ≈ copy(-a1) # 
make sure the negation is not in-place, so a1 is not changed after previous # statement is executed - @test reldiff(t1, copy(a1)) < thresh + @test t1 ≈ copy(a1) # test inplace -= operation a0 = a1 # keep a reference to a1 @mx.inplace a1 -= a2 # perform inplace -= @test a0 == a1 # make sure they are still the same object - @test reldiff(copy(a0), copy(a1)) < thresh - @test reldiff(copy(a1), t1-t2) < thresh + @test a0.handle == a1.handle + @test copy(a0) ≈ copy(a1) + @test copy(a1) ≈ t1 - t2 # test scalar scalar = rand() - @test reldiff(t2 - scalar, copy(a2 - scalar)) < thresh + @test t2 - scalar ≈ copy(a2 - scalar) # test small and large scalar t4 = zeros(Float32, dims) a4 = copy(t4, mx.cpu()) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t4 - scalar_small, copy(a4 .- scalar_small)) < thresh - @test reldiff(t4 - scalar_large, copy(a4 .- scalar_large)) < thresh + @test t4 - scalar_small ≈ copy(a4 .- scalar_small) + @test t4 - scalar_large ≈ copy(a4 .- scalar_large) t5 = zeros(Float64, dims) a5 = copy(t5, mx.cpu()) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t5 - scalar_small, copy(a5 .- scalar_small)) < thresh - @test reldiff(t5 - scalar_large, copy(a5 .- scalar_large)) < thresh + @test t5 - scalar_small ≈ copy(a5 .- scalar_small) + @test t5 - scalar_large ≈ copy(a5 .- scalar_large) t6 = zeros(Float16, dims) a6 = copy(t6, mx.cpu()) scalar_small = Float16(1e-5) scalar_large = Float16(1e4) - @test reldiff(t6 - scalar_small, copy(a6 .- scalar_small)) < 1e-1 - @test reldiff(t6 - scalar_large, copy(a6 .- scalar_large)) < 1e-1 + @test t6 - scalar_small ≈ copy(a6 .- scalar_small) + @test t6 - scalar_large ≈ copy(a6 .- scalar_large) end function test_mul() @@ -258,39 +257,39 @@ function test_mul() t1, a1 = rand_tensors(dims) t2, a2 = rand_tensors(dims) t3, a3 = rand_tensors(dims) - thresh = 1e-6 info("NDArray::mul::dims = $dims") - @test reldiff(t1.*t2, copy(a1.*a2)) < thresh + @test t1 .* t2 ≈ copy(a1.*a2) # test inplace .*= operation a0 = a1 # keep a 
reference to a1 @mx.inplace a1 .*= a2 # perform inplace .*= @test a0 == a1 # make sure they are still the same object - @test reldiff(copy(a0), copy(a1)) < thresh - @test reldiff(copy(a1), t1.*t2) < thresh + @test a0.handle == a1.handle + @test copy(a0) ≈ copy(a1) + @test copy(a1) ≈ t1 .* t2 # test scalar scalar = mx.MX_float(rand()) - @test reldiff(t3 * scalar, copy(a3 .* scalar)) < thresh + @test t3 * scalar ≈ copy(a3 .* scalar) # test small and large scalar t4, a4 = rand_tensors(Float32, dims) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t4 * scalar_small, copy(a4 .* scalar_small)) < thresh - @test reldiff(t4 * scalar_large, copy(a4 .* scalar_large)) < thresh + @test t4 * scalar_small ≈ copy(a4 .* scalar_small) + @test t4 * scalar_large ≈ copy(a4 .* scalar_large) t5, a5 = rand_tensors(Float64, dims) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t5 * scalar_small, copy(a5 .* scalar_small)) < thresh - @test reldiff(t5 * scalar_large, copy(a5 .* scalar_large)) < thresh + @test t5 * scalar_small ≈ copy(a5 .* scalar_small) + @test t5 * scalar_large ≈ copy(a5 .* scalar_large) t6, a6 = rand_tensors(Float16, dims) scalar_small = Float16(1e-5) - @test reldiff(t6 * scalar_small, copy(a6 .* scalar_small)) < 1e-1 + @test t6 * scalar_small ≈ copy(a6 .* scalar_small) info("NDArray::mul::matrix multiplication") let x = mx.NDArray([1. 
2]) @@ -309,41 +308,41 @@ function test_div() dims = rand_dims() t1, a1 = rand_tensors(dims) t2, a2 = rand_tensors(dims) - thresh = 1e-6 info("NDArray::div::dims = $dims") t2 .+= 2 # avoid numerical instability @mx.inplace a2 .+= 2 - @test reldiff(t1 ./ t2, copy(a1 ./ a2)) < thresh + @test t1 ./ t2 ≈ copy(a1 ./ a2) # test inplace -= operation a0 = a1 # keep a reference to a2 @mx.inplace a1 ./= a2 # perform inplace ./= @test a0 == a1 # make sure they are still the same object - @test reldiff(copy(a0), copy(a1)) < thresh - @test reldiff(copy(a1), t1 ./ t2) < thresh + @test a0.handle == a1.handle + @test copy(a0) ≈ copy(a1) + @test copy(a1) ≈ t1 ./ t2 # test scalar scalar = rand() + 2 - @test reldiff(t2 ./ scalar, copy(a2 ./ scalar)) < thresh + @test t2 ./ scalar ≈ copy(a2 ./ scalar) # test small and large scalar t4, a4 = rand_tensors(Float32, dims) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t4 ./ scalar_small, copy(a4 ./ scalar_small)) < thresh - @test reldiff(t4 ./ scalar_large, copy(a4 ./ scalar_large)) < thresh + @test t4 ./ scalar_small ≈ copy(a4 ./ scalar_small) + @test t4 ./ scalar_large ≈ copy(a4 ./ scalar_large) t5, a5 = rand_tensors(Float64, dims) scalar_small = 1e-8 scalar_large = 1e8 - @test reldiff(t5 ./ scalar_small, copy(a5 ./ scalar_small)) < thresh - @test reldiff(t5 ./ scalar_large, copy(a5 ./ scalar_large)) < thresh + @test t5 ./ scalar_small ≈ copy(a5 ./ scalar_small) + @test t5 ./ scalar_large ≈ copy(a5 ./ scalar_large) t6, a6 = rand_tensors(Float16, dims) scalar_large = 1e4 - @test reldiff(t6 ./ scalar_large, copy(a6 ./ scalar_large)) < 1e-1 + @test t6 ./ scalar_large ≈ copy(a6 ./ scalar_large) end @@ -373,7 +372,7 @@ function test_rdiv() info("NDarray::rdiv::Float32") let x = 1 ./ mx.NDArray(Float32[1 2; 3 4]) y = 1 ./ Float32[1 2; 3 4] - @test reldiff(copy(x), y) < 1e8 + @test copy(x) ≈ y end end # function test_rdiv @@ -390,7 +389,7 @@ function test_gd() @mx.inplace aw += -lr * (ag + wd * aw) tw += -lr * (tg + wd * tw) - @test 
reldiff(copy(aw), tw) < 1e-6 + @test copy(aw) ≈ tw end @@ -404,9 +403,9 @@ function test_saveload() j_array, nd_array = rand_tensors(dims) mx.save(fname, nd_array) data = mx.load(fname, mx.NDArray) - @test isa(data, Vector{mx.NDArray}) + @test data isa Vector{mx.NDArray} @test length(data) == 1 - @test reldiff(copy(data[1]), j_array) < 1e-6 + @test copy(data[1]) ≈ j_array # save and load N arrays of different shape arrays = [rand_tensors(rand_dims()) for i = 1:n_arrays] @@ -416,7 +415,7 @@ function test_saveload() @test isa(data, Vector{mx.NDArray}) @test length(data) == n_arrays for i = 1:n_arrays - @test reldiff(copy(data[i]), arrays[i][1]) < 1e-6 + @test copy(data[i]) ≈ arrays[i][1] end # save and load dictionary of ndarrays @@ -424,10 +423,10 @@ function test_saveload() dict = Dict([(n, v) for (n,v) in zip(names, nd_arrays)]) mx.save(fname, dict) data = mx.load(fname, mx.NDArray) - @test isa(data, Dict{Symbol, mx.NDArray}) + @test data isa Dict{Symbol, mx.NDArray} @test length(data) == n_arrays for i = 1:n_arrays - @test reldiff(copy(data[names[i]]), arrays[i][1]) < 1e-6 + @test copy(data[names[i]]) ≈ arrays[i][1] end rm(fname) @@ -443,14 +442,13 @@ function test_clip() clipped = mx.clip(nd_array, a_min=clip_down, a_max=clip_up) # make sure the original array is not modified - @test reldiff(copy(nd_array), j_array) < 1e-6 + @test copy(nd_array) ≈ j_array @test all(clip_down .<= copy(clipped) .<= clip_up) end function test_power() info("NDArray::power") - thresh = 1e8 info("NDArray::power::Int::x.^n") let x = mx.NDArray([1 2; 3 4]) @@ -491,9 +489,9 @@ function test_power() @test copy(x.^2) == Float32[1 4; 9 16] @test copy(x.^3) == Float32[1 8; 27 64] - @test reldiff(copy(x.^-1), A.^-1) < thresh - @test reldiff(copy(x.^1.1), A.^1.1) < thresh - @test reldiff(copy(x.^2.9), A.^2.9) < thresh + @test copy(x.^-1) ≈ A.^-1 + @test copy(x.^1.1) ≈ A.^1.1 + @test copy(x.^2.9) ≈ A.^2.9 end info("NDArray::power::Float32::n.^x") @@ -504,8 +502,8 @@ function test_power() @test 
copy(2.^x) == Float32[2 4; 8 16] @test copy(3.^x) == Float32[3 9; 27 81] - @test reldiff(copy(1.1.^x), 1.1.^A) < thresh - @test reldiff(copy(2.9.^x), 2.9.^A) < thresh + @test copy(1.1.^x) ≈ 1.1.^A + @test copy(2.9.^x) ≈ 2.9.^A end info("NDArray::power::Float32::x.^y") @@ -541,28 +539,28 @@ function test_sqrt() j_array, nd_array = rand_tensors(dims) sqrt_ed = sqrt(nd_array) - @test reldiff(copy(sqrt_ed), sqrt.(j_array)) < 1e-6 + @test copy(sqrt_ed) ≈ sqrt.(j_array) end function test_nd_as_jl() - dims = (2,3) + dims = (2, 3) info("NDArray::nd_as_jl::dims = $dims") x = mx.zeros(dims) + 5 y = mx.ones(dims) z = mx.zeros(dims) - @mx.nd_as_jl ro=x rw=(y,z) begin + @mx.nd_as_jl ro=x rw=(y, z) begin for i = 1:length(z) z[i] = x[i] end - z[:,1] = y[:,1] + z[:, 1] = y[:, 1] y[:] = 0 end - @test reldiff(copy(y), 0) < 1e-6 - @test reldiff(copy(z)[:,1], 1) < 1e-6 - @test reldiff(copy(z)[:,2:end], copy(x)[:,2:end]) < 1e-6 + @test sum(copy(y)) == 0 + @test sum(copy(z)[:, 1]) == 2 + @test copy(z)[:, 2:end] ≈ copy(x)[:, 2:end] end function test_dot() @@ -679,7 +677,6 @@ end function test_fill() info("NDArray::fill") - thresh = 1e8 let x = mx.fill(42, 2, 3, 4) @test eltype(x) == Int @@ -690,7 +687,7 @@ function test_fill() let x = mx.fill(Float32(42), 2, 3, 4) @test eltype(x) == Float32 @test size(x) == (2, 3, 4) - @test reldiff(copy(x), fill(Float32(42), 2, 3, 4)) < thresh + @test copy(x) ≈ fill(Float32(42), 2, 3, 4) end let x = mx.fill(42, (2, 3, 4)) @@ -702,7 +699,7 @@ function test_fill() let x = mx.fill(Float32(42), (2, 3, 4)) @test eltype(x) == Float32 @test size(x) == (2, 3, 4) - @test reldiff(copy(x), fill(Float32(42), 2, 3, 4)) < thresh + @test copy(x) ≈ fill(Float32(42), 2, 3, 4) end info("NDArray::fill!::arr") diff --git a/test/unittest/operator.jl b/test/unittest/operator.jl index 76e51f4403f5..85fc7c6238e9 100644 --- a/test/unittest/operator.jl +++ b/test/unittest/operator.jl @@ -1,8 +1,9 @@ module TestOperator + using MXNet using Base.Test -using ..Main: rand_dims, 
reldiff +using ..Main: rand_dims function test_scalar_op() data = mx.Variable(:data) @@ -19,13 +20,13 @@ function test_scalar_op() out = copy(exec_test.outputs[1]) jl_out1 = (4 - ((1+data_jl+1)*2/5) - 0.2) jl_out = 2 ./ jl_out1 - @test reldiff(copy(out), jl_out) < 1e-6 + @test copy(out) ≈ jl_out out_grad = 2mx.ones(shape) jl_grad = 2copy(out_grad) / 5 jl_grad = 2jl_grad ./ (jl_out1 .^ 2) mx.backward(exec_test, out_grad) - @test reldiff(copy(arr_grad), jl_grad) < 1e-6 + @test copy(arr_grad) ≈ jl_grad end ################################################################################ diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 39eda86b1bb2..baeb92a68e23 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -1,8 +1,9 @@ module TestSymbolicNode + using MXNet using Base.Test -using ..Main: mlp2, mlpchain, reldiff, exec +using ..Main: mlp2, mlpchain, exec ################################################################################ # Test Implementations @@ -233,12 +234,12 @@ function test_dot() y = mx.Variable(:y) z = mx.dot(x, y) z_exec = mx.bind(z, context=mx.cpu(), - args=Dict(:x=>mx.ones((100, 2)), :y=>mx.ones((2, 200)))) + args=Dict(:x => mx.ones((100, 2)), :y => mx.ones((2, 200)))) mx.forward(z_exec) ret = copy(z_exec.outputs[1]) @test size(ret) == (100, 200) - @test reldiff(ret, 2*ones(100, 200)) < 1e-6 + @test ret ≈ 2*ones(100, 200) end function test_print() @@ -253,7 +254,7 @@ function test_misc() # Test for #189 a = mx.Variable("a") b = mx.Variable("b") - symb = mx.ElementWiseSum(a,b) + symb = mx.ElementWiseSum(a, b) end function test_add() @@ -340,7 +341,7 @@ function test_minus() end # function test_minus function test_mul() - info("SymoblicNode::elementwise mul") + info("SymbolicNode::elementwise mul") let x = mx.Variable(:x), A = Float32[1 2; 3 4] let y = exec(x .* 42; :x => A)[] @test size(y) == size(A) @@ -379,7 +380,7 @@ function test_mul() end # function test_mul function 
test_div() - info("SymoblicNode::elementwise div") + info("SymbolicNode::elementwise div") let x = mx.Variable(:x), A = Float32[1 2; 3 4] let y = exec(x ./ 42; :x => A)[] @test size(y) == size(A) @@ -418,7 +419,7 @@ function test_div() end # function test_div function test_power() - info("SymoblicNode::elementwise power") + info("SymbolicNode::elementwise power") let x = mx.Variable(:x), A = Float32[1 2; 3 4] let y = exec(x.^42; :x => A)[] @test size(y) == size(A) From 526857e952963618bc8b6927871cecf1cf24a118 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 14 Nov 2017 02:09:57 +0800 Subject: [PATCH 546/630] docs: address docstring override warning (#320) Address this: ``` julia> using MXNet INFO: Recompiling stale cache file ~/.julia/lib/v0.6/MXNet.ji for module MXNet. WARNING: replacing docs for 'Base.:^ :: Union{}' in module 'MXNet.mx'. ``` --- src/ndarray.jl | 9 +-------- src/symbolic-node.jl | 2 +- 2 files changed, 2 insertions(+), 9 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 3e4cff5591d5..0b0e01a40e64 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -741,14 +741,7 @@ broadcast_(::typeof(/), x::Real, y::NDArray) = import Base: ^ -""" - .^(x::NDArray, y::NDArray) - .^(x::NDArray, s::Real) - .^(s::Real, x::NDArray) - -Elementwise power of `NDArray`. -""" -^ +# document of `.^` is merged into SymbolicNode's broadcast_(::typeof(^), x::NDArray, y::NDArray) = _power(x, y) broadcast_(::typeof(^), x::NDArray, s::Real) = _power_scalar(x, scalar=s) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 72eb60b3a8c0..bbe2d1874846 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -579,7 +579,7 @@ import Base: ^ """ .^(x, y) -Elementwise power of `SymbolicNode`. +Elementwise power of `SymbolicNode` and `NDArray`. Operating with `Real` is available. 
""" ^ From 80711865a2d721c9fe8d571a5cbc0a393eeb94d5 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 14 Nov 2017 02:14:10 +0800 Subject: [PATCH 547/630] travis: enable 'build branch updates' on master/stable only (#319) --- .travis.yml | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/.travis.yml b/.travis.yml index 734de9e1eff9..a91994db2fc1 100644 --- a/.travis.yml +++ b/.travis.yml @@ -9,6 +9,12 @@ julia: - 0.6 # - nightly 0.6 supports depends on #170 +branches: + only: + - master + - stable + - /^v\d+\.\d+(\.\d+)?(-\S*)?$/ # for tagging + # dependent apt packages addons: apt: From e4b6c0ebc202789afc62826d224a5cc9a5d42db1 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 14 Nov 2017 02:17:25 +0800 Subject: [PATCH 548/630] docs: update examples in overview (#317) * docs: update examples in overview close #286 * docs: add Makefile --- docs/Makefile | 3 + docs/src/index.md | 32 +++++- docs/src/user-guide/install.md | 16 +-- docs/src/user-guide/overview.md | 192 +++++++++++++++----------------- 4 files changed, 128 insertions(+), 115 deletions(-) create mode 100644 docs/Makefile diff --git a/docs/Makefile b/docs/Makefile new file mode 100644 index 000000000000..d1cadf2e487b --- /dev/null +++ b/docs/Makefile @@ -0,0 +1,3 @@ +all: + julia --color=yes ./make.jl + mkdocs build diff --git a/docs/src/index.md b/docs/src/index.md index a41b77478631..b6a51fc162ad 100644 --- a/docs/src/index.md +++ b/docs/src/index.md @@ -6,8 +6,10 @@ computing and state-of-art deep learning to Julia. Some highlight of features include: -* Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. -* Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. +* Efficient tensor/matrix computation across multiple devices, + including multiple CPUs, GPUs and distributed server nodes. +* Flexible symbolic manipulation to composite and construct + state-of-the-art deep learning models. 
For more details, see documentation below. Please also checkout the [examples](https://github.com/dmlc/MXNet.jl/tree/master/examples) directory. @@ -15,19 +17,39 @@ For more details, see documentation below. Please also checkout the ## Tutorials ```@contents -Pages = ["tutorial/mnist.md", "tutorial/char-lstm.md"] +Pages = [ + "tutorial/mnist.md", + "tutorial/char-lstm.md", +] Depth = 2 ``` ## User's Guide ```@contents -Pages = ["user-guide/install.md", "user-guide/overview.md", "user-guide/faq.md"] +Pages = [ + "user-guide/install.md", + "user-guide/overview.md", + "user-guide/faq.md", +] Depth = 2 ``` ## API Documentation ```@contents -Pages = ["api/context.md", "api/model.md", "api/initializers.md", "api/optimizers.md", "api/callbacks.md", "api/metric.md", "api/io.md", "api/ndarray.md", "api/symbolic-node.md", "api/nn-factory.md", "api/executor.md", "api/visualize.md"] +Pages = [ + "api/context.md", + "api/ndarray.md", + "api/symbolic-node.md", + "api/model.md", + "api/initializers.md", + "api/optimizers.md", + "api/callbacks.md", + "api/metric.md", + "api/io.md", + "api/nn-factory.md", + "api/executor.md", + "api/visualize.md", +] ``` diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md index a585b4409c6d..30ed65d48511 100644 --- a/docs/src/user-guide/install.md +++ b/docs/src/user-guide/install.md @@ -10,7 +10,7 @@ To install MXNet.jl, simply type Pkg.add("MXNet") ``` -in the Julia REPL. Or to use the latest git version of MXNet.jl, use the +In the Julia REPL. Or to use the latest git version of MXNet.jl, use the following command instead ```julia @@ -27,9 +27,9 @@ to point the build-process in the right direction. If the automatic cuda detection fails you can also set `CUDA_HOME` to override the process. To control which version of libmxnet will be compiled, you can use the `MXNET_COMMIT` variable to point to either a version tag (e.g. `v0.10.0`), a -branch name (e.g. `master`) or a specific commit hash (e.g. `a0b1c2d3`). 
+branch name (e.g. `master`) or a specific commit hash (e.g. `a0b1c2d3`). -The libmxnet source is downloaded to `Pkg.dir("MXNet")/deps/src/mxnet`. +The libmxnet source is downloaded to `Pkg.dir("MXNet", "deps", "src", "mxnet")`. The automatic build is using default configurations, with OpenCV disabled. If the compilation failed due to unresolved dependency, or if you want to customize the build, you can compile and @@ -39,12 +39,12 @@ Manual Compilation ------------------ It is possible to compile libmxnet separately and point MXNet.jl to a -the existing library in case automatic compilation fails due to -unresolved dependencies in an un-standard environment; Or when one want -to work with a seperate, maybe customized libmxnet. +existing library in case automatic compilation fails due to +unresolved dependencies in a non-standard environment; or when one wants +to work with a separate, maybe customized libmxnet. To build libmxnet, please refer to [the installation guide of -libmxnet](http://mxnet.readthedocs.org/en/latest/build.html). After +libmxnet](https://mxnet.incubator.apache.org/install/index.html). After successfully installing libmxnet, set the `MXNET_HOME` *environment variable* to the location of libmxnet. In other words, the compiled `libmxnet.so` should be found in `$MXNET_HOME/lib`. 
@@ -65,7 +65,7 @@ Basically, MXNet.jl will search `libmxnet.so` or `libmxnet.dll` in the following paths (and in that order): - `$MXNET_HOME/lib`: customized libmxnet builds -- `Pkg.dir("MXNet")/deps/usr/lib`: automatic builds +- `Pkg.dir("MXNet", "deps", "usr", "lib")`: automatic builds - Any system wide library search path Note that MXNet.jl can not load `libmxnet.so` even if it is on one of diff --git a/docs/src/user-guide/overview.md b/docs/src/user-guide/overview.md index 9a7d8e514894..d1948220a3cf 100644 --- a/docs/src/user-guide/overview.md +++ b/docs/src/user-guide/overview.md @@ -1,8 +1,6 @@ -Overview -======== +# Overview -MXNet.jl Namespace ------------------- +## MXNet.jl Namespace Most the functions and types in MXNet.jl are organized in a flat namespace. Because many some functions are conflicting with existing @@ -11,13 +9,32 @@ convention of accessing the MXNet.jl interface is the to use the `mx.` prefix explicitly: ```julia -using MXNet - -x = mx.zeros(2,3) # MXNet NDArray -y = zeros(eltype(x), size(x)) # Julia Array -copy!(y, x) # Overloaded function in Julia Base -z = mx.ones(size(x), mx.gpu()) # MXNet NDArray on GPU -mx.copy!(z, y) # Same as copy!(z, y) +julia> using MXNet + +julia> x = mx.zeros(2,3) # MXNet NDArray +2×3 mx.NDArray{Float32} @ CPU0: + 0.0 0.0 0.0 + 0.0 0.0 0.0 + +julia> y = zeros(eltype(x), size(x)) # Julia Array +2×3 Array{Float32,2}: + 0.0 0.0 0.0 + 0.0 0.0 0.0 + +julia> copy!(y, x) # Overloaded function in Julia Base +2×3 Array{Float32,2}: + 0.0 0.0 0.0 + 0.0 0.0 0.0 + +julia> z = mx.ones(size(x), mx.gpu()) # MXNet NDArray on GPU +2×3 mx.NDArray{Float32} @ GPU0: + 1.0 1.0 1.0 + 1.0 1.0 1.0 + +julia> mx.copy!(z, y) # Same as copy!(z, y) +2×3 mx.NDArray{Float32} @ GPU0: + 0.0 0.0 0.0 + 0.0 0.0 0.0 ``` Note functions like `size`, `copy!` that is extensively overloaded for @@ -26,24 +43,23 @@ various types works out of the box. 
But functions like `zeros` and prefer, the `mx.` prefix can be used explicitly for all MXNet.jl functions, including `size` and `copy!` as shown in the last line. -Low Level Interface -------------------- +## Low Level Interface -### NDArrays +### `NDArray` -NDArray is the basic building blocks of the actual computations in +`NDArray` is the basic building blocks of the actual computations in MXNet. It is like a Julia `Array` object, with some important differences listed here: - The actual data could live on different `Context` (e.g. GPUs). For some contexts, iterating into the elements one by one is very slow, - thus indexing into NDArray is not supported in general. The easiest + thus indexing into NDArray is not recommanded in general. The easiest way to inspect the contents of an NDArray is to use the `copy` function to copy the contents as a Julia `Array`. -- Operations on NDArray (including basic arithmetics and neural +- Operations on `NDArray` (including basic arithmetics and neural network related operators) are executed in parallel with automatic dependency tracking to ensure correctness. -- There is no generics in NDArray, the `eltype` is always +- There is no generics in `NDArray`, the `eltype` is always `mx.MX_float`. Because for applications in machine learning, single precision floating point numbers are typical a best choice balancing between precision, speed and portability. Also since libmxnet is @@ -52,14 +68,14 @@ differences listed here: While most of the computation is hidden in libmxnet by operators corresponding to various neural network layers. Getting familiar with -the NDArray API is useful for implementing `Optimizer` or customized +the `NDArray` API is useful for implementing `Optimizer` or customized operators in Julia directly. 
-The followings are common ways to create NDArray objects: +The followings are common ways to create `NDArray` objects: - `mx.empty(shape[, context])`: create on uninitialized array of a given shape on a specific device. For example, - ` mx.empty(2,3)`, `mx.((2,3), mx.gpu(2)) `. + `mx.empty(2,3)`, `mx.((2,3), mx.gpu(2))`. - `mx.zeros(shape[, context])` and `mx.ones(shape[, context])`: similar to the Julia's built-in `zeros` and `ones`. - `mx.copy(jl_arr, context)`: copy the contents of a Julia `Array` to @@ -80,11 +96,13 @@ println(copy(a)) ``` A slice is a sub-region sharing the same memory with the original -NDArray object. A slice is always a contiguous piece of memory, so only +`NDArray` object. A slice is always a contiguous piece of memory, so only slicing on the *last* dimension is supported. The example above also -shows a way to set the contents of an NDArray. +shows a way to set the contents of an `NDArray`. -```julia +```@repl +using MXNet +mx.srand(42) a = mx.empty(2,3) a[:] = 0.5 # set all elements to a scalar a[:] = rand(size(a)) # set contents with a Julia Array @@ -101,39 +119,37 @@ a = b ``` does **not** mean copying the contents of `b` to `a`. Instead, it just -make the variable `a` pointing to a new object, which is `b`. Similarly, -inplace arithmetics does not work as expected: +make the variable `a` pointing to a new object, which is `b`. +Similarly, inplace arithmetics does not work as expected: -```julia +```@repl inplace-macro +using MXNet a = mx.ones(2) r = a # keep a reference to a b = mx.ones(2) a += b # translates to a = a + b -println(copy(a)) -# => Float32[2.0f0,2.0f0] -println(copy(r)) -# => Float32[1.0f0,1.0f0] +a +r ``` As we can see, `a` has expected value, but instead of inplace updating, -a new NDArray is created and `a` is set to point to this new object. If +a new `NDArray` is created and `a` is set to point to this new object. If we look at `r`, which still reference to the old `a`, its content has not changed. 
There is currently no way in Julia to overload the operators like `+=` to get customized behavior. -Instead, you will need to write `a[:] = a+b`, or if you want *real* +Instead, you will need to write `a[:] = a + b`, or if you want *real* inplace `+=` operation, MXNet.jl provides a simple macro `@mx.inplace`: -```julia +```@repl inplace-macro @mx.inplace a += b macroexpand(:(@mx.inplace a += b)) -# => :(MXNet.mx.add_to!(a,b)) ``` As we can see, it translate the `+=` operator to an explicit `add_to!` function call, which invokes into libmxnet to add the contents of `b` into `a` directly. For example, the following is the update rule in the -SGD `Optimizer` (both `grad` and `weight` are NDArray objects): +`SGD Optimizer` (both `grad` and `weight` are `NDArray` objects): ```julia @inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) @@ -142,10 +158,10 @@ SGD `Optimizer` (both `grad` and `weight` are NDArray objects): Note there is no much magic in `mx.inplace`: it only does a shallow translation. In the SGD update rule example above, the computation like scaling the gradient by `grad_scale` and adding the weight decay all -create temporary NDArray objects. To mitigate this issue, libmxnet has a +create temporary `NDArray` objects. To mitigate this issue, libmxnet has a customized memory allocator designed specifically to handle this kind of situations. The following snippet does a simple benchmark on allocating -temp NDArray vs. pre-allocating: +temp `NDArray` vs. pre-allocating: ```julia using Benchmark @@ -224,24 +240,24 @@ println(copy(a)) # 2.0 2.0 2.0] ``` -Intermediate Level Interface ----------------------------- +## Intermediate Level Interface ### Symbols and Composition The way we build deep learning models in MXNet.jl is to use the powerful symbolic composition system. 
It is like [Theano](http://deeplearning.net/software/theano/), except that we -avoided long expression compiliation time by providing *larger* neural +avoided long expression compilation time by providing *larger* neural network related building blocks to guarantee computation performance. See also [this note](http://mxnet.readthedocs.org/en/latest/program_model.html) for the design and trade-off of the MXNet symbolic composition system. -The basic type is `mx.Symbol`. The following is a trivial example of +The basic type is `mx.SymbolicNode`. The following is a trivial example of composing two symbols with the `+` operation. -```julia +```@repl +using MXNet A = mx.Variable(:A) B = mx.Variable(:B) C = A + B @@ -253,12 +269,13 @@ be realized by recursive composition. For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of 128 units and a ReLU activation function. -```julia +```@repl fcnet +using MXNet net = mx.Variable(:data) -net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) -net = mx.Activation(data=net, name=:relu1, act_type=:relu) -net = mx.FullyConnected(data=net, name=:fc2, num_hidden=64) -net = mx.Softmax(data=net, name=:out) +net = mx.FullyConnected(net, name=:fc1, num_hidden=128) +net = mx.Activation(net, name=:relu1, act_type=:relu) +net = mx.FullyConnected(net, name=:fc2, num_hidden=64) +net = mx.SoftmaxOutput(net, name=:out) ``` Each time we take the previous symbol, and compose with an operation. @@ -284,55 +301,33 @@ the networks, while *parameters* are typically trainable *weights*, When composing symbols, their arguments accumulates. 
We can list all the arguments by -```julia -julia> mx.list_arguments(net) -6-element Array{Symbol,1}: - :data # Input data, name from the first data variable - :fc1_weight # Weights of the fully connected layer named :fc1 - :fc1_bias # Bias of the layer :fc1 - :fc2_weight # Weights of the layer :fc2 - :fc2_bias # Bias of the layer :fc2 - :out_label # Input label, required by the softmax layer named :out +```@repl fcnet +mx.list_arguments(net) ``` Note the names of the arguments are generated according to the provided name for each layer. We can also specify those names explicitly: -```julia +```@repl +using MXNet net = mx.Variable(:data) w = mx.Variable(:myweight) -net = mx.FullyConnected(data=data, weight=w, name=:fc1, num_hidden=128) +net = mx.FullyConnected(data, weight=w, name=:fc1, num_hidden=128) mx.list_arguments(net) -# => -# 3-element Array{Symbol,1}: -# :data -# :myweight -# :fc1_bias ``` -The simple fact is that a `Variable` is just a placeholder `mx.Symbol`. +The simple fact is that a `Variable` is just a placeholder `mx.SymbolicNode`. In composition, we can use arbitrary symbols for arguments. For example: -```julia +```@repl +using MXNet net = mx.Variable(:data) -net = mx.FullyConnected(data=net, name=:fc1, num_hidden=128) +net = mx.FullyConnected(net, name=:fc1, num_hidden=128) net2 = mx.Variable(:data2) -net2 = mx.FullyConnected(data=net2, name=:net2, num_hidden=128) +net2 = mx.FullyConnected(net2, name=:net2, num_hidden=128) mx.list_arguments(net2) -# => -# 3-element Array{Symbol,1}: -# :data2 -# :net2_weight -# :net2_bias composed_net = net2(data2=net, name=:composed) mx.list_arguments(composed_net) -# => -# 5-element Array{Symbol,1}: -# :data -# :fc1_weight -# :fc1_bias -# :net2_weight -# :net2_bias ``` Note we use a composed symbol, `net` as the argument `data2` for `net2` @@ -347,9 +342,10 @@ symbol could be inferred automatically. 
For example, given the input shape, and some hyper-parameters like `num_hidden`, the shapes for the weights and bias in a neural network could be inferred. -```julia +```@repl infer-shape +using MXNet net = mx.Variable(:data) -net = mx.FullyConnected(data=net, name=:fc1, num_hidden=10) +net = mx.FullyConnected(net, name=:fc1, num_hidden=10) arg_shapes, out_shapes, aux_shapes = mx.infer_shape(net, data=(10, 64)) ``` @@ -357,19 +353,15 @@ The returned shapes corresponds to arguments with the same order as returned by `mx.list_arguments`. The `out_shapes` are shapes for outputs, and `aux_shapes` can be safely ignored for now. -```julia -for (n,s) in zip(mx.list_arguments(net), arg_shapes) - println("$n => $s") +```@repl infer-shape +for (n, s) in zip(mx.list_arguments(net), arg_shapes) + println("$n\t=> $s") end -# => -# data => (10,64) -# fc1_weight => (10,10) -# fc1_bias => (10,) -for (n,s) in zip(mx.list_outputs(net), out_shapes) - println("$n => $s") +``` +```@repl infer-shape +for (n, s) in zip(mx.list_outputs(net), out_shapes) + println("$n\t=> $s") end -# => -# fc1_output => (10,64) ``` ### Binding and Executing @@ -381,21 +373,18 @@ A context describes the computation devices (CPUs, GPUs, etc.) and an executor will carry out the computation (forward/backward) specified in the corresponding symbolic composition. -```julia +```@repl +using MXNet A = mx.Variable(:A) B = mx.Variable(:B) C = A .* B a = mx.ones(3) * 4 b = mx.ones(3) * 2 -c_exec = mx.bind(C, context=mx.cpu(), args=Dict(:A => a, :B => b)) +c_exec = mx.bind(C, context=mx.cpu(), args=Dict(:A => a, :B => b)); mx.forward(c_exec) +c_exec.outputs[1] copy(c_exec.outputs[1]) # copy turns NDArray into Julia Array -# => -# 3-element Array{Float32,1}: -# 8.0 -# 8.0 -# 8.0 ``` For neural networks, it is easier to use `simple_bind`. By providing the @@ -406,7 +395,6 @@ the binding and executing steps are hidden under the `Model` interface. 
**TODO** Provide pointers to model tutorial and further details about binding and symbolic API. -High Level Interface --------------------- +## High Level Interface The high level interface include model training and prediction API, etc. From a51d9b5ebadaf57d3f54df908e02f663e4935808 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 15 Nov 2017 00:09:41 +0800 Subject: [PATCH 549/630] docs: fix more example rendering in overview (#322) --- docs/src/user-guide/overview.md | 43 +++++++++++++++++++-------------- 1 file changed, 25 insertions(+), 18 deletions(-) diff --git a/docs/src/user-guide/overview.md b/docs/src/user-guide/overview.md index d1948220a3cf..a767643a3735 100644 --- a/docs/src/user-guide/overview.md +++ b/docs/src/user-guide/overview.md @@ -85,14 +85,12 @@ Most of the convenient functions like `size`, `length`, `ndims`, `eltype` on array objects should work out-of-the-box. Although indexing is not supported, it is possible to take *slices*: -```julia +```@repl +using MXNet a = mx.ones(2,3) b = mx.slice(a, 1:2) b[:] = 2 -println(copy(a)) -# => -# Float32[2.0 2.0 1.0 -# 2.0 2.0 1.0] +a ``` A slice is a sub-region sharing the same memory with the original @@ -226,18 +224,19 @@ push. The following example shows how to create a local `KVStore`, initialize a value and then pull it back. -```julia +```@setup kv +using MXNet +``` + +```@example kv kv = mx.KVStore(:local) -shape = (2,3) +shape = (2, 3) key = 3 -mx.init!(kv, key, mx.ones(shape)*2) +mx.init!(kv, key, mx.ones(shape) * 2) a = mx.empty(shape) mx.pull!(kv, key, a) # pull value into a -println(copy(a)) -# => -# Float32[2.0 2.0 2.0 -# 2.0 2.0 2.0] +a ``` ## Intermediate Level Interface @@ -256,26 +255,34 @@ design and trade-off of the MXNet symbolic composition system. The basic type is `mx.SymbolicNode`. The following is a trivial example of composing two symbols with the `+` operation. 
-```@repl +```@setup sym1 using MXNet +``` + +```@example sym1 A = mx.Variable(:A) B = mx.Variable(:B) C = A + B +print(C) # debug printing ``` -We get a new *symbol* by composing existing *symbols* by some +We get a new `SymbolicNode` by composing existing `SymbolicNode`s by some *operations*. A hierarchical architecture of a deep neural network could be realized by recursive composition. For example, the following code snippet shows a simple 2-layer MLP construction, using a hidden layer of -128 units and a ReLU activation function. +128 units and a `ReLU` activation function. -```@repl fcnet +```@setup fcnet using MXNet +``` + +```@example fcnet net = mx.Variable(:data) net = mx.FullyConnected(net, name=:fc1, num_hidden=128) net = mx.Activation(net, name=:relu1, act_type=:relu) net = mx.FullyConnected(net, name=:fc2, num_hidden=64) net = mx.SoftmaxOutput(net, name=:out) +print(net) # debug printing ``` Each time we take the previous symbol, and compose with an operation. @@ -301,7 +308,7 @@ the networks, while *parameters* are typically trainable *weights*, When composing symbols, their arguments accumulates. We can list all the arguments by -```@repl fcnet +```@example fcnet mx.list_arguments(net) ``` @@ -312,7 +319,7 @@ name for each layer. 
We can also specify those names explicitly: using MXNet net = mx.Variable(:data) w = mx.Variable(:myweight) -net = mx.FullyConnected(data, weight=w, name=:fc1, num_hidden=128) +net = mx.FullyConnected(net, weight=w, name=:fc1, num_hidden=128) mx.list_arguments(net) ``` From 73b856bcb17f83a189aaee65f22ae0be001cc34c Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 16 Nov 2017 02:53:00 +0800 Subject: [PATCH 550/630] Update README badge (#324) [ci skip] --- README.md | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 624b04206a48..c6600cdc9fd5 100644 --- a/README.md +++ b/README.md @@ -4,9 +4,10 @@ [![Windows Build](https://ci.appveyor.com/api/projects/status/re90njols2th2ide?svg=true)](https://ci.appveyor.com/project/pluskid/mxnet-jl) [![codecov.io](https://codecov.io/github/dmlc/MXNet.jl/coverage.svg?branch=master)](https://codecov.io/github/dmlc/MXNet.jl?branch=master) [![](https://img.shields.io/badge/docs-latest-blue.svg)](https://dmlc.github.io/MXNet.jl/latest) -[![MXNet](http://pkg.julialang.org/badges/MXNet_0.4.svg)](http://pkg.julialang.org/?pkg=MXNet) +[![](https://img.shields.io/badge/docs-stable-blue.svg)](https://dmlc.github.io/MXNet.jl/stable) +[![MXNet](http://pkg.julialang.org/badges/MXNet_0.6.svg)](http://pkg.julialang.org/?pkg=MXNet) [![License](http://dmlc.github.io/img/apache2.svg)](LICENSE.md) -[![Join the chat at https://gitter.im/dmlc/mxnet](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/dmlc/mxnet?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge) +[![Join the chat at https://gitter.im/dmlc/mxnet](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/dmlc/mxnet) MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. 
Some highlight of its features include: From 1dfb5b3693a51cccf3f78c5a037abf64eba67ffc Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 16 Nov 2017 08:48:17 +0800 Subject: [PATCH 551/630] Cut a release for mxnet v0.12.0 (#304) * prepare for releasing * build: fix windows build * update NEWS for #314 * update NEWS for #312 * update NEWS for #276 --- NEWS.md | 99 ++++++++++++++++++++++++++++++++++++++------------- deps/build.jl | 20 ++++++----- 2 files changed, 86 insertions(+), 33 deletions(-) diff --git a/NEWS.md b/NEWS.md index fcd48dc3f81e..c481c0598820 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,19 +1,31 @@ # v0.3.0 (TBD) -* Drop 0.5 support. (#TBD) +* Update `libmxnet` to v0.12.0. + (See https://github.com/apache/incubator-mxnet/releases/tag/0.12.0) + +* Drop 0.5 support. ([#300][300]) ## New API -* `deepcopy` for NDArray (#273) -* `scalar ./ NDArray` is available now. (#292) -* `fill` and `fill!` for NDArray (#TBD) +### `SymbolicNode` + +* Debugging print support. ([#276][276]) + +### `NDArray` + +* `deepcopy` for `NDArray` ([#273][273]) + +* `scalar ./ NDArray` is available now. ([#292][292]) + +* `fill` and `fill!` for `NDArray`. ([#297][297], [#311][311]) + An API correspond to Python's `mx.nd.full()` * `fill(x, dims, ctx=cpu())` * `fill(x, dims...)` * `fill!(arr::NDArray, x)` -* Matrix (2D NDArray) multiplication is available now. (#TBD) +* Matrix (2D `NDArray`) multiplication is available now. ([#300][300]) ```julia julia> x @@ -26,7 +38,8 @@ 2.0 4.0 ``` -* `NDArray` `getindex`/`setindex!` linear indexing support and `first` for extracting scalar value. (#TBD) +* `NDArray` `getindex`/`setindex!` linear indexing support and `first` for + extracting scalar value. ([#294][294]) ```julia julia> x = mx.zeros(2, 5) @@ -45,61 +58,99 @@ julia> y[] # this is available, also 42.0f0 ``` -* Elementwise power of `NDArray`. (#293) +* Elementwise power of `NDArray`. ([#293][293]) + * `x.^2` * `2.^x` * `x.^y` * where `x` and `y` are `NDArray`s. 
-* Elementwise power of irrational and `NDArray` (#TBD) +* Elementwise power of irrational and `NDArray`. ([#310][310]) + * `e.^x` * `x.^e` * `π.^x` ## API Changes -* `reshape` of NDArray shares the same interface with Base (#272). - * `reshape(NDArray, dim; reverse=false)` - * `reshape(NDArray, dim...; reverse=false)` - * `Reshape` deprecated. +### `SymbolicNode` -* `reshape` of SymbolicNode shares the same interface with Base - and additional keyword argument (#279). +* `reshape` of `SymbolicNode` shares the same interface with Base + and additional keyword argument. ([#279][279]) * `reshape(SymbolicNode, dim; reverse=false, name)` * `reshape(SymbolicNode, dim...; reverse=false, name)` - * `Reshape` deprecated. + * `Reshape` is deprecated. + +* `mx.forward(x)` will return `x.outputs` now. ([#312][312]) -* `srand!` deprecated, please use `srand` (#282) +### `NDArray` -* `mean` and `sum` of NDArray share the same interface with Base - and fix the `axis` indexing (#TBD). +* `reshape` of `NDArray` shares the same interface with Base. ([#272][272]) + + * `reshape(NDArray, dim; reverse=false)` + * `reshape(NDArray, dim...; reverse=false)` + * `Reshape` is deprecated. + +* `srand!` deprecated, please use `srand`. ([#282][282]) + +* `mean` and `sum` of `NDArray` share the same interface with Base + and fix the `axis` indexing. ([#303][303]) * This is a breaking change; no deprecated warning. * Before: `mean(arr, axis=0)` * After: `mean(arr, 1)` -* `max` and `min` of NDArray renamed to `maximum` and `minimum` and share the - same interface with Base. The `axis` indexing is fixed, also. (#TBD) +* `max` and `min` of `NDArray` renamed to `maximum` and `minimum` and share the + same interface with Base. The `axis` indexing is fixed, also. ([#303][303]) * This is a breaking change; no deprecated warning. 
* Before: `mx.max(arr, axis=0)` or `mx.max_axis(arr, axis=0)` * After: `maximum(arr, 1)` -* `mx.transpose` for high dimension NDArray has been renamed to `permutedims` - and shares the same interface with Base. (#TBD) +* `mx.transpose` for high dimension `NDArray` has been renamed to `permutedims` + and shares the same interface with Base. ([#303][303]) * This is a breaking changes; no deprecated warning. * Before: `mx.transpose(A, axis=[2, 1, 3])` * After: `permutedims(A, [2, 1, 3])` -* `prod` of `NDArray` shares the same interface with Base and fix - the `axis` indexing. (#TBD). +* `prod` of `NDArray` shares the same interface with Base and fix the `axis` + indexing. ([#303][303]) * This is a breaking change; no deprecated warning. * Before: `prod(arr, axis=-1)` * After: `prod(arr, 1)` +## Bugfix + +* Broadcasting operation on same variable is back. ([#300][300], [#314][314]) + ```julia + x = mx.NDArray(...) + x .* x + ``` + + ```julia + y = mx.Variable(:y) + y .* y + ``` + +[272]: https://github.com/dmlc/MXNet.jl/pull/272 +[273]: https://github.com/dmlc/MXNet.jl/pull/273 +[276]: https://github.com/dmlc/MXNet.jl/pull/276 +[279]: https://github.com/dmlc/MXNet.jl/pull/279 +[282]: https://github.com/dmlc/MXNet.jl/pull/282 +[292]: https://github.com/dmlc/MXNet.jl/pull/292 +[293]: https://github.com/dmlc/MXNet.jl/pull/293 +[294]: https://github.com/dmlc/MXNet.jl/pull/294 +[297]: https://github.com/dmlc/MXNet.jl/pull/297 +[300]: https://github.com/dmlc/MXNet.jl/pull/300 +[303]: https://github.com/dmlc/MXNet.jl/pull/303 +[310]: https://github.com/dmlc/MXNet.jl/pull/310 +[311]: https://github.com/dmlc/MXNet.jl/pull/311 +[312]: https://github.com/dmlc/MXNet.jl/pull/312 +[314]: https://github.com/dmlc/MXNet.jl/pull/314 + # v0.2.2 (2017.05.14) * Updated supported version of MXNet to 0.9.4. * Improved build-system with support for auto-detecting GPU support. 
diff --git a/deps/build.jl b/deps/build.jl index c1463da5c04f..619196628bf5 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -5,8 +5,8 @@ import JSON # First try to detect and load existing libmxnet ################################################################################ libmxnet_detected = false -libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "master") -curr_win = "20170819" +libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "0.12.0") +curr_win = "20171019" # v0.12.0 if haskey(ENV, "MXNET_HOME") info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") @@ -85,7 +85,7 @@ if !libmxnet_detected return end info("Downloading pre-built packages for Windows.") - base_url = "https://github.com/yajiedesign/mxnet/releases/download/weekly_binary_build/prebuildbase_win10_x64_vc14.7z" + base_url = "https://github.com/yajiedesign/mxnet/releases/download/weekly_binary_build_v2/prebuildbase_win10_x64_vc14_v2.7z" if libmxnet_curr_ver == "master" # download_cmd uses powershell 2, but we need powershell 3 to do this @@ -99,15 +99,17 @@ if !libmxnet_detected exe7z = joinpath(JULIA_HOME, "7z.exe") - run(download_cmd(base_url, "mxnet_base.7z")) - run(`$exe7z x mxnet_base.7z -y -ousr`) - run(`cmd /c copy "usr\\3rdparty\\openblas\\bin\\*.dll" "usr\\lib"`) - run(`cmd /c copy "usr\\3rdparty\\opencv\\*.dll" "usr\\lib"`) - run(download_cmd(package_url, "mxnet.7z")) - run(`$exe7z x mxnet.7z -y -ousr`) + # this command will create the dir "usr\\lib" + run(`$exe7z x mxnet.7z build lib -y -ousr`) run(`cmd /c copy "usr\\build\\*.dll" "usr\\lib"`) + run(download_cmd(base_url, "mxnet_base.7z")) + run(`$exe7z x mxnet_base.7z -y -ousr`) + run(`cmd /c copy "usr\\prebuildbase_win10_x64_vc14_v2\\3rdparty\\bin\\*.dll" "usr\\lib"`) + + # testing + run(`cmd /c dir "usr\\lib"`) return end From b56c44ee4564201d99f0d5a8227375d03c093d4e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 16 Nov 2017 21:22:41 +0800 Subject: [PATCH 552/630] Bump upstream to v0.12.1 (#326) --- NEWS.md | 10 +++++++--- 
deps/build.jl | 3 ++- 2 files changed, 9 insertions(+), 4 deletions(-) diff --git a/NEWS.md b/NEWS.md index c481c0598820..0cea0db56359 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,7 +1,11 @@ -# v0.3.0 (TBD) +# v0.3.0 (2017.11.16) -* Update `libmxnet` to v0.12.0. - (See https://github.com/apache/incubator-mxnet/releases/tag/0.12.0) +* Update `libmxnet` to + * On Windows: v0.12.0. + (See https://github.com/apache/incubator-mxnet/releases/tag/0.12.0) + + * On Linux/macOS: v0.12.1. + (See https://github.com/apache/incubator-mxnet/releases/tag/0.12.1) * Drop 0.5 support. ([#300][300]) diff --git a/deps/build.jl b/deps/build.jl index 619196628bf5..522ceed5ff23 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -5,7 +5,7 @@ import JSON # First try to detect and load existing libmxnet ################################################################################ libmxnet_detected = false -libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "0.12.0") +libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "0.12.1") curr_win = "20171019" # v0.12.0 if haskey(ENV, "MXNET_HOME") @@ -139,6 +139,7 @@ if !libmxnet_detected USE_JULIA_BLAS = true FORCE_LAPACK = true end + info("USE_JULIA_BLAS -> $USE_JULIA_BLAS") blas_name = blas_vendor == :openblas64 ? "openblas" : string(blas_vendor) MSHADOW_LDFLAGS = "MSHADOW_LDFLAGS=-lm $blas_path" From 9efedbccc098a3b1eb1288ba6e51b61d8d3e169b Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 17 Nov 2017 00:30:11 +0800 Subject: [PATCH 553/630] Update releasing note (#327) --- README-DEV.md | 11 +++++++---- 1 file changed, 7 insertions(+), 4 deletions(-) diff --git a/README-DEV.md b/README-DEV.md index b148fde3d5c7..a1d6fa9012fc 100644 --- a/README-DEV.md +++ b/README-DEV.md @@ -4,7 +4,10 @@ 2. Check out the `stable` branch, merge with `master`. 3. Update `libmxnet_curr_ver` in `deps/build.jl` to the latest commit SHA (or any proper reference). Using `master` here is not good because future changes in libmxnet might break existing Julia packages. 4. Run tests. -5. 
Commit changes and push. -6. Run `Pkg.tag("MXNet")` in Julia. -7. Run `Pkg.publish()`, which will open a browser for making a pull request to METADATA.jl. -8. Edit the [releases page](https://github.com/dmlc/MXNet.jl/releases) to copy the release notes from `NEWS.md` to the newly created release tag. +5. Merge master into stable branch. +6. Tag stable branch: `git tag v1.2.3` +7. Push tag to remote: `git push origin v1.2.3` +8. Edit the [releases page](https://github.com/dmlc/MXNet.jl/releases) + to copy the release notes from `NEWS.md` to the newly created release tag. +9. Go to https://github.com/JuliaLang/METADATA.jl/pulls + and check that `attobot` has already made a PR for the release. From a4aab013ddc9ec29a979cbde778189d7bb643a46 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 18 Nov 2017 00:32:50 +0800 Subject: [PATCH 554/630] docs: minor changes in overview (#330) --- docs/src/user-guide/overview.md | 57 ++++++++++++++++----------------- 1 file changed, 28 insertions(+), 29 deletions(-) diff --git a/docs/src/user-guide/overview.md b/docs/src/user-guide/overview.md index a767643a3735..cddeed6bc8c9 100644 --- a/docs/src/user-guide/overview.md +++ b/docs/src/user-guide/overview.md @@ -11,7 +11,7 @@ prefix explicitly: ```julia julia> using MXNet -julia> x = mx.zeros(2,3) # MXNet NDArray +julia> x = mx.zeros(2, 3) # MXNet NDArray 2×3 mx.NDArray{Float32} @ CPU0: 0.0 0.0 0.0 0.0 0.0 0.0 @@ -51,20 +51,20 @@ functions, including `size` and `copy!` as shown in the last line. MXNet. It is like a Julia `Array` object, with some important differences listed here: -- The actual data could live on different `Context` (e.g. GPUs). For - some contexts, iterating into the elements one by one is very slow, - thus indexing into NDArray is not recommanded in general. The easiest - way to inspect the contents of an NDArray is to use the `copy` - function to copy the contents as a Julia `Array`. 
-- Operations on `NDArray` (including basic arithmetics and neural - network related operators) are executed in parallel with automatic - dependency tracking to ensure correctness. -- There is no generics in `NDArray`, the `eltype` is always - `mx.MX_float`. Because for applications in machine learning, single - precision floating point numbers are typical a best choice balancing - between precision, speed and portability. Also since libmxnet is - designed to support multiple languages as front-ends, it is much - simpler to implement with a fixed data type. +- The actual data could live on different `Context` (e.g. GPUs). For + some contexts, iterating into the elements one by one is very slow, + thus indexing into NDArray is not recommended in general. The easiest + way to inspect the contents of an NDArray is to use the `copy` + function to copy the contents as a Julia `Array`. +- Operations on `NDArray` (including basic arithmetics and neural + network related operators) are executed in parallel with automatic + dependency tracking to ensure correctness. +- There are no generics in `NDArray`, the `eltype` is always + `mx.MX_float`. Because for applications in machine learning, single + precision floating point numbers are typically the best choice balancing + between precision, speed and portability. Also since libmxnet is + designed to support multiple languages as front-ends, it is much + simpler to implement with a fixed data type. While most of the computation is hidden in libmxnet by operators corresponding to various neural network layers. Getting familiar with @@ -73,13 +73,13 @@ operators in Julia directly. The followings are common ways to create `NDArray` objects: -- `mx.empty(shape[, context])`: create on uninitialized array of a - given shape on a specific device. For example, - `mx.empty(2,3)`, `mx.((2,3), mx.gpu(2))`. -- `mx.zeros(shape[, context])` and `mx.ones(shape[, context])`: - similar to the Julia's built-in `zeros` and `ones`. 
-- `mx.copy(jl_arr, context)`: copy the contents of a Julia `Array` to - a specific device. +- `mx.empty(shape[, context])`: create an uninitialized array of a + given shape on a specific device. For example, + `mx.empty(2, 3)`, `mx.empty((2, 3), mx.gpu(2))`. +- `mx.zeros(shape[, context])` and `mx.ones(shape[, context])`: + similar to the Julia's built-in `zeros` and `ones`. +- `mx.copy(jl_arr, context)`: copy the contents of a Julia `Array` to + a specific device. Most of the convenient functions like `size`, `length`, `ndims`, `eltype` on array objects should work out-of-the-box. Although indexing @@ -87,7 +87,7 @@ is not supported, it is possible to take *slices*: ```@repl using MXNet -a = mx.ones(2,3) +a = mx.ones(2, 3) b = mx.slice(a, 1:2) b[:] = 2 a @@ -101,7 +101,7 @@ shows a way to set the contents of an `NDArray`. ```@repl using MXNet mx.srand(42) -a = mx.empty(2,3) +a = mx.empty(2, 3) a[:] = 0.5 # set all elements to a scalar a[:] = rand(size(a)) # set contents with a Julia Array copy!(a, rand(size(a))) # set value by copying a Julia Array @@ -248,9 +248,8 @@ symbolic composition system. It is like [Theano](http://deeplearning.net/software/theano/), except that we avoided long expression compilation time by providing *larger* neural network related building blocks to guarantee computation performance. -See also [this -note](http://mxnet.readthedocs.org/en/latest/program_model.html) for the -design and trade-off of the MXNet symbolic composition system. +See also [this note](http://mxnet.readthedocs.org/en/latest/program_model.html) +for the design and trade-off of the MXNet symbolic composition system. The basic type is `mx.SymbolicNode`. The following is a trivial example of composing two symbols with the `+` operation. @@ -305,8 +304,8 @@ categories: *inputs* and *parameters*. *inputs* are data and labels for the networks, while *parameters* are typically trainable *weights*, *bias*, *filters*. -When composing symbols, their arguments accumulates. 
We can list all the -arguments by +When composing symbols, their arguments accumulates. +We can list all the arguments by ```@example fcnet mx.list_arguments(net) From 57b50d49691174ffc8fd78bf821d807e277d8f7b Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 18 Nov 2017 02:32:19 +0800 Subject: [PATCH 555/630] build: set upstream version back to master (#328) --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index 522ceed5ff23..a59d9f84a5b3 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -5,7 +5,7 @@ import JSON # First try to detect and load existing libmxnet ################################################################################ libmxnet_detected = false -libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "0.12.1") +libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "master") curr_win = "20171019" # v0.12.0 if haskey(ENV, "MXNET_HOME") From 8564f190728ca3fa50dd2d048667b9ed08cc7a60 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 21 Nov 2017 01:36:06 +0800 Subject: [PATCH 556/630] executor: add Base.show and Base.print (#337) --- src/executor.jl | 38 ++++++++++++++++++++++++++++++-------- src/symbolic-node.jl | 6 +++--- 2 files changed, 33 insertions(+), 11 deletions(-) diff --git a/src/executor.jl b/src/executor.jl index 036c5743b7c0..26da87c69ac9 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -203,20 +203,42 @@ function copy_params_from(self::Executor, arg_params::Dict{Base.Symbol,NDArray}, end +Base.show(io::IO, x::Executor) = + print(io, "mx.", split(string(typeof(x)), '.')[end], " ", x.handle.value) + """ + print([io::IO], x::Executor) + Get a debug string about internal execution plan. Can be used to get an estimated about the memory cost. + ```julia - net = ... # Symbol - dProvider = ... 
# DataProvider - exec = mx.simple_bind(net, mx.cpu(), data=size(dProvider.data_batch[1])) - dbg_str = mx.debug_str(exec) - println(split(ref, ['\\n'])[end-2]) +julia> x = mx.Variable(:x) +MXNet.mx.SymbolicNode x + +julia> exec = mx.bind(x + 1, mx.cpu(), Dict(:x => mx.ones(2,3))) +mx.Executor Ptr{Void} @0x000055c3dee9eb30 + +julia> print(exec) +Symbol Outputs: + output[0]=_plus_scalar0(0) +Variable:x +-------------------- +Op:_plus_scalar, Name=_plus_scalar0 +Inputs: + arg[0]=x(0) version=0 +Attrs: + scalar=1.00000000e+00 +Total 0 MB allocated +Total 11 TempSpace resource requested ``` """ -function debug_str(self :: Executor) - s_ref = Ref{Cstring}() - @mxcall(:MXExecutorPrint, (MX_handle, Ptr{Cstring}), self.handle, s_ref) +Base.print(io::IO, x::Executor) = print(io, debug_str(x)) +Base.print(x::Executor) = print(STDOUT, x) + +function debug_str(x::Executor) + s_ref = Ref{Cstring}(C_NULL) + @mxcall(:MXExecutorPrint, (MX_handle, Ptr{Cstring}), x.handle, s_ref) unsafe_string(s_ref[]) end diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index bbe2d1874846..c9bf7e3b9db7 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -229,16 +229,16 @@ Base.show(io::IO, sym::SymbolicNode) = import Base: print -function print(io :: IO, sym :: SymbolicNode) +function print(io::IO, sym::SymbolicNode) out = Ref{mx.char_p}(C_NULL) @mx.mxcall(:MXSymbolPrint, (mx.MX_SymbolHandle, Ref{mx.char_p}), sym.handle, out) print(io, unsafe_string(out[])) end -print(sym :: SymbolicNode) = print(STDOUT, sym) +print(sym::SymbolicNode) = print(STDOUT, sym) """ - print([io :: IO], sym :: SymbolicNode) + print([io::IO], sym::SymbolicNode) Print the content of symbol, used for debug. 
From ceb7fbfc303ce71e4c029651a4e8909648d67172 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 21 Nov 2017 01:46:51 +0800 Subject: [PATCH 557/630] travis: enable caching for reducing build time (#329) * travis: tweak number of make job on CI * travis: enable cache for libmxnet --- .travis.yml | 10 +++++++--- deps/build.jl | 10 +++++----- deps/cpcblas.sh | 7 +++++++ test/travis/run_test.sh | 8 +++++++- 4 files changed, 26 insertions(+), 9 deletions(-) create mode 100755 deps/cpcblas.sh diff --git a/.travis.yml b/.travis.yml index a91994db2fc1..680df7af481e 100644 --- a/.travis.yml +++ b/.travis.yml @@ -1,10 +1,13 @@ # Documentation: http://docs.travis-ci.com/user/languages/julia/ sudo: false + language: julia + os: - linux - osx osx_image: xcode8 + julia: - 0.6 # - nightly 0.6 supports depends on #170 @@ -15,6 +18,10 @@ branches: - stable - /^v\d+\.\d+(\.\d+)?(-\S*)?$/ # for tagging +cache: + directories: + - $TRAVIS_BUILD_DIR/deps/src + # dependent apt packages addons: apt: @@ -40,9 +47,6 @@ notifications: email: false script: - # bump the time limit of no ouput - # the `travis_wait` wrapper can be removed once this issue fixed: - # https://github.com/JuliaLang/julia/pull/23601 - ${TRAVIS_DIR}/run_test.sh after_success: diff --git a/deps/build.jl b/deps/build.jl index a59d9f84a5b3..c22af6c7bf89 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -70,7 +70,7 @@ end function get_cpucore() if haskey(ENV, "TRAVIS") # on travis-ci - 4 + 2 else min(Sys.CPU_CORES, 8) end @@ -166,17 +166,17 @@ if !libmxnet_detected end) @build_steps begin ChangeDirectory(_mxdir) - `git submodule deinit --force .` `git fetch` if libmxnet_curr_ver != "master" `git checkout $libmxnet_curr_ver` else - `git merge --ff origin/$libmxnet_curr_ver` + `git checkout origin/$libmxnet_curr_ver` end `git submodule update --init --recursive` `git -C mshadow checkout -- make/mshadow.mk` - `make clean` - `cp ../../cblas.h include/cblas.h` + + # copying on changed, make travis caching happy + 
`../../cpcblas.sh` `sed -i -s "s/MSHADOW_CFLAGS = \(.*\)/MSHADOW_CFLAGS = \1 $ilp64/" mshadow/make/mshadow.mk` diff --git a/deps/cpcblas.sh b/deps/cpcblas.sh new file mode 100755 index 000000000000..1a592186b49c --- /dev/null +++ b/deps/cpcblas.sh @@ -0,0 +1,7 @@ +#!/bin/sh + +# be invoked from build.jl + +set -e + +diff ../../cblas.h include/cblas.h || cp -v ../../cblas.h include/cblas.h diff --git a/test/travis/run_test.sh b/test/travis/run_test.sh index a576c69f6979..bf726eb49157 100755 --- a/test/travis/run_test.sh +++ b/test/travis/run_test.sh @@ -1,4 +1,10 @@ #!/bin/bash +set -e if [[ -a .git/shallow ]]; then git fetch --unshallow; fi -julia -e 'Pkg.clone(pwd()); Pkg.build("MXNet"); Pkg.test("MXNet"; coverage=true)' +julia -e 'Pkg.clone(pwd())' +( + cd `julia -e 'println(Pkg.dir("MXNet", "deps"))'` && + ln -fs $TRAVIS_BUILD_DIR/deps/src +) +julia -e 'Pkg.build("MXNet"); Pkg.test("MXNet"; coverage=true)' From 1a7887c5c1613fbbc676e4d1f5c0fa17318325a1 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 21 Nov 2017 01:48:05 +0800 Subject: [PATCH 558/630] ndarray: add outer constrcutor for AbstractArray (#334) --- src/ndarray.jl | 7 +++---- test/unittest/ndarray.jl | 33 ++++++++++++++++++++++++--------- 2 files changed, 27 insertions(+), 13 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 0b0e01a40e64..9aca2f3d9c42 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -98,6 +98,9 @@ mutable struct NDArray end end +NDArray(x::AbstractArray{T}) where {T<:DType} = copy(collect(x), cpu()) +NDArray(x::Array{T}) where {T<:DType} = copy(x, cpu()) + const NDArrayOrReal = Union{NDArray, Real} @unfuse NDArray @@ -107,10 +110,6 @@ function Base.show(io :: IO, arr :: NDArray) Base.showarray(io, try_get_shared(arr, sync=:read), false, header=false) end -function NDArray(data :: Array{T}) where T<:Real - copy(data, cpu()) -end - function Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) Base.unsafe_convert(MX_handle, obj.handle) end diff --git 
a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 0e1837bdd5a3..5217ca80feaa 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -15,6 +15,20 @@ function rand_tensors(::Type{T}, dims::NTuple{N, Int}) where {N, T} return (tensor, array) end +function test_constructor() + info("NDArray::NDArray(x::AbstractArray)") + function check_absarray(x) + y = mx.NDArray(x) + @test ndims(x) == ndims(y) + @test eltype(x) == eltype(y) + @test x[3] == y[3][] + end + + check_absarray(1:10) + check_absarray(1.0:10) +end # function test_constructor + + function test_copy() dims = rand_dims() tensor = rand(mx.MX_float, dims) @@ -87,7 +101,7 @@ end function test_linear_idx() info("NDArray::getindex::linear indexing") - let A = reshape(collect(1:30), 3, 10) + let A = reshape(1:30, 3, 10) x = mx.NDArray(A) @test copy(x) == A @@ -104,7 +118,7 @@ function test_linear_idx() @test_throws BoundsError x[42] end - let A = reshape(collect(1:24), 3, 2, 4) + let A = reshape(1:24, 3, 2, 4) x = mx.NDArray(A) @test copy(x) == A @@ -118,7 +132,7 @@ function test_linear_idx() end info("NDArray::setindex!::linear indexing") - let A = reshape(collect(1:24), 3, 2, 4) + let A = reshape(1:24, 3, 2, 4) x = mx.NDArray(A) @test copy(x) == A @@ -136,7 +150,7 @@ end # function test_linear_idx function test_first() info("NDArray::first") - let A = reshape(collect(1:30), 3, 10) + let A = reshape(1:30, 3, 10) x = mx.NDArray(A) @test x[] == 1 @@ -613,7 +627,7 @@ end function test_sum() info("NDArray::sum") - let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + let A = reshape(1.0:8, 2, 2, 2), X = mx.NDArray(A) @test copy(sum(X))[] == sum(A) @test copy(sum(X, 1)) == sum(A, 1) @test copy(sum(X, 2)) == sum(A, 2) @@ -626,7 +640,7 @@ end function test_mean() info("NDArray::mean") - let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + let A = reshape(1.0:8, 2, 2, 2), X = mx.NDArray(A) @test copy(mean(X))[] == mean(A) @test copy(mean(X, 1)) == mean(A, 1) @test copy(mean(X, 
2)) == mean(A, 2) @@ -639,7 +653,7 @@ end function test_maximum() info("NDArray::maximum") - let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + let A = reshape(1.0:8, 2, 2, 2), X = mx.NDArray(A) @test copy(maximum(X))[] == maximum(A) @test copy(maximum(X, 1)) == maximum(A, 1) @test copy(maximum(X, 2)) == maximum(A, 2) @@ -652,7 +666,7 @@ end function test_minimum() info("NDArray::minimum") - let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + let A = reshape(1.0:8, 2, 2, 2), X = mx.NDArray(A) @test copy(minimum(X))[] == minimum(A) @test copy(minimum(X, 1)) == minimum(A, 1) @test copy(minimum(X, 2)) == minimum(A, 2) @@ -665,7 +679,7 @@ end function test_prod() info("NDArray::prod") - let A = reshape(1.0:8, 2, 2, 2) |> collect, X = mx.NDArray(A) + let A = reshape(1.0:8, 2, 2, 2), X = mx.NDArray(A) @test copy(prod(X))[] == prod(A) @test copy(prod(X, 1)) == prod(A, 1) @test copy(prod(X, 2)) == prod(A, 2) @@ -740,6 +754,7 @@ end # Run tests ################################################################################ @testset "NDArray Test" begin + test_constructor() test_assign() test_copy() test_slice() From 010ea3cc8340a91aba0fc2b9c9bcdf0d49ad9f6c Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 21 Nov 2017 03:12:37 +0800 Subject: [PATCH 559/630] sym: implement get_children (#333) See https://github.com/apache/incubator-mxnet/pull/5141 --- NEWS.md | 8 ++++++++ src/symbolic-node.jl | 29 +++++++++++++++++++++++++++++ test/unittest/symbolic-node.jl | 17 +++++++++++++++++ 3 files changed, 54 insertions(+) diff --git a/NEWS.md b/NEWS.md index 0cea0db56359..0259c6803791 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,11 @@ +# v0.4.0 (#TBD) + +## New APIs + +### `SymbolicNode` + +* `mx.get_children` for exploring the graph programmatically. 
(#TBD) + # v0.3.0 (2017.11.16) * Update `libmxnet` to diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index c9bf7e3b9db7..11c2a6fdc8ec 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -119,6 +119,35 @@ function get_internals(self :: SymbolicNode) return SymbolicNode(MX_SymbolHandle(ref_hdr[])) end +""" + get_children(x::SymbolicNode) + +Gets a new grouped `SymbolicNode` whose output contains inputs to output +nodes of the original symbol. + +```julia +julia> x = mx.Variable(:x) +MXNet.mx.SymbolicNode x + +julia> y = mx.Variable(:y) +MXNet.mx.SymbolicNode y + +julia> z = x + y +MXNet.mx.SymbolicNode _plus1 + +julia> a |> mx.get_children |> mx.list_outputs +2-element Array{Symbol,1}: + :x + :y +``` +""" +function get_children(x::SymbolicNode) + hdl = Ref{MX_handle}(C_NULL) + @mxcall(:MXSymbolGetChildren, (MX_handle, Ref{MX_handle}), x, hdl) + sym = hdl[] |> MX_SymbolHandle |> SymbolicNode + isempty(list_outputs(sym)) ? nothing : sym +end + """ get_attr(self :: SymbolicNode, key :: Symbol) diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index baeb92a68e23..766f789c413b 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -53,6 +53,23 @@ function test_internal() @test mx.list_arguments(fc1) == mx.list_arguments(oldfc) end +function test_get_children() + info("SymbolicNode::get_children") + + let x = mx.Variable(:x), y = mx.Variable(:y) + z = x + y + @test length(mx.list_outputs(z)) == 1 + @test length(mx.list_outputs(mx.get_children(z))) == 2 + @test mx.list_outputs(mx.get_children(z)) == [:x, :y] + end + + info("SymbolicNode::get_children::on leaf") + let x = mx.Variable(:x) + @test mx.get_children(x) == nothing + end +end # test_get_children + + function test_compose() info("SymbolicNode::compose") From 1f50a144c90e5034af79468b0c9a9ff234a11b98 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 21 Nov 2017 03:13:02 +0800 Subject: [PATCH 560/630] sym: fix printing of symbol generated 
via get_internals (#332) --- src/symbolic-node.jl | 8 +++++++- test/unittest/symbolic-node.jl | 11 +++++++++-- 2 files changed, 16 insertions(+), 3 deletions(-) diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index 11c2a6fdc8ec..d8305eb57c00 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -250,7 +250,13 @@ function get_name(self :: mx.SymbolicNode) success = Ref(0) @mxcall(:MXSymbolGetName, (MX_handle, Ref{char_p}, Ref{Int}), self.handle.value, name, success) @assert success[] != -1 - return Symbol(unsafe_string(name[])) + + str = name[] + if str == C_NULL # e.g. the symbol returned via get_internals + string(self.handle.value) + else + Symbol(unsafe_string(str)) + end end Base.show(io::IO, sym::SymbolicNode) = diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index 766f789c413b..edde78c32541 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -468,7 +468,7 @@ function test_power() end end - info("NDArray::power::e.^x::x.^e") + info("SymbolicNode::power::e.^x::x.^e") let x = mx.Variable(:x), A = [0 0 0; 0 0 0] y = exec(e.^x; :x => A)[] @test copy(y) ≈ ones(A) @@ -486,7 +486,7 @@ function test_power() end end - info("NDArray::power::π.^x::x.^π") + info("SymbolicNode::power::π.^x::x.^π") let x = mx.Variable(:x), A = Float32[1 2; 3 4] let y = π.^x z = exec(y; :x => A)[] @@ -500,6 +500,12 @@ function test_power() end end # function test_power +function test_get_name() + info("SymbolicNode::get_name::with get_internals") + name = mx.get_name(mx.get_internals(mlp2())) # no error + @test contains(name, "Ptr") +end # function test_get_name + ################################################################################ # Run tests ################################################################################ @@ -522,6 +528,7 @@ end # function test_power test_mul() test_div() test_power() + test_get_name() end end From b0556e682dd3e361d4f1242152c27a6c85d144ac Mon Sep 17 00:00:00 2001 
From: Michael Creel Date: Wed, 22 Nov 2017 09:57:12 +0100 Subject: [PATCH 561/630] Update regression-example.jl (#339) Fix the call to scatter plot, in the last line. It is commented out, but if a user uncomments it to see a plot of the fit, the fix is needed. --- examples/regression-example.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/regression-example.jl b/examples/regression-example.jl index 885f031dc658..94a0d3761ba2 100644 --- a/examples/regression-example.jl +++ b/examples/regression-example.jl @@ -57,4 +57,4 @@ mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprov plotprovider = mx.ArrayDataProvider(:data => ValidationInput, :label => ValidationOutput) fit = mx.predict(model, plotprovider) println("correlation between fitted values and true regression line: ", cor(vec(fit), vec(ValidationOutput))) -#scatter(ValidationOutput,fit',w = 3, xlabel="true", ylabel="predicted", title="45º line is what we hope for", show=true) +#scatter(ValidationOutput',fit',w = 3, xlabel="true", ylabel="predicted", title="45º line is what we hope for", show=true) From 91a410e6a460eb9ead3955bb7462ffaf12cfead7 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 23 Nov 2017 01:17:50 +0800 Subject: [PATCH 562/630] test: minor style changes for mlp-test (#340) --- examples/mnist/mlp-test.jl | 23 +++++++++++++++++------ 1 file changed, 17 insertions(+), 6 deletions(-) diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index 2acedd073dfa..56bd00b6a122 100644 --- a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -2,32 +2,30 @@ # features of MXNet.jl in this example in order to detect regression errors. 
module MNISTTest + using MXNet using Base.Test include("mnist-data.jl") function get_mnist_mlp() - mlp = @mx.chain mx.Variable(:data) => + @mx.chain mx.Variable(:data) => mx.FullyConnected(name=:fc1, num_hidden=128) => mx.Activation(name=:relu1, act_type=:relu) => mx.FullyConnected(name=:fc2, num_hidden=64) => mx.Activation(name=:relu2, act_type=:relu) => mx.FullyConnected(name=:fc3, num_hidden=10) => mx.SoftmaxOutput(name=:softmax) - return mlp end -function get_mnist_data(batch_size=100) - return get_mnist_providers(batch_size) -end +get_mnist_data(batch_size = 100) = get_mnist_providers(batch_size) function mnist_fit_and_predict(optimizer, initializer, n_epoch) mlp = get_mnist_mlp() train_provider, eval_provider = get_mnist_data() # setup model - model = mx.FeedForward(mlp, context=mx.cpu()) + model = mx.FeedForward(mlp, context = mx.cpu()) # fit parameters cp_prefix = "mnist-test-cp" @@ -73,12 +71,25 @@ function mnist_fit_and_predict(optimizer, initializer, n_epoch) end function test_mnist_mlp() + info("MNIST::SGD") @test mnist_fit_and_predict(mx.SGD(lr=0.1, momentum=0.9), mx.UniformInitializer(0.01), 2) > 90 + + info("MNIST::ADAM") @test mnist_fit_and_predict(mx.ADAM(), mx.NormalInitializer(), 2) > 90 + + info("MNIST::AdaGrad") @test mnist_fit_and_predict(mx.AdaGrad(), mx.NormalInitializer(), 2) > 90 + + info("MNIST::AdaDelta") @test mnist_fit_and_predict(mx.AdaDelta(), mx.NormalInitializer(), 2) > 90 + + info("MNIST::AdaMax") @test mnist_fit_and_predict(mx.AdaMax(), mx.NormalInitializer(), 2) > 90 + + info("MNIST::RMSProp") @test mnist_fit_and_predict(mx.RMSProp(), mx.NormalInitializer(), 2) > 90 + + info("MNIST::Nadam") @test mnist_fit_and_predict(mx.Nadam(), mx.NormalInitializer(), 2) > 90 end From f12648245daba2926652862db958e6d8486f1332 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 23 Nov 2017 01:20:25 +0800 Subject: [PATCH 563/630] sym: handy macro `mx.var` for creating `mx.Variable` (#338) --- NEWS.md | 10 ++++++++++ src/symbolic-node.jl | 21 
+++++++++++++++++++++ test/unittest/symbolic-node.jl | 16 ++++++++++++++++ 3 files changed, 47 insertions(+) diff --git a/NEWS.md b/NEWS.md index 0259c6803791..3e5dce1c6eee 100644 --- a/NEWS.md +++ b/NEWS.md @@ -6,6 +6,16 @@ * `mx.get_children` for exploring the graph programmatically. (#TBD) +* A handy macro `@mx.var` for creating `mx.Variable`. (#TBD) + + ```julia + julia> x = @mx.var x + MXNet.mx.SymbolicNode x + + julia> x, y, z = @mx.var x y z + (MXNet.mx.SymbolicNode x, MXNet.mx.SymbolicNode y, MXNet.mx.SymbolicNode z) + ``` + # v0.3.0 (2017.11.16) * Update `libmxnet` to diff --git a/src/symbolic-node.jl b/src/symbolic-node.jl index d8305eb57c00..bb3c97773488 100644 --- a/src/symbolic-node.jl +++ b/src/symbolic-node.jl @@ -347,6 +347,27 @@ function Variable(name :: Union{Symbol, AbstractString}; attrs = Dict()) node end +""" + @var ... + +A handy macro for creating `mx.Variable`. + +```julia +julia> x = @mx.var x +MXNet.mx.SymbolicNode x + +julia> x, y, z = @mx.var x y z +(MXNet.mx.SymbolicNode x, MXNet.mx.SymbolicNode y, MXNet.mx.SymbolicNode z) +``` +""" +macro var(n::Symbol) + Expr(:call, :Variable, QuoteNode(n)) +end + +macro var(names::Symbol...) + Expr(:tuple, map(n -> Expr(:call, :Variable, QuoteNode(n)), names)...) +end + """ Group(nodes :: SymbolicNode...) 
diff --git a/test/unittest/symbolic-node.jl b/test/unittest/symbolic-node.jl index edde78c32541..e3e003d296af 100644 --- a/test/unittest/symbolic-node.jl +++ b/test/unittest/symbolic-node.jl @@ -506,6 +506,21 @@ function test_get_name() @test contains(name, "Ptr") end # function test_get_name +function test_var() + info("SymbolicNode::var") + x = @mx.var x + @test x isa mx.SymbolicNode + + x′ = @mx.var x + @test x.handle != x′.handle + + x, y, z = @mx.var x y z + @test x isa mx.SymbolicNode + @test y isa mx.SymbolicNode + @test z isa mx.SymbolicNode +end # test_var + + ################################################################################ # Run tests ################################################################################ @@ -529,6 +544,7 @@ end # function test_get_name test_div() test_power() test_get_name() + test_var() end end From cb06a9aeb59d0bb64b3f0f17e7c919b7b1f56e0e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 25 Nov 2017 09:38:39 +0800 Subject: [PATCH 564/630] build: bump max number of make jobs to 32 (#343) --- deps/build.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/deps/build.jl b/deps/build.jl index c22af6c7bf89..8b4c254cbb39 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -72,7 +72,7 @@ function get_cpucore() if haskey(ENV, "TRAVIS") # on travis-ci 2 else - min(Sys.CPU_CORES, 8) + min(Sys.CPU_CORES, 32) end end From 45d6279f3fcc833308b4a9bb4d1e07a5a2ea8767 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 27 Nov 2017 10:41:31 +0800 Subject: [PATCH 565/630] ndarray: add `Base.show(io, MIME"text/plain")` (#347) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * ndarray: add `Base.show(io, MIME"text/plain")` e.g. 
make Array of NDArray show like this ```julia julia> [mx.zeros(100)] 1-element Array{MXNet.mx.NDArray,1}: NDArray Float32[0.0, 0.0, 0.0 … 0.0, 0.0, 0.0] ``` * test cases --- src/ndarray.jl | 12 +++++++++--- test/unittest/ndarray.jl | 12 +++++++++++- 2 files changed, 20 insertions(+), 4 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 9aca2f3d9c42..9cb168ca4ff5 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -105,9 +105,15 @@ const NDArrayOrReal = Union{NDArray, Real} @unfuse NDArray -function Base.show(io :: IO, arr :: NDArray) - println(io, "$(join(size(arr), "×")) mx.NDArray{$(eltype(arr))} @ $(context(arr)):") - Base.showarray(io, try_get_shared(arr, sync=:read), false, header=false) +function Base.show(io::IO, x::NDArray) + print(io, "NDArray ") + Base.showarray(io, try_get_shared(x, sync = :read), header = false) +end + +# for REPL +function Base.show(io::IO, ::MIME{Symbol("text/plain")}, x::NDArray) + println(io, "$(join(size(x), "×")) mx.NDArray{$(eltype(x))} @ $(context(x)):") + Base.showarray(io, try_get_shared(x, sync = :read), false, header = false) end function Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 5217ca80feaa..2c278bb6e201 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -741,13 +741,23 @@ function test_transpose() end function test_show() - let str = sprint(show, mx.NDArray([1 2 3 4])) + info("NDArray::show::REPL") + let str = sprint(show, MIME"text/plain"(), mx.NDArray([1 2 3 4])) @test contains(str, "1×4") @test contains(str, "mx.NDArray") @test contains(str, "Int64") @test contains(str, "CPU") @test match(r"1\s+2\s+3\s+4", str) != nothing end + + info("NDArray::show") + let str = sprint(show, mx.NDArray([1 2 3 4])) + @test str == "NDArray [1 2 3 4]" + end + + let str = sprint(show, mx.zeros(4)) + @test str == "NDArray Float32[0.0, 0.0, 0.0, 0.0]" + end end 
################################################################################ From e0f625a49328cd98a8e11093a4ed8a0981f555ed Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 28 Nov 2017 04:15:32 +0800 Subject: [PATCH 566/630] example: fix batchsize config in regression-example (#342) --- examples/regression-example.jl | 44 ++++++++++++++++++++++++++-------- 1 file changed, 34 insertions(+), 10 deletions(-) diff --git a/examples/regression-example.jl b/examples/regression-example.jl index 94a0d3761ba2..e820d54001ec 100644 --- a/examples/regression-example.jl +++ b/examples/regression-example.jl @@ -13,8 +13,8 @@ generate_inputs(mean, var, size) = rand(MvNormal(mean, var), size) output(data) = sin.(data[1:1,:]).*sin.(data[2:2,:])./(data[1:1,:].*data[2:2,:]) # create training and evaluation data sets -mean=[0.0;0.0] -var=[1.0 0.0;0.0 1.0] +mean=[0.0; 0.0] +var=[1.0 0.0; 0.0 1.0] samplesize = 5000 TrainInput = generate_inputs(mean, var, samplesize) TrainOutput = output(TrainInput) @@ -22,9 +22,22 @@ ValidationInput = generate_inputs(mean, var, samplesize) ValidationOutput = output(ValidationInput) # how to set up data providers using data in memory -batchsize = 100 # can adjust this later, but must be defined now for next line -trainprovider = mx.ArrayDataProvider(:data => TrainInput, batch_size=batchsize, shuffle=true, :label => TrainOutput) -evalprovider = mx.ArrayDataProvider(:data => ValidationInput, batch_size=batchsize, shuffle=true, :label => ValidationOutput) +function data_source(batchsize = 100) + train = mx.ArrayDataProvider( + :data => TrainInput, + :label => TrainOutput, + batch_size = batchsize, + shuffle = true, + ) + valid = mx.ArrayDataProvider( + :data => ValidationInput, + :label => ValidationOutput, + batch_size = batchsize, + shuffle = true, + ) + + train, valid +end # create a two hidden layer MPL: try varying num_hidden, and change tanh to relu, # or add/remove a layer @@ -35,7 +48,7 @@ net = @mx.chain mx.Variable(:data) => 
mx.Activation(act_type=:tanh) => mx.FullyConnected(num_hidden=3) => mx.Activation(act_type=:tanh) => - mx.FullyConnected(num_hidden=1) => + mx.FullyConnected(num_hidden=1) => mx.LinearRegressionOutput(mx.Variable(:label)) # final model definition, don't change, except if using gpu @@ -47,11 +60,22 @@ optimizer = mx.ADAM() # train, reporting loss for training and evaluation sets # initial training with small batch size, to get to a good neighborhood -batchsize = 200 -mx.fit(model, optimizer, initializer=mx.NormalInitializer(0.0,0.1), eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 20) +trainprovider, evalprovider = data_source(#= batchsize =# 200) +mx.fit(model, optimizer, trainprovider, + initializer = mx.NormalInitializer(0.0, 0.1), + eval_metric = mx.MSE{mx.NDArray{Float32,1}}(), + eval_data = evalprovider, + n_epoch = 20, + callbacks = [mx.speedometer()]) # more training with the full sample -batchsize = samplesize -mx.fit(model, optimizer, eval_metric=mx.MSE(), trainprovider, eval_data=evalprovider, n_epoch = 20) +trainprovider, evalprovider = data_source(#= batchsize =# samplesize) +mx.fit(model, optimizer, trainprovider, + initializer = mx.NormalInitializer(0.0, 0.1), + eval_metric = mx.MSE{mx.NDArray{Float32,1}}(), + eval_data = evalprovider, + n_epoch = 500, # previous setting is batchsize = 200, epoch = 20 + # implies we did (5000 / 200) * 20 times update in previous `fit` + callbacks = [mx.speedometer()]) # obtain predictions plotprovider = mx.ArrayDataProvider(:data => ValidationInput, :label => ValidationOutput) From 935eb3594110ab628c81d49e1e1af2d07545df9b Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 28 Nov 2017 04:25:26 +0800 Subject: [PATCH 567/630] ndarray: make _minus type stable (#345) * ndarray: make _minus type stable The current importer `_import_ndarray_functions` provide `_minus(x, y; out = x)` and its return value is rely on keyword argument `out`. 
But Julia cannot (or hard to) do type inference on keyword argument at the moment, so this commit propose a new method `_minus!(x, y)` which modified the first argument, instead of provide a keyword argument. The new method can make type stable. fix #341 * add test cases --- src/ndarray.jl | 30 +++++++++++++++++++++++++----- test/unittest/ndarray.jl | 18 ++++++++++++------ 2 files changed, 37 insertions(+), 11 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 9cb168ca4ff5..9bb74f83f5d2 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -637,7 +637,7 @@ function sub_from!(dst::NDArray, arg::NDArrayOrReal) if isa(arg, Real) _minus_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) else - _minus(dst, arg, out=dst) + _minus!(dst, arg) end end @@ -1037,6 +1037,15 @@ function _autoimport(name::Symbol) end end +function _outexpr(name::Symbol, x #= the first arg of `sig` =#) + if endswith(string(name), "!") # `func!` + Ptr, 1, :([[MX_handle(x.handle)]]), :($x) + else + retexpr = :(NDArray(MX_NDArrayHandle(unsafe_load(hdls_ref[], 1)))) + Ref, 0, :(Ref{Ptr{MX_handle}}(C_NULL)), retexpr + end +end + macro _remap(sig::Expr, imp::Expr) fname = sig.args[1] opname = string(imp.args[1]) @@ -1055,16 +1064,19 @@ macro _remap(sig::Expr, imp::Expr) mxvals = Expr(:vect, map(x -> :(dump_mx_param($(x.args[2]))), mxargs)...) ndhlds = Expr(:vect, map(x -> :($(x).handle), ndin)...) + # handler for `func!` which has side effect on first argument. 
+ T, n_output, hdls_ref, retexpr = _outexpr(fname, sig.args[2].args[1]) + func_body = quote op_handle = _get_cached_libmx_op_handle($opname) - n_output = Ref(Cint(0)) - hdls_ref = Ref{Ptr{MX_handle}}(C_NULL) + n_output = Ref(Cint($n_output)) + hdls_ref = $hdls_ref @mxcall(:MXImperativeInvoke, (MX_handle, Cint, Ptr{MX_handle}, Ref{Cint}, - Ref{Ptr{MX_handle}}, + $T{Ptr{MX_handle}}, Cint, char_pp, char_pp), @@ -1076,7 +1088,7 @@ macro _remap(sig::Expr, imp::Expr) $(length(mxargs)), $mxkeys, $mxvals) - NDArray(MX_NDArrayHandle(unsafe_load(hdls_ref[], 1))) + $retexpr end docstr = " $sig" @@ -1123,6 +1135,13 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap prod(arr::NDArray) prod(arr) @_remap prod(arr::NDArray, dims) prod(arr; axis = 0 .- dims, keepdims = true) +################################################################################ +# remapping to solving type unstablility +################################################################################ + +@_remap _minus(x::NDArray, y::NDArray) _minus(x, y) +@_remap _minus!(x::NDArray, y::NDArray) _minus(x, y) + ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -1248,6 +1267,7 @@ const _op_import_bl = [ # import black list; do not import these funcs "dot", "transpose", "prod", + "_minus", ] macro _import_ndarray_functions() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 2c278bb6e201..47ce9b08957d 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -264,6 +264,12 @@ function test_minus() scalar_large = Float16(1e4) @test t6 - scalar_small ≈ copy(a6 .- scalar_small) @test t6 - scalar_large ≈ copy(a6 .- scalar_large) + + info("NDArray::minus::type stablility") + let x = mx.zeros(dims), y = mx.ones(dims) + @inferred x - y + @inferred x .- y + end end function test_mul() @@ 
-361,29 +367,29 @@ end function test_rdiv() - info("NDarray::rdiv") + info("NDArray::rdiv") - info("NDarray::rdiv::Inf16") + info("NDArray::rdiv::Inf16") let x = 1 ./ mx.zeros(Float16, 4) @test copy(x) == [Inf16, Inf16, Inf16, Inf16] end - info("NDarray::rdiv::Inf32") + info("NDArray::rdiv::Inf32") let x = 1 ./ mx.zeros(Float32, 4) @test copy(x) == [Inf32, Inf32, Inf32, Inf32] end - info("NDarray::rdiv::Inf64") + info("NDArray::rdiv::Inf64") let x = 1 ./ mx.zeros(Float64, 4) @test copy(x) == [Inf64, Inf64, Inf64, Inf64] end - info("NDarray::rdiv::Int") + info("NDArray::rdiv::Int") let x = 1 ./ mx.NDArray([1 2; 3 4]) @test copy(x) == [1 0; 0 0] end - info("NDarray::rdiv::Float32") + info("NDArray::rdiv::Float32") let x = 1 ./ mx.NDArray(Float32[1 2; 3 4]) y = 1 ./ Float32[1 2; 3 4] @test copy(x) ≈ y From 2a5a284099766516bf3b26ce05ded190cef1ef6f Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 28 Nov 2017 04:26:34 +0800 Subject: [PATCH 568/630] model: refine and test cases for FeedForward constructor (#346) --- src/model.jl | 9 ++------- test/unittest/model.jl | 34 ++++++++++++++++++++++++++++++++++ 2 files changed, 36 insertions(+), 7 deletions(-) create mode 100644 test/unittest/model.jl diff --git a/src/model.jl b/src/model.jl index df15e4cace0a..44a2ba755798 100644 --- a/src/model.jl +++ b/src/model.jl @@ -25,6 +25,7 @@ mutable struct FeedForward <: AbstractModel # leave the rest fields undefined FeedForward(arch :: SymbolicNode, ctx :: Vector{Context}) = new(arch, ctx) + FeedForward(arch :: SymbolicNode, ctx :: Context) = new(arch, [ctx]) end """ @@ -53,14 +54,8 @@ end or a list of `Context` objects. In the latter case, data parallelization will be used for training. If no context is provided, the default context `cpu()` will be used. 
""" -function FeedForward(arch :: SymbolicNode; context :: Union{Context, Vector{Context}, Void} = nothing) - if isa(context, Void) - context = [Context(CPU)] - elseif isa(context, Context) - context = [context] - end +FeedForward(arch::SymbolicNode; context::Union{Context,Vector{Context}} = [cpu()]) = FeedForward(arch, context) -end """ init_model(self, initializer; overwrite=false, input_shapes...) diff --git a/test/unittest/model.jl b/test/unittest/model.jl new file mode 100644 index 000000000000..fafda7968e25 --- /dev/null +++ b/test/unittest/model.jl @@ -0,0 +1,34 @@ +module TestModel + +using Base.Test +using MXNet + + +function test_feedforward() + info("Model::FeedForward::constructor") + let x = @mx.var x + m = mx.FeedForward(x) + @assert m.arch === x + @assert length(m.ctx) == 1 + end + + info("Model::FeedForward::constructor::keyword context") + let x = @mx.var x + m = mx.FeedForward(x, context = mx.cpu()) + @assert m.arch === x + @assert length(m.ctx) == 1 + end + + let x = @mx.var x + m = mx.FeedForward(x, context = [mx.cpu(), mx.cpu(1)]) + @assert m.arch === x + @assert length(m.ctx) == 2 + end +end + + +@testset "Model Test" begin + test_feedforward() +end + +end # module TestModel From cb042fd2f870529799b16552d754980e867c498e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 1 Dec 2017 21:18:39 +0800 Subject: [PATCH 569/630] parametric NDArray (#331) * ndarray: add outer constrcutor for AbstractArray * ndarray: refine copy * ndarray: refine copy! * ndarray: refine convert * ndarray: refine add_to! * ndarray: refine sub_from! * ndarray: refine mul_to! * ndarray: refine div_from! * ndarray: refine rdiv_from! 
* ndarray: refine _wait_to_read/_wait_to_write * ndarray: refine is_shared * ndarray: refine save * ndarray: refine dot * ndarray: VecOfNDArray * executor: refine backward * ndarray: refine empty * executor: refine bind --- src/callback.jl | 31 +++-- src/executor.jl | 113 ++++++++-------- src/io.jl | 95 +++++++------ src/kvstore.jl | 36 ++--- src/metric.jl | 96 ++++++------- src/model.jl | 75 ++++++----- src/ndarray.jl | 281 ++++++++++++++++++--------------------- src/util.jl | 14 ++ test/unittest/ndarray.jl | 10 +- test/unittest/util.jl | 25 ++++ 10 files changed, 390 insertions(+), 386 deletions(-) create mode 100644 test/unittest/util.jl diff --git a/src/callback.jl b/src/callback.jl index 289fdd066aa9..16e44fdc632d 100644 --- a/src/callback.jl +++ b/src/callback.jl @@ -48,7 +48,7 @@ end See also [`every_n_epoch`](@ref) and [`speedometer`](@ref). """ -function every_n_batch(callback :: Function, n :: Int; call_on_0 :: Bool = false) +function every_n_batch(callback::Function, n::Int; call_on_0::Bool = false) BatchCallback(n, call_on_0, callback) end function (cb :: BatchCallback)(state :: OptimizationState) @@ -62,7 +62,7 @@ function (cb :: BatchCallback)(state :: OptimizationState) end """ - speedometer(; frequency=50) + speedometer(;frequency=50) Create an `AbstractBatchCallback` that measure the training speed (number of samples processed per second) every k mini-batches. @@ -71,9 +71,9 @@ Create an `AbstractBatchCallback` that measure the training speed * `frequency::Int`: keyword argument, default 50. The frequency (number of min-batches) to measure and report the speed. 
""" -function speedometer(;frequency::Int=50) +function speedometer(;frequency::Int = 50) cl_tic = 0 - every_n_batch(frequency, call_on_0=true) do state :: OptimizationState + every_n_batch(frequency, call_on_0 = true) do state::OptimizationState if state.curr_batch == 0 # reset timer cl_tic = time() @@ -104,10 +104,11 @@ A convenient function to construct a callback that runs every `n` full data-pass See also [`every_n_batch`](@ref). """ -function every_n_epoch(callback :: Function, n :: Int; call_on_0 :: Bool = false) +every_n_epoch(callback::Function, n::Int; call_on_0::Bool = false) = EpochCallback(n, call_on_0, callback) -end -function (cb :: EpochCallback)(model :: Any, state :: OptimizationState, metric :: Vector{Tuple{Base.Symbol, T}}) where T<:Real + +function (cb::EpochCallback)(model::Any, state::OptimizationState, + metric::Vector{Tuple{Symbol, T}}) where T<:Real if state.curr_epoch == 0 if cb.call_on_0 cb.callback(model, state, metric) @@ -124,15 +125,17 @@ Create an `AbstractEpochCallback` that save checkpoints of the model to disk. The checkpoints can be loaded back later on. # Arguments -* `prefix::AbstractString`: the prefix of the filenames to save the model. The model - architecture will be saved to prefix-symbol.json, while the weights will be saved - to prefix-0012.params, for example, for the 12-th epoch. -* `frequency::Int`: keyword argument, default 1. The frequency (measured in epochs) to - save checkpoints. +* `prefix::AbstractString`: the prefix of the filenames to save the model. + The model architecture will be saved to prefix-symbol.json, + while the weights will be saved to prefix-0012.params, + for example, for the 12-th epoch. +* `frequency::Int`: keyword argument, default is 1. + The frequency (measured in epochs) to save checkpoints. * `save_epoch_0::Bool`: keyword argument, default false. Whether we should save a - checkpoint for epoch 0 (model initialized but not seen any data yet). 
+ checkpoint for epoch 0 (model initialized but not seen any data yet). """ -function do_checkpoint(prefix::AbstractString; frequency::Int=1, save_epoch_0=false) +function do_checkpoint(prefix::AbstractString; + frequency::Int = 1, save_epoch_0::Bool = false) mkpath(dirname(prefix)) every_n_epoch(frequency, call_on_0=save_epoch_0) do model, state, metric save_checkpoint(model, prefix, state) diff --git a/src/executor.jl b/src/executor.jl index 26da87c69ac9..cd4a9256eeca 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -8,46 +8,49 @@ be carried out with an executor. mutable struct Executor handle :: MX_ExecutorHandle symbol :: SymbolicNode - arg_arrays :: Vector{NDArray} - grad_arrays :: Vector{Union{Void,NDArray}} - aux_arrays :: Vector{NDArray} - outputs :: Vector{NDArray} - arg_dict :: Dict{Base.Symbol, NDArray} - aux_dict :: Dict{Base.Symbol, NDArray} + arg_arrays :: VecOfNDArray + grad_arrays :: Vector{Union{Void,<:NDArray}} + aux_arrays :: VecOfNDArray + outputs :: VecOfNDArray + arg_dict :: Dict{Symbol} + aux_dict :: Dict{Symbol} end -function Executor(hdr :: MX_ExecutorHandle, symbol :: SymbolicNode, - arg_arrays :: Vector{NDArray}, grad_arrays :: Vector{Union{Void,NDArray}}, - aux_arrays :: Vector{NDArray}) + +function Executor(hdl::MX_ExecutorHandle, sym::SymbolicNode, + arg_arrays::VecOfNDArray, grad_arrays::AbstractVector, + aux_arrays::VecOfNDArray) # get output arrays ref_size = Ref{MX_uint}(0) - ref_hdrs = Ref{Ptr{MX_handle}}(0) + ref_hdls = Ref{Ptr{MX_handle}}(C_NULL) @mxcall(:MXExecutorOutputs, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_handle}}), - hdr, ref_size, ref_hdrs) - out_hdrs = unsafe_wrap(Array, ref_hdrs[], ref_size[]) + hdl, ref_size, ref_hdls) + out_hdrs = unsafe_wrap(Array, ref_hdls[], ref_size[]) out_arrays = [NDArray(MX_NDArrayHandle(x)) for x in out_hdrs] - arg_names = list_arguments(symbol) + arg_names = list_arguments(sym) @assert(length(arg_names) == length(unique(arg_names)), "Duplicated names in arguments: $arg_names") - arg_dict 
= Dict{Base.Symbol,NDArray}(zip(arg_names, arg_arrays)) + arg_dict = Dict(zip(arg_names, arg_arrays)) - aux_names = list_auxiliary_states(symbol) + aux_names = list_auxiliary_states(sym) @assert(length(aux_names) == length(unique(aux_names)), "Duplicated names in auxiliary states: $aux_names") - aux_dict = Dict{Base.Symbol,NDArray}(zip(aux_names, aux_arrays)) + aux_dict = Dict(zip(aux_names, aux_arrays)) - Executor(hdr, symbol, arg_arrays, grad_arrays, aux_arrays, out_arrays, arg_dict, aux_dict) + Executor(hdl, sym, arg_arrays, grad_arrays, aux_arrays, out_arrays, arg_dict, aux_dict) end -function Base.unsafe_convert(::Type{MX_handle}, obj::Executor) +Base.unsafe_convert(::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(MX_handle, obj.handle) -end Base.convert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) Base.cconvert(t::Type{MX_handle}, obj::Executor) = Base.unsafe_convert(t, obj) -function _get_ndarray_inputs(arg_key::AbstractString, args::Vector{NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) +function _get_ndarray_inputs(arg_key::AbstractString, args::VecOfNDArray, + arg_names::Vector{Symbol}, allow_missing::Bool) @assert(length(args) == length(arg_names), "Length of $arg_key does not match number of arguments") return (MX_handle[args...], args) end -function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Base.Symbol,NDArray}, arg_names::Vector{Base.Symbol}, allow_missing::Bool) + +function _get_ndarray_inputs(arg_key::AbstractString, args::Dict{Symbol}, + arg_names::Vector{Symbol}, allow_missing::Bool) args_vec = map(arg_names) do name arr = get(args, name, nothing) if !allow_missing @@ -75,16 +78,16 @@ Create an `Executor` by binding a `SymbolicNode` to concrete `NDArray`. * `ctx::Context`: the context on which the computation should run. * `args`: either a list of `NDArray` or a dictionary of name-array pairs. Concrete arrays for all the inputs in the network architecture. 
The inputs typically include - network parameters (weights, bias, filters, etc.), data and labels. See [`list_arguments`](@ref) - and [`infer_shape`](@ref). -* `args_grad`: -* `aux_states`: -* `grad_req`: + network parameters (weights, bias, filters, etc.), data and labels. + See [`list_arguments`](@ref) and [`infer_shape`](@ref). +* `args_grad`: a `Vector` of `NDArray` or a `Dict` contains `NDArray` +* `aux_states`: a `Vector` of `NDArray` or a `Dict` contains `NDArray` +* `grad_req`: single value, a `Vector` of `GRAD_REQ` or a `Dict{Symbol,GRAD_REQ}` """ -function bind(self :: SymbolicNode, ctx :: Context, args :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}}; - args_grad :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), - aux_states :: Union{Vector{NDArray},Dict{Base.Symbol,NDArray}} = Dict{Base.Symbol,NDArray}(), - grad_req :: Union{GRAD_REQ,Vector{GRAD_REQ},Dict{Base.Symbol,GRAD_REQ}} = GRAD_WRITE) +function bind(self::SymbolicNode, ctx::Context, args; + args_grad = Dict{Symbol,NDArray}(), + aux_states = Dict{Symbol,NDArray}(), + grad_req = GRAD_WRITE) arg_names = list_arguments(self) @@ -97,7 +100,7 @@ function bind(self :: SymbolicNode, ctx :: Context, args :: Union{Vector{NDArray elseif isa(grad_req, Vector{GRAD_REQ}) @assert(length(grad_req) == length(args)) reqs = MX_uint[grad_req...] - elseif isa(grad_req, Dict{Base.Symbol, GRAD_REQ}) + elseif isa(grad_req, Dict{Symbol, GRAD_REQ}) reqs = MX_uint[get(grad_req, name, GRAD_NOP) for name in arg_names] end @@ -111,20 +114,16 @@ function bind(self :: SymbolicNode, ctx :: Context, args :: Union{Vector{NDArray executor = Executor(MX_ExecutorHandle(ref_hdr[]), self, args, args_grad, aux_states) end -function bind(self :: SymbolicNode; kwargs...) + +function bind(x::SymbolicNode; context::Context = cpu(), kwargs...) 
kwargs = Dict(kwargs) @assert(haskey(kwargs, :args), "Must specify args") args = pop!(kwargs, :args) - if haskey(kwargs, :context) - context = pop!(kwargs, :context) - else - context = cpu() - end - bind(self, context, args; kwargs...) + bind(x, context, args; kwargs...) end -function simple_bind(self :: SymbolicNode, ctx :: Context; - grad_req :: Union{GRAD_REQ, Dict{Symbol, GRAD_REQ}}=GRAD_WRITE, +function simple_bind(self::SymbolicNode, ctx::Context; + grad_req::Union{GRAD_REQ,Dict{Symbol,GRAD_REQ}} = GRAD_WRITE, kwargs...) arg_shapes, out_shapes, aux_shapes = infer_shape(self; kwargs...) @assert(!isa(arg_shapes, Void), "Information not enough to perform complete shape inference") @@ -168,21 +167,15 @@ function forward(self::Executor; is_train::Bool = false, kwargs...) self.outputs end -function backward(self :: Executor) - backward(self, NDArray[]) -end -function backward(self :: Executor, out_grad :: NDArray) - backward(self, [out_grad]) -end -function backward(self :: Executor, out_grads :: Vector{NDArray}) - out_grads = MX_handle[out_grads...] 
- @mxcall(:MXExecutorBackward, (MX_handle, MX_uint, Ptr{MX_handle}), self, length(out_grads), out_grads) -end +backward(x::Executor) = backward(x, NDArray[]) +backward(x::Executor, out_grad::NDArray) = backward(x, [out_grad]) +backward(x::Executor, out_grads::VecOfNDArray) = + @mxcall(:MXExecutorBackward, (MX_handle, MX_uint, Ptr{MX_handle}), + x, length(out_grads), MX_handle[out_grads...]) - -function copy_params_from(self::Executor, arg_params::Dict{Base.Symbol,NDArray}, - aux_params::Union{Void,Dict{Base.Symbol,NDArray}}=nothing; - allow_extra_params::Bool=false) +function copy_params_from(self::Executor, arg_params::Dict{Symbol}, + aux_params::Dict{Symbol} = Dict{Symbol,Any}(); + allow_extra_params::Bool = false) for (name, array) in arg_params if haskey(self.arg_dict, name) copy!(self.arg_dict[name], array) @@ -191,13 +184,11 @@ function copy_params_from(self::Executor, arg_params::Dict{Base.Symbol,NDArray}, end end - if !isa(aux_params, Void) - for (name, array) in aux_params - if haskey(self.aux_dict, name) - copy!(self.aux_dict[name], array) - else - @assert(allow_extra_params, "Extra auxiliary state $name not recognized") - end + for (name, array) in aux_params + if haskey(self.aux_dict, name) + copy!(self.aux_dict[name], array) + else + @assert(allow_extra_params, "Extra auxiliary state $name not recognized") end end end diff --git a/src/io.jl b/src/io.jl index 2ba0bf78a584..597ea8a90c6e 100644 --- a/src/io.jl +++ b/src/io.jl @@ -113,24 +113,29 @@ function get_label end A basic subclass of `AbstractDataBatch`, that implement the interface by accessing member fields. 
""" -mutable struct DataBatch <: AbstractDataBatch - data :: Vector{NDArray} - label :: Vector{NDArray} +mutable struct DataBatch{T,S,N,M} <: AbstractDataBatch + data :: Vector{NDArray{T,N}} + label :: Vector{NDArray{S,M}} count :: Int end -count_samples(batch :: DataBatch) = batch.count -get_data(::Provider, batch :: DataBatch) where {Provider<:AbstractDataProvider} = batch.data -get_label(::Provider, batch :: DataBatch) where {Provider<:AbstractDataProvider} = batch.label + +count_samples(batch::DataBatch) = batch.count + +get_data(::Provider, batch::DataBatch) where {Provider<:AbstractDataProvider} = + batch.data + +get_label(::Provider, batch::DataBatch) where {Provider<:AbstractDataProvider} = + batch.label """ SlicedNDArray A alias type of `Tuple{UnitRange{Int},NDArray}`. """ -const SlicedNDArray = Tuple{UnitRange{Int},NDArray} +const SlicedNDArray = Tuple{UnitRange{Int},<:NDArray} function _load_general!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, - targets :: Vector{Vector{SlicedNDArray}}, loader::Function) + targets :: Vector{<:Vector{<:SlicedNDArray}}, loader::Function) data = loader(provider, batch) for (d_src, d_targets) in zip(data, targets) for (slice_idx, d_dst) in d_targets @@ -157,7 +162,7 @@ This utility function is used in data parallelization, where a mini-batch is spl and computed on several different devices. """ function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, - targets :: Vector{Vector{SlicedNDArray}}) + targets :: Vector{<:Vector{<:SlicedNDArray}}) _load_general!(provider, batch, targets, get_data) end @@ -171,16 +176,18 @@ end The same as [`load_data!`](@ref), except that this is for loading labels. 
""" function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, - targets :: Vector{Vector{SlicedNDArray}}) + targets :: Vector{<:Vector{<:SlicedNDArray}}) _load_general!(provider, batch, targets, get_label) end -function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{NDArray}) +function load_data!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, + targets :: Vector{<:NDArray}) for (src, dst) in zip(get_data(provider, batch), targets) copy!(dst, src) end end -function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, targets :: Vector{NDArray}) +function load_label!(provider :: AbstractDataProvider, batch :: AbstractDataBatch, + targets :: Vector{<:NDArray}) for (src, dst) in zip(get_label(provider, batch), targets) copy!(dst, src) end @@ -198,7 +205,7 @@ import Base.get Returns the corresponding data array corresponding to that name. """ -function get(provider :: AbstractDataProvider, batch :: AbstractDataBatch, name :: Base.Symbol) +function get(provider::AbstractDataProvider, batch::AbstractDataBatch, name::Symbol) for (idx, (k, s)) in enumerate(provide_data(provider)) if name == k return get_data(provider, batch)[idx] @@ -216,20 +223,20 @@ end eachbatch(provider::AbstractDataProvider) Allows you to perform operations on data every epoch. This is especially useful -when you need to perform real-time augmentation of the data. +when you need to perform real-time augmentation of the data. # Arguments: * `provider`: an instance of the custom DataProvider type. You must return this instance after modifying its fields. """ -eachbatch(provider :: AbstractDataProvider) = provider +eachbatch(provider::AbstractDataProvider) = provider """ ArrayDataProvider A convenient tool to iterate `NDArray` or Julia `Array`. - + ArrayDataProvider(data[, label]; batch_size, shuffle, data_padding, label_padding) Construct a data provider from `NDArray` or Julia Arrays. 
@@ -252,19 +259,19 @@ Construct a data provider from `NDArray` or Julia Arrays. TODO: remove `data_padding` and `label_padding`, and implement rollover that copies the last or first several training samples to feed the padding. """ -mutable struct ArrayDataProvider <: AbstractDataProvider - data_arrays :: Vector{Array} - data_names :: Vector{Base.Symbol} - label_arrays :: Vector{Array} - label_names :: Vector{Base.Symbol} +mutable struct ArrayDataProvider{T,N} <: AbstractDataProvider + data_arrays :: Vector{Array{T,N}} + data_names :: Vector{Symbol} + label_arrays + label_names :: Vector{Symbol} batch_size :: Int sample_count :: Int shuffle :: Bool data_padding :: MX_float label_padding :: MX_float - data_batch :: Vector{NDArray} - label_batch :: Vector{NDArray} + data_batch + label_batch end # Julia's type system is sometimes very frustrating. You cannot specify a function @@ -273,10 +280,14 @@ end # results, about the parametric type in the Pair{T1,T2} type, thus does not match the # generic Pair type. In general, Int <: Number but Vector{Int} <: Vector{Number} is not # true. So let us just use Any here... 
-function ArrayDataProvider(data::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) - ArrayDataProvider(data, [], batch_size=batch_size, shuffle=shuffle, data_padding=data_padding, label_padding=label_padding) +function ArrayDataProvider(data; batch_size::Int = 0, shuffle::Bool = false, + data_padding::Real = 0, label_padding::Real = 0) + ArrayDataProvider(data, [], batch_size = batch_size, shuffle = shuffle, + data_padding = data_padding, label_padding = label_padding) end -function ArrayDataProvider(data::Any, label::Any; batch_size::Int=0, shuffle::Bool=false, data_padding::Real=0, label_padding::Real=0) + +function ArrayDataProvider(data, label; batch_size::Int = 0, shuffle::Bool = false, + data_padding::Real = 0, label_padding::Real = 0) asarr(arr :: Array{T}) where {T} = convert(Array{MX_float}, arr) asarr(arr :: NDArray) = copy(arr) @@ -349,16 +360,15 @@ function ArrayDataProvider(data::Any, label::Any; batch_size::Int=0, shuffle::Bo end ArrayDataProvider(data_arrays, data_names, label_arrays, label_names, batch_size, - sample_count, shuffle, data_padding, label_padding, data_batch, label_batch) + sample_count, shuffle, MX_float(data_padding), MX_float(label_padding), + data_batch, label_batch) end -function provide_data(provider::ArrayDataProvider) - return collect(zip(provider.data_names, map(size, provider.data_batch))) -end +provide_data(provider::ArrayDataProvider) = + collect(zip(provider.data_names, map(size, provider.data_batch))) -function provide_label(provider::ArrayDataProvider) - return collect(zip(provider.label_names, map(size, provider.label_batch))) -end +provide_label(provider::ArrayDataProvider) = + collect(zip(provider.label_names, map(size, provider.label_batch))) get_batch_size(provider::ArrayDataProvider) = provider.batch_size @@ -366,9 +376,7 @@ struct ArrayDataProviderState <: AbstractDataProviderState curr_idx :: Int end -function Base.eltype(provider :: ArrayDataProvider) - 
ArrayDataProviderState -end +Base.eltype(provider :: ArrayDataProvider) = ArrayDataProviderState function Base.start(provider :: ArrayDataProvider) if provider.shuffle @@ -381,9 +389,8 @@ function Base.start(provider :: ArrayDataProvider) return ArrayDataProviderState(1) end -function Base.done(provider::ArrayDataProvider, state :: ArrayDataProviderState) - return state.curr_idx > provider.sample_count -end +Base.done(provider::ArrayDataProvider, state::ArrayDataProviderState) = + state.curr_idx > provider.sample_count struct ArrayDataBatch <: AbstractDataBatch idx :: UnitRange{Int} @@ -425,8 +432,8 @@ a list of built-in data iterators. """ mutable struct MXDataProvider <: AbstractDataProvider handle :: MX_DataIterHandle - data_shape :: Vector{Tuple{Base.Symbol, Tuple}} - label_shape:: Vector{Tuple{Base.Symbol, Tuple}} + data_shape :: Vector{Tuple{Symbol,Tuple}} + label_shape:: Vector{Tuple{Symbol,Tuple}} batch_size :: Int # those two a auxiliary variables to help avoid calling reset @@ -455,8 +462,8 @@ function _get_label(handle :: MX_DataIterHandle) end function MXDataProvider(handle :: MX_DataIterHandle; - data_name :: Base.Symbol=:data, - label_name :: Union{Base.Symbol,Void}=:softmax_label, + data_name :: Symbol = :data, + label_name :: Union{Symbol,Void} = :softmax_label, kwargs...) 
# for convenience, we ignore the rest keyword arguments # init iterator, load the first batch and get shapes @assert(_iter_next(handle), "Failed to load the first batch in MXDataProvider") @@ -569,7 +576,7 @@ function _define_data_iter_creator(hdr :: MX_handle) isprovider = endswith(string(iter_name), "Iter") signature = _format_signature(Int(ref_narg[]), ref_arg_names) f_desc = " " * string(iter_name) * "(" *signature * ")\n\n" - if isprovider + if isprovider f_desc *= "Can also be called with the alias `$(string(iter_name)[1:end-4] * "Provider")`.\n" end f_desc *= unsafe_string(ref_desc[]) * "\n\n" diff --git a/src/kvstore.jl b/src/kvstore.jl index 1ac56260b401..fa4768cceaf7 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -3,10 +3,10 @@ mutable struct KVStore updater_c :: Ptr{Void} updater :: Function - KVStore(hdr :: MX_KVStoreHandle) = new(hdr, Ptr{Void}(0)) + KVStore(hdr::MX_KVStoreHandle) = new(hdr, Ptr{Void}(0)) end -function KVStore(kv_type::Base.Symbol = :local) +function KVStore(kv_type::Symbol = :local) #@assert(kv_type ∈ [:local]) # TODO: update with allowed types ref_hdr = Ref{MX_handle}(0) @@ -20,7 +20,7 @@ end Base.convert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) Base.cconvert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) -function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) +function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{<:Vector{<:NDArray}}) @assert length(keys) == length(vals) keys_flt = Int[] vals_flt = NDArray[] @@ -31,16 +31,15 @@ function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) return (keys_flt, vals_flt) end -function init!(self :: KVStore, key :: Int, val :: NDArray) - init!(self, [key], [val]) -end -function init!(self :: KVStore, key :: Int, vals :: Vector{NDArray}) - init!(self, Base.ones(Int, length(vals))*key, vals) -end -function init!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}) 
+init!(self::KVStore, key::Int, val::NDArray) = init!(self, [key], [val]) + +init!(self::KVStore, key::Int, vals::Vector{<:NDArray}) = + init!(self, Base.ones(Int, length(vals)) * key, vals) + +init!(self::KVStore, keys::Vector{Int}, vals::Vector{<:Vector{<:NDArray}}) = init!(self, _flatten_kvlist(keys, vals)...) -end -function init!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{NDArray}) + +function init!(self::KVStore, keys::Vector{Int}, vals::Vector{<:NDArray}) @assert length(keys) == length(vals) keys = Cint[keys...] vals = MX_handle[vals...] @@ -52,13 +51,14 @@ import Base.push! function push!(self :: KVStore, key :: Int, val :: NDArray; priority :: Int = 0) push!(self, [key], [val]; priority = priority) end -function push!(self :: KVStore, key :: Int, vals :: Vector{NDArray}; priority :: Int = 0) +function push!(self :: KVStore, key :: Int, vals :: Vector{<:NDArray}; priority :: Int = 0) push!(self, Base.ones(Int, length(vals))*key, vals; priority = priority) end -function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{Vector{NDArray}}; priority::Int=0) +function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{<:Vector{<:NDArray}}; + priority::Int=0) push!(self, _flatten_kvlist(keys, vals)...; priority = priority) end -function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{NDArray}; priority::Int=0) +function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{<:NDArray}; priority::Int=0) @assert length(keys) == length(vals) keys = Cint[keys...] vals = MX_handle[vals...] 
@@ -69,13 +69,13 @@ end function pull!(self :: KVStore, key :: Int, out :: NDArray; priority :: Int = 0) pull!(self, [key], [out]) end -function pull!(self :: KVStore, key :: Int, outs :: Vector{NDArray}; priority :: Int = 0) +function pull!(self :: KVStore, key :: Int, outs :: Vector{<:NDArray}; priority :: Int = 0) pull!(self, Base.ones(Int, length(outs))*key, outs; priority = priority) end -function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{Vector{NDArray}}; priority::Int=0) +function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{<:Vector{<:NDArray}}; priority::Int=0) pull!(self, _flatten_kvlist(keys, outs)...; priority = priority) end -function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{NDArray}; priority::Int=0) +function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{<:NDArray}; priority::Int=0) @assert length(keys) == length(outs) keys = Cint[keys...] outs = MX_handle[outs...] diff --git a/src/metric.jl b/src/metric.jl index db38060c933e..3998af8efb8c 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -14,7 +14,7 @@ abstract type AbstractEvalMetric end hasNDArraySupport(metric) -> Val{true/false} Trait for `_update_single_output` should return `Val{true}() if metric can handle `NDArray` -directly and `Val{false}()i` if requires `Array`. Metric that work with NDArrays can be +directly and `Val{false}()` if requires `Array`. Metric that work with NDArrays can be async, while native Julia arrays require that we copy the output of the network, which is a blocking operation. """ @@ -30,11 +30,12 @@ Update and accumulate metrics. * `labels::Vector{NDArray}`: the labels from the data provider. * `preds::Vector{NDArray}`: the outputs (predictions) of the network. 
""" -function update!(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}) where T <: AbstractEvalMetric +function update!(metric::T, labels::VecOfNDArray, preds::VecOfNDArray) where T <: AbstractEvalMetric _update!(metric, labels, preds, hasNDArraySupport(metric)) end -function _update!(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}, :: Val{true}) where T<: AbstractEvalMetric +function _update!(metric::T, labels::VecOfNDArray, preds::VecOfNDArray, + ::Val{true}) where T<: AbstractEvalMetric if length(labels) != length(preds) Base.warn_once( "The number of labels ($(length(labels))) does not correspond to the\ @@ -45,7 +46,8 @@ function _update!(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArra end end -function _update!(metric :: T, labels :: Vector{NDArray}, preds :: Vector{NDArray}, :: Val{false}) where T<: AbstractEvalMetric +function _update!(metric::T, labels::VecOfNDArray, preds::VecOfNDArray, + ::Val{false}) where T<: AbstractEvalMetric if length(labels) != length(preds) Base.warn_once( "The number of labels ($(length(labels))) does not correspond to the\ @@ -65,9 +67,7 @@ end Reset the accumulation counter. """ -function reset!(metric :: AbstractEvalMetric) - throw(MethodError(reset!, (typeof(metric),))) -end +reset!(metric::AbstractEvalMetric) = throw(MethodError(reset!, (typeof(metric),))) import Base: get @@ -79,9 +79,7 @@ Get the accumulated metrics. Returns `Vector{Tuple{Base.Symbol, Real}}`, a list of name-value pairs. For example, `[(:accuracy, 0.9)]`. """ -function get(metric :: AbstractEvalMetric) - throw(MethodError(get, (typeof(metric),))) -end +get(metric::AbstractEvalMetric) = throw(MethodError(get, (typeof(metric),))) """ NullMetric() @@ -91,17 +89,11 @@ A metric that calculates nothing. 
Can be used to ignore an output during trainin mutable struct NullMetric <: mx.AbstractEvalMetric end -function update!(metric :: NullMetric, labels :: Vector{NDArray}, preds :: Vector{NDArray}) - return nothing -end +update!(metric::NullMetric, labels::VecOfNDArray, preds::VecOfNDArray) = nothing -function reset!(metric :: NullMetric) - return nothing -end +reset!(metric::NullMetric) = nothing -function get(metric :: NullMetric) - return Tuple{Symbol, Float64}[] -end +get(metric::NullMetric) = Tuple{Symbol, Float64}[] """ MultiMetric(metrics::Vector{AbstractEvalMetric}) @@ -118,21 +110,19 @@ mutable struct MultiMetric <: mx.AbstractEvalMetric metrics :: Vector{mx.AbstractEvalMetric} end -function update!(metric :: MultiMetric, labels :: Vector{NDArray}, preds :: Vector{NDArray}) +function update!(metric :: MultiMetric, labels :: Vector{<:NDArray}, preds :: Vector{<:NDArray}) for m in metric.metrics update!(m, labels, preds) end - return nothing + nothing end function reset!(metric :: MultiMetric) map(reset!, metric.metrics) - return nothing + nothing end -function get(metric :: MultiMetric) - mapreduce(get, append!, metric.metrics) -end +get(metric :: MultiMetric) = mapreduce(get, append!, metric.metrics) """ SeqMetric(metrics::Vector{AbstractEvalMetric}) @@ -150,23 +140,21 @@ mutable struct SeqMetric <: mx.AbstractEvalMetric metrics :: Vector{mx.AbstractEvalMetric} end -function update!(metric :: SeqMetric, labels :: Vector{NDArray}, preds :: Vector{NDArray}) +function update!(metric::SeqMetric, labels::VecOfNDArray, preds::VecOfNDArray) @assert length(metric.metrics) == length(labels) @assert length(metric.metrics) == length(preds) for (m, l, p) in zip(metric.metrics, labels, preds) update!(m, [l], [p]) end - return nothing + nothing end -function reset!(metric :: SeqMetric) +function reset!(metric::SeqMetric) map(reset!, metric.metrics) - return nothing + nothing end -function get(metric :: SeqMetric) - mapreduce(get, append!, metric.metrics) -end 
+get(metric::SeqMetric) = mapreduce(get, append!, metric.metrics) """ Accuracy @@ -185,7 +173,7 @@ end hasNDArraySupport(::Accuracy) = Val{false}() -function _update_single_output(metric :: Accuracy, label :: Array, pred :: Array) +function _update_single_output(metric::Accuracy, label::Array, pred::Array) # Samples are stored in the last dimension @assert size(label, ndims(label)) == size(pred, ndims(pred)) @@ -217,9 +205,7 @@ function _update_single_output(metric :: Accuracy, label :: Array, pred :: Array end end -function get(metric :: Accuracy) - return [(:accuracy, metric.acc_sum / metric.n_sample)] -end +get(metric::Accuracy) = [(:accuracy, metric.acc_sum / metric.n_sample)] function reset!(metric :: Accuracy) metric.acc_sum = 0.0 @@ -235,31 +221,34 @@ Calculates the mean squared error regression loss. Requires that label and prediction have the same shape. """ -mutable struct MSE <: AbstractEvalMetric - mse_sum :: Vector{NDArray} +mutable struct MSE{N} <: AbstractEvalMetric + mse_sum :: Vector{NDArray{MX_float,N}} n_sample :: Int - MSE() = new(Vector{NDArray}(), 0) + MSE{N}() where {N} = new(Vector{NDArray{MX_float,N}}(), 0) end +MSE() = MSE{1}() # backward compat? 
+ hasNDArraySupport(::MSE) = Val{true}() -function _update_single_output(metric :: MSE, label :: NDArray, pred :: NDArray) +function _update_single_output(metric::MSE, label::NDArray{T,N}, + pred::NDArray{T,N}) where {T,N} @assert size(label) == size(pred) metric.n_sample += length(label) - mse_sum = mx.sum(mx._PowerScalar(label - pred,scalar=2)) + mse_sum = mx.sum((label .- pred).^2) push!(metric.mse_sum, mse_sum) - return nothing + nothing end -function get(metric :: MSE) +function get(metric::MSE) # Delay copy until last possible moment mse_sum = mapreduce(nda->copy(nda)[1], +, 0.0, metric.mse_sum) - return [(:MSE, mse_sum / metric.n_sample)] + [(:MSE, mse_sum / metric.n_sample)] end -function reset!(metric :: MSE) - metric.mse_sum = Vector{NDArray}() +function reset!(metric::MSE{N}) where N + metric.mse_sum = Vector{NDArray{Float32,N}}() metric.n_sample = 0 end @@ -319,7 +308,7 @@ end hasNDArraySupport(::NMSE) = Val{false}() -function _update_single_output(metric :: NMSE, label :: Array, pred :: Array) +function _update_single_output(metric::NMSE, label::Array, pred::Array) n_sample = size(pred)[end] metric.n_sample += n_sample @@ -332,11 +321,9 @@ function _update_single_output(metric :: NMSE, label :: Array, pred :: Array) end end -function get(metric :: NMSE) - return [(:NMSE, metric.nmse_sum / metric.n_sample)] -end +get(metric::NMSE) = [(:NMSE, metric.nmse_sum / metric.n_sample)] -function reset!(metric :: NMSE) +function reset!(metric::NMSE) metric.nmse_sum = 0.0 metric.n_sample = 0 end @@ -357,11 +344,9 @@ mutable struct ACE <: AbstractEvalMetric ACE(eps=1.0e-8) = new(0.0, 0, eps) end -function get(metric :: ACE) - return [(:ACE, - metric.ace_sum / metric.n_sample)] -end +get(metric::ACE) = [(:ACE, - metric.ace_sum / metric.n_sample)] -function reset!(metric :: ACE) +function reset!(metric::ACE) metric.ace_sum = 0.0 metric.n_sample = 0 end @@ -474,4 +459,3 @@ function _update_single_output(metric :: MultiACE, label :: Array{T}, pred :: Ar error("Can't 
handle prediction with dimensions $(ndims(pred)).") end end - diff --git a/src/model.jl b/src/model.jl index 44a2ba755798..06b7a2cf8a13 100644 --- a/src/model.jl +++ b/src/model.jl @@ -18,14 +18,14 @@ mutable struct FeedForward <: AbstractModel arch :: SymbolicNode ctx :: Vector{Context} - arg_params :: Dict{Base.Symbol, NDArray} - aux_params :: Dict{Base.Symbol, NDArray} + arg_params :: Dict{Symbol} + aux_params :: Dict{Symbol} - pred_exec :: Union{Executor, Void} + pred_exec :: Union{Executor,Void} # leave the rest fields undefined - FeedForward(arch :: SymbolicNode, ctx :: Vector{Context}) = new(arch, ctx) - FeedForward(arch :: SymbolicNode, ctx :: Context) = new(arch, [ctx]) + FeedForward(arch::SymbolicNode, ctx::Vector{Context}) = new(arch, ctx) + FeedForward(arch::SymbolicNode, ctx::Context) = new(arch, [ctx]) end """ @@ -33,7 +33,7 @@ Get a split of `batch_size` into `n_split` pieces for data parallelization. Retu of length `n_split`, with each entry a `UnitRange{Int}` indicating the slice index for that piece. """ -function _split_inputs(batch_size :: Int, n_split :: Int) +function _split_inputs(batch_size::Int, n_split::Int) @assert(batch_size >= n_split) per_split = floor(Int, batch_size / n_split) counts = Base.zeros(Int, n_split)+per_split @@ -73,7 +73,7 @@ weights. * `input_shapes`: the shape of all data and label inputs to this model, given as keyword arguments. For example, `data=(28,28,1,100), label=(100,)`. """ -function init_model(self :: FeedForward, initializer :: AbstractInitializer; overwrite::Bool=false, input_shapes...) +function init_model(self::FeedForward, initializer::AbstractInitializer; overwrite::Bool=false, input_shapes...) 
# all arg names, including data, label, and parameters arg_names = list_arguments(self.arch) @@ -92,8 +92,8 @@ function init_model(self :: FeedForward, initializer :: AbstractInitializer; ove self.aux_params = Dict{Symbol, NDArray}() end - arg_params = Dict{Symbol, NDArray}() - aux_params = Dict{Symbol, NDArray}() + arg_params = Dict{Symbol,NDArray}() + aux_params = Dict{Symbol,NDArray}() for (name, shape) in filter(x -> in(x[1],param_names), zip(arg_names, arg_shapes)) if haskey(self.arg_params, name) @@ -138,7 +138,7 @@ function init_model(self :: FeedForward, initializer :: AbstractInitializer; ove return (arg_names, param_names, aux_names) end -function _setup_predictor(self :: FeedForward, overwrite :: Bool=false; verbosity :: Integer = 1, data_shapes...) +function _setup_predictor(self::FeedForward, overwrite::Bool=false; verbosity::Integer = 1, data_shapes...) if !isdefined(self, :pred_exec) || isa(self.pred_exec, Void) || overwrite if !isdefined(self, :arg_params) || !isdefined(self, :aux_params) @assert(false, "Model weights not defined, please init or train the model, or load from file") @@ -202,12 +202,12 @@ end See also [`train`](@ref), [`fit`](@ref), [`init_model`](@ref), and [`load_checkpoint`](@ref) """ -function predict(callback :: Function, self :: FeedForward, data :: AbstractDataProvider; - overwrite :: Bool = true, verbosity :: Integer = 1) +function predict(callback::Function, self::FeedForward, data::AbstractDataProvider; + overwrite::Bool = true, verbosity::Integer = 1) predict(self, data; overwrite = overwrite, callback=callback, verbosity = verbosity) end -function predict(self :: FeedForward, data :: AbstractDataProvider; - overwrite::Bool=true, callback::Union{Function,Void}=nothing, verbosity :: Integer = 1) +function predict(self::FeedForward, data::AbstractDataProvider; + overwrite::Bool = true, callback::Union{Function,Void}=nothing, verbosity::Integer = 1) data_shapes = provide_data(data) data_names = [x[1] for x in data_shapes] 
_setup_predictor(self, overwrite; verbosity = verbosity, data_shapes...) @@ -255,11 +255,13 @@ function predict(self :: FeedForward, data :: AbstractDataProvider; return output_arrays end -function _init_model(self :: FeedForward, data :: AbstractDataProvider, initializer :: AbstractInitializer, overwrite :: Bool) - init_model(self, initializer; overwrite=overwrite, [provide_data(data)..., provide_label(data)...]...) +function _init_model(self::FeedForward, data::AbstractDataProvider, + initializer::AbstractInitializer, overwrite::Bool) + init_model(self, initializer; overwrite=overwrite, + [provide_data(data)..., provide_label(data)...]...) end -function _create_kvstore(kv_type :: Base.Symbol, num_device :: Int, arg_params :: Dict{Base.Symbol,NDArray}, verbosity :: Int) +function _create_kvstore(kv_type::Symbol, num_device::Int, arg_params::Dict{Symbol}, verbosity::Int) if num_device == 1 && !ismatch(r"dist", string(kv_type)) return nothing else @@ -281,7 +283,7 @@ end n_epoch :: Int = 10, eval_data :: Union{Void, AbstractDataProvider} = nothing, eval_metric :: AbstractEvalMetric = Accuracy(), - kvstore :: Union{Base.Symbol, KVStore} = :local, + kvstore :: Union{Symbol, KVStore} = :local, force_init :: Bool = false, callbacks :: Vector{AbstractCallback} = AbstractCallback[], verbosity :: Int = 3 @@ -289,7 +291,7 @@ end function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, state::OptimizationState, type_filter::Type; - metric::Vector{Tuple{Base.Symbol, T}} = Vector{Tuple{Base.Symbol, Real}}()) where T<:Real + metric::Vector{Tuple{Symbol,T}} = Vector{Tuple{Symbol,Real}}()) where T<:Real map(callbacks) do cb if isa(cb, type_filter) if type_filter == AbstractEpochCallback @@ -327,7 +329,7 @@ Train the `model` on `data` with the `optimizer`. calculated on the validation set. * `kvstore`: keyword argument, default `:local`. The key-value store used to synchronize gradients and parameters when multiple devices are used for training. 
- :type kvstore: `KVStore` or `Base.Symbol` + :type kvstore: `KVStore` or `Symbol` * `initializer::AbstractInitializer`: keyword argument, default `UniformInitializer(0.01)`. * `force_init::Bool`: keyword argument, default false. By default, the random initialization using the provided `initializer` will be skipped if the model weights already exists, maybe from a previous @@ -342,7 +344,8 @@ Train the `model` on `data` with the `optimizer`. - `2`: Print one time messages and a message at the start of each epoch - `3`: Print a summary of the training and validation accuracy for each epoch """ -function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) +function fit(self::FeedForward, optimizer::AbstractOptimizer, data::AbstractDataProvider; + kwargs...) opts = TrainingOptions(; kwargs...) opts.verbosity >= 1 && info("Start training on $(self.ctx)") @@ -357,7 +360,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra # setup kvstore kvstore = opts.kvstore - if isa(kvstore, Base.Symbol) + if isa(kvstore, Symbol) opts.verbosity >= 2 && info("Creating KVStore...") kvstore = _create_kvstore(kvstore, length(self.ctx), self.arg_params, opts.verbosity) end @@ -379,7 +382,7 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra freeze_idx = filter(i -> in(param_names[i], freeze_names), 1:length(param_names)) # Setup grad_req as a dictionary - grad_req = Dict{Symbol, GRAD_REQ}() + grad_req = Dict{Symbol,GRAD_REQ}() for param in param_names if in(param, freeze_names) grad_req[param] = GRAD_NOP @@ -581,24 +584,26 @@ function fit(self :: FeedForward, optimizer :: AbstractOptimizer, data :: Abstra nothing end -function save_checkpoint(self :: FeedForward, prefix :: AbstractString, state :: OptimizationState) +save_checkpoint(self::FeedForward, prefix::AbstractString, state::OptimizationState) = save_checkpoint(self.arch, self.arg_params, self.aux_params, prefix, 
state.curr_epoch) -end -function save_checkpoint(sym :: SymbolicNode, arg_params :: Dict{Base.Symbol, NDArray}, - aux_params :: Dict{Base.Symbol, NDArray}, prefix :: AbstractString, epoch :: Int) + +function save_checkpoint(sym::SymbolicNode, arg_params::Dict{Symbol}, + aux_params::Dict{Symbol}, prefix::AbstractString, epoch::Int) save("$prefix-symbol.json", sym) - save_dict = merge(Dict{Base.Symbol, NDArray}(map((x) -> Symbol("arg:$(x[1])") => x[2], arg_params)), - Dict{Base.Symbol, NDArray}(map((x) -> Symbol("aux:$(x[1])") => x[2], aux_params))) + save_dict = Dict{Symbol, NDArray}(map((x) -> Symbol("arg:$(x[1])") => x[2], arg_params)) + if !isempty(aux_params) + merge!(save_dict, Dict(map((x) -> Symbol("aux:$(x[1])") => x[2], aux_params))) + end save_filename = format("{1}-{2:04d}.params", prefix, epoch) save(save_filename, save_dict) info("Saved checkpoint to '$save_filename'") end -function load_checkpoint(prefix :: AbstractString, epoch :: Int) +function load_checkpoint(prefix::AbstractString, epoch::Int) arch = load("$prefix-symbol.json", SymbolicNode) saved_dict = load(format("{1}-{2:04d}.params", prefix, epoch), NDArray) - arg_params = Dict{Base.Symbol, NDArray}() - aux_params = Dict{Base.Symbol, NDArray}() + arg_params = Dict{Symbol,Any}() + aux_params = Dict{Symbol,Any}() for (k,v) in saved_dict tp, name = split(string(k), ':') name = Symbol(name) @@ -617,7 +622,7 @@ end Load a mx.FeedForward model from the checkpoint *prefix*, *epoch* and optionally provide a context. 
""" -function load_checkpoint(prefix :: AbstractString, epoch :: Int, ::Type{FeedForward}; context = nothing) +function load_checkpoint(prefix::AbstractString, epoch::Int, ::Type{FeedForward}; context = nothing) arch, arg_params, aux_params = load_checkpoint(prefix, epoch) model = FeedForward(arch, context = context) model.arg_params = arg_params @@ -625,8 +630,8 @@ function load_checkpoint(prefix :: AbstractString, epoch :: Int, ::Type{FeedForw return model end -function load_checkpoint(self :: FeedForward, prefix :: AbstractString, epoch :: Int; - overwrite :: Bool = true, allow_different_arch :: Bool = false) +function load_checkpoint(self::FeedForward, prefix::AbstractString, epoch::Int; + overwrite::Bool = true, allow_different_arch::Bool = false) if isdefined(self, :arg_params) && isdefined(self, :aux_params) && !overwrite info("model weights already exists, skip loading... (call with overwrite=true if needed)") return self diff --git a/src/ndarray.jl b/src/ndarray.jl index 9bb74f83f5d2..1a2ffa280d58 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -3,7 +3,7 @@ const DType = Union{Float32, Float64, Float16, UInt8, Int32, Int8, Int64} @enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 kInt8 kInt64 const DEFAULT_DTYPE = Float32 # MSHADOW_DEFAULT_DTYPE -function toTypeFlag(:: Type{T}) where T <: DType +function toTypeFlag(T::Type{<:DType}) if T == Float32 return kFloat32 elseif T == Float64 @@ -23,7 +23,7 @@ function toTypeFlag(:: Type{T}) where T <: DType end end -function fromTypeFlag(T :: TypeFlag) +function fromTypeFlag(T::TypeFlag) if T == kFloat32 return Float32 elseif T == kFloat64 @@ -89,19 +89,21 @@ of tensor-based computation. C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory have shape (28,28,1,100). 
""" -mutable struct NDArray +mutable struct NDArray{T,D} handle :: MX_NDArrayHandle writable :: Bool - function NDArray(handle, writable=true) - new(handle, writable) - end + NDArray{T,D}(handle, writable = true) where {T,D} = new(handle, writable) end NDArray(x::AbstractArray{T}) where {T<:DType} = copy(collect(x), cpu()) NDArray(x::Array{T}) where {T<:DType} = copy(x, cpu()) +NDArray(handle, writable = true) = + NDArray{eltype(handle), ndims(handle)}(handle, writable) +# type aliases const NDArrayOrReal = Union{NDArray, Real} +const VecOfNDArray = AbstractVector{<:NDArray} @unfuse NDArray @@ -112,15 +114,15 @@ end # for REPL function Base.show(io::IO, ::MIME{Symbol("text/plain")}, x::NDArray) - println(io, "$(join(size(x), "×")) mx.NDArray{$(eltype(x))} @ $(context(x)):") - Base.showarray(io, try_get_shared(x, sync = :read), false, header = false) + type_ = split(string(typeof(x)), '.', limit=2)[end] + println(io, "$(join(size(x), "×")) $(type_) @ $(context(x)):") + Base.showarray(io, try_get_shared(x, sync = :read), false, header=false) end -function Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) +Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(MX_handle, obj.handle) -end -Base.convert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) -Base.cconvert(t::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(t, obj) +Base.convert(T::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(T, obj) +Base.cconvert(T::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(T, obj) ################################################################################ # NDArray functions exported to the users @@ -140,21 +142,15 @@ end """ - empty(DType, shape :: Tuple, ctx :: Context) - empty(DType, shape :: Tuple) + empty(DType, dims[, ctx::Context = cpu()]) + empty(DType, dims) empty(DType, dim1, dim2, ...) Allocate memory for an uninitialized `NDArray` with a specified type. 
""" -function empty(::Type{T}, shape :: NTuple{N, Int}) where {N,T<:DType} - empty(T, shape, cpu()) -end -function empty(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) where {N,T<:DType} - NDArray(_ndarray_alloc(T, shape, ctx, false)) -end -function empty(:: Type{T}, shape :: Int...) where T<:DType - empty(T, shape) -end +empty(::Type{T}, dims::NTuple{N, Int}, ctx::Context = cpu()) where {N,T<:DType} = + NDArray{T, N}(_ndarray_alloc(T, dims, ctx, false)) +empty(::Type{T}, dims::Int...) where {T<:DType} = empty(T, dims) """ empty(shape :: Tuple, ctx :: Context) @@ -173,54 +169,39 @@ function empty(shape :: Int...) empty(shape) end -import Base.similar - """ - similar(arr :: NDArray) + similar(x::NDArray) -Create an `NDArray` with similar shape, data type, and context with the given one. +Create an `NDArray` with similar shape, data type, +and context with the given one. +Note that the returned `NDArray` is uninitialized. """ -function similar(arr :: NDArray) - empty(eltype(arr), size(arr), context(arr)) -end +Base.similar(x::NDArray{T}) where {T} = empty(T, size(x), context(x)) """ - zeros(DType, shape :: Tuple, ctx :: Context) - zeros(DType, shape :: Tuple) - zeros(DType, dim1, dim2, ...) + zeros(DType, dims[, ctx::Context = cpu()]) + zeros(DType, dims...) -Create zero-ed `NDArray` with specific shape and type +Create zero-ed `NDArray` with specific shape and type. """ -function zeros(:: Type{T}, shape :: NTuple{N, Int}) where {N,T<:DType} - zeros(T, shape, cpu()) -end -function zeros(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) where {N,T<:DType} - arr = empty(T, shape, ctx) +function zeros(::Type{T}, dims::NTuple{N, Int}, ctx::Context = cpu()) where {N,T<:DType} + arr = empty(T, dims, ctx) arr[:] = zero(T) - return arr -end -function zeros(:: Type{T}, shape :: Int...) where T<:DType - zeros(T, shape) + arr end +zeros(::Type{T}, dims::Int...) 
where {T<:DType} = zeros(T, dims) + """ - zeros(shape :: Tuple, ctx :: Context) - zeros(shape :: Tuple) - zeros(dim1, dim2, ...) + zeros(dims[, ctx::Context = cpu()]) + zeros(dims...) Create zero-ed `NDArray` with specific shape. """ -function zeros(shape :: NTuple{N, Int}) where N - zeros(shape, cpu()) -end -function zeros(shape :: NTuple{N, Int}, ctx :: Context) where N - arr = empty(shape, ctx) - arr[:] = 0 - return arr -end -function zeros(shape :: Int...) - zeros(shape) -end +zeros(dims::NTuple{N, Int}, ctx::Context = cpu()) where N = + zeros(MX_float, dims, ctx) + +zeros(dims::Int...) = zeros(dims) """ ones(DType, shape :: Tuple, ctx :: Context) @@ -263,11 +244,11 @@ end import Base: size, length, ndims, eltype """ - size(arr :: NDArray) - size(arr :: NDArray, dim :: Int) + size(x::NDArray) + size(x::NDArray, dim) -Get the shape of an `NDArray`. The shape is in Julia's column-major convention. See -also the notes on NDArray shapes [`NDArray`](@ref). +Get the shape of an `NDArray`. The shape is in Julia's column-major convention. +See also the notes on NDArray shapes [`NDArray`](@ref). """ function size(arr :: NDArray) ref_ndim = Ref{MX_uint}(0) @@ -281,45 +262,50 @@ function size(arr :: NDArray, dim :: Int) end """ - length(arr :: NDArray) + length(x::NDArray) Get the number of elements in an `NDArray`. """ -function length(arr :: NDArray) - prod(size(arr)) -end +length(x::NDArray) = prod(size(x)) """ - ndims(arr :: NDArray) + ndims(x::NDArray) -Get the number of dimensions of an `NDArray`. Is equivalent to `length(size(arr))`. +Get the number of dimensions of an `NDArray`. +Is equivalent to `length(size(arr))`. 
""" -function ndims(arr :: NDArray) - length(size(arr)) +ndims(x::NDArray) = ndims(x.handle) + +function ndims(x::MX_NDArrayHandle)::Int + ref_ndim = Ref{MX_uint}(0) + ref_shape = Ref{Ptr{MX_uint}}(0) + @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), + x, ref_ndim, ref_shape) + ref_ndim[] end """ - eltype(arr :: NDArray) + eltype(x::NDArray) Get the element type of an `NDArray`. """ -function eltype(arr :: T) where T <: Union{NDArray, MX_NDArrayHandle} +function eltype(x::Union{NDArray, MX_NDArrayHandle}) dtype_ref = Ref{Cint}(0) - @mxcall(:MXNDArrayGetDType, (MX_handle, Ptr{Cint}), arr, dtype_ref) + @mxcall(:MXNDArrayGetDType, (MX_handle, Ptr{Cint}), x, dtype_ref) - if dtype_ref[] == -1 # arr->is_none() - warn("Eltype of $arr is not defined") + if dtype_ref[] == -1 # x->is_none() + warn("Eltype of $x is not defined") Base.show_backtrace(STDOUT, backtrace()) println() - return Float32 + Float32 else - return fromTypeFlag(TypeFlag(dtype_ref[])) + fromTypeFlag(TypeFlag(dtype_ref[])) end end -@inline _first(arr::NDArray) = try_get_shared(arr, sync = :read) |> first +@inline _first(x::NDArray) = try_get_shared(x, sync = :read) |> first -Base.first(arr::NDArray) = _first(arr) +Base.first(x::NDArray) = _first(x) """ slice(arr :: NDArray, start:stop) @@ -469,7 +455,7 @@ import Base: copy!, copy, convert, deepcopy Copy contents of `src` into `dst`. 
""" -function copy!(dst :: NDArray, src :: NDArray) +function copy!(dst::NDArray, src::NDArray) @assert(dst.writable) if dst.handle == src.handle warn("Copying an NDArray to itself") @@ -480,33 +466,31 @@ function copy!(dst :: NDArray, src :: NDArray) return dst end -function copy!(dst :: Array{T}, src :: NDArray) where T<:DType - @assert T == eltype(src) +function copy!(dst::Array{T}, src::NDArray{T}) where T<:DType @assert size(dst) == size(src) @mxcall(:MXNDArraySyncCopyToCPU, (MX_handle, Ptr{Void}, Csize_t), src, pointer(dst), length(dst)) - return dst -end -function copy!(dst :: Array{T}, src :: NDArray) where T<:Real - copy!(dst, copy(src)) + dst end -function copy!(dst :: NDArray, src :: Array{T}) where T<:Real +copy!(dst::Array{<:Real}, src::NDArray) = copy!(dst, copy(src)) + +function copy!(dst::NDArray{T}, src::Array{<:Real}) where {T} @assert dst.writable @assert size(dst) == size(src) - src = convert(Array{eltype(dst)}, src) # this might involve copying + src = convert(Array{T}, src) # this might involve copying @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{Void}, Csize_t), dst.handle, pointer(src), length(src)) - return dst + dst end -function copy_ignore_shape!(dst :: NDArray, src :: Array{T}) where T<:Real +function copy_ignore_shape!(dst::NDArray{T}, src::Array{<:Real}) where {T} @assert dst.writable @assert length(dst) == length(src) - src = convert(Array{eltype(dst)}, src) # this might involve copying + src = convert(Array{T}, src) # this might involve copying @mxcall(:MXNDArraySyncCopyFromCPU, (MX_handle, Ptr{Void}, Csize_t), dst.handle, pointer(src), length(src)) - return dst + dst end @@ -519,31 +503,23 @@ Create a copy of an array. When no `Context` is given, create a Julia `Array`. Otherwise, create an `NDArray` on the specified context. 
""" # Create copy: NDArray -> Julia Array -function copy(arr :: NDArray) - j_arr = Array{eltype(arr)}(size(arr)) - copy!(j_arr, arr) -end +copy(x::NDArray{T,D}) where{T,D} = copy!(Array{T,D}(size(x)), x) # Create copy: NDArray -> NDArray in a given context -function copy(arr :: NDArray, ctx :: Context) - dst = NDArray(_ndarray_alloc(eltype(arr), size(arr), ctx, true)) - copy!(dst, arr) -end +copy(x::NDArray{T,D}, ctx::Context) where {T,D} = + copy!(NDArray{T,D}(_ndarray_alloc(T, size(x), ctx, true)), x) # Create copy: Julia Array -> NDArray in a given context -function copy(arr :: Array{T}, ctx :: Context) where T<:DType - dst = empty(T, size(arr), ctx) - copy!(dst, arr) -end +copy(x::Array{T}, ctx::Context) where {T<:DType} = + copy!(empty(T, size(x), ctx), x) """ - convert(::Type{Array{T}}, arr :: NDArray) + convert(::Type{Array{<:Real}}, x::NDArray) -Convert an `NDArray` into a Julia `Array` of specific type. Data will be copied. +Convert an `NDArray` into a Julia `Array` of specific type. +Data will be copied. """ -function convert(t::Type{Array{T}}, arr :: NDArray) where T<:Real - convert(t, copy(arr)) -end +convert(T::Type{Array{<:Real}}, x::NDArray) = convert(T, copy(x)) """ deepcopy(arr::NDArray) @@ -599,13 +575,13 @@ end Add a bunch of arguments into `dst`. Inplace updating. """ -function add_to!(dst::NDArray, args::NDArrayOrReal...) +function add_to!(dst::NDArray{T}, args::NDArrayOrReal...) where T @assert dst.writable for arg in args if isa(arg, Real) - _plus_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) + _plus_scalar(dst, scalar = convert(T, arg), out = dst) else - _plus(dst, arg, out=dst) + _plus(dst, arg, out = dst) end end return dst @@ -632,10 +608,10 @@ broadcast_(::typeof(+), x::Real, y::NDArray) = x + y Subtract a bunch of arguments from `dst`. Inplace updating. 
""" -function sub_from!(dst::NDArray, arg::NDArrayOrReal) +function sub_from!(dst::NDArray{T}, arg::NDArrayOrReal) where T @assert dst.writable if isa(arg, Real) - _minus_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) + _minus_scalar(dst, scalar = convert(T, arg), out = dst) else _minus!(dst, arg) end @@ -664,12 +640,12 @@ broadcast_(::typeof(-), x::Real, y::NDArray) = x - y Elementwise multiplication into `dst` of either a scalar or an `NDArray` of the same shape. Inplace updating. """ -function mul_to!(dst::NDArray, arg::NDArrayOrReal) +function mul_to!(dst::NDArray{T}, arg::NDArrayOrReal) where T @assert dst.writable if isa(arg, Real) - _mul_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) + _mul_scalar(dst, scalar = convert(T, arg), out = dst) else - _mul(dst, arg, out=dst) + _mul(dst, arg, out = dst) end end @@ -692,23 +668,19 @@ broadcast_(::typeof(*), x::Real, y::NDArray) = y .* x Matrix (2D NDArray) multiplication. """ -function *(x::NDArray, y::NDArray) - @assert ndims(x) == 2 - @assert ndims(y) == 2 - dot(x, y) -end +*(x::NDArray{T,2}, y::NDArray{S,2}) where {T,S} = dot(x, y) """ div_from!(dst::NDArray, arg::NDArrayOrReal) Elementwise divide a scalar or an `NDArray` of the same shape from `dst`. Inplace updating. """ -function div_from!(dst::NDArray, arg::NDArrayOrReal) +function div_from!(dst::NDArray{T}, arg::NDArrayOrReal) where {T} @assert dst.writable if isa(arg, Real) - _div_scalar(dst, scalar=convert(eltype(dst), arg), out=dst) + _div_scalar(dst, scalar = convert(T, arg), out = dst) else - _div(dst, arg, out=dst) + _div(dst, arg, out = dst) end end @@ -717,9 +689,9 @@ end Elementwise divide a scalar by an `NDArray`. Inplace updating. 
""" -function rdiv_from!(x::Real, y::NDArray) +function rdiv_from!(x::Real, y::NDArray{T}) where {T} @assert y.writable - _rdiv_scalar(y, scalar=convert(eltype(y), x), out=y) + _rdiv_scalar(y, scalar = convert(T, x), out = y) end import Base: / @@ -902,12 +874,11 @@ function pointer(arr :: NDArray) @mxcall(:MXNDArrayGetData, (MX_handle, Ref{Ptr{Void}}), arr, pdata) return convert(Ptr{eltype(arr)}, pdata[]) end -function _wait_to_read(arr :: NDArray) + +@inline _wait_to_read(arr :: NDArray) = @mxcall(:MXNDArrayWaitToRead, (MX_handle,), arr) -end -function _wait_to_write(arr :: NDArray) +@inline _wait_to_write(arr :: NDArray) = @mxcall(:MXNDArrayWaitToWrite, (MX_handle,), arr) -end """ try_get_shared(arr; sync=:nop) @@ -926,19 +897,19 @@ Try to create a Julia array by sharing the data with the underlying `NDArray`. On CPU, invoke `_wait_to_read` if `:read`; invoke `_wait_to_write` if `:write`. """ -function try_get_shared(arr :: NDArray; sync::Symbol=:nop) - if context(arr).device_type == CPU +function try_get_shared(x::NDArray; sync::Symbol=:nop) + if context(x).device_type == CPU # try to do data sharing if sync == :read - _wait_to_read(arr) + _wait_to_read(x) elseif sync == :write - _wait_to_write(arr) + _wait_to_write(x) end - unsafe_wrap(Array, pointer(arr), size(arr)) + unsafe_wrap(Array, pointer(x), size(x)) else # impossible to share, just copying - copy(arr) + copy(x) end end @@ -952,16 +923,16 @@ Test whether `j_arr` is sharing data with `arr`. * `j_arr::Array`: the Julia Array. * `arr::NDArray`: the `NDArray`. 
""" -is_shared(j_arr :: Array, arr :: NDArray) = false +is_shared(::Array, ::NDArray) = false -function is_shared(j_arr :: Array{T}, arr :: NDArray) where T<:DType +function is_shared(j_arr::Array{T}, arr::NDArray{T}) where {T<:DType} if length(j_arr) != length(arr) return false end if context(arr).device_type != CPU return false end - return pointer(j_arr) == pointer(arr) + pointer(j_arr) == pointer(arr) end """ @@ -980,7 +951,7 @@ corresponding components enabled. Examples: * `hdfs://my-bucket/path/my-hdfs-ndarray` * `/path-to/my-local-ndarray` """ -function load(filename::AbstractString, ::Type{NDArray}) +function load(filename::AbstractString, ::Type{<:NDArray}) out_size = Ref{MX_uint}(0) out_hdrs = Ref{Ptr{MX_handle}}(0) out_name_size = Ref{MX_uint}(0) @@ -999,25 +970,25 @@ function load(filename::AbstractString, ::Type{NDArray}) end """ - save(filename :: AbstractString, data) + save(filename::AbstractString, data) Save NDarrays to binary file. Filename could be S3 or HDFS address, if `libmxnet` is built with corresponding support (see `load`). * `filename::String`: path to the binary file to write to. -* `data`: data to save to file. Data can be a`NDArray`, a `Vector{NDArray}`, or a `Dict{Base.Symbol, NDArray}`. +* `data`: data to save to file. Data can be a`NDArray`, a `Vector` of `NDArray`, + or a `Dict{Symbol}` contains `NDArray`s. 
""" -function save(filename::String, data::NDArray) - save(filename, [data]) -end -function save(filename::String, data::Vector{NDArray}) +save(filename::String, data::NDArray) = save(filename, [data]) + +save(filename::String, data::VecOfNDArray) = @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), filename, length(data), MX_handle[data...], char_pp(0)) -end -function save(filename::String, data::Dict{Base.Symbol,NDArray}) - names = [k for k in keys(data)] - arrays = MX_handle[data[k] for k in names] - names = String[string(k) for k in names] + +function save(filename::String, data::Dict{Symbol}) + names = keys(data) + arrays = MX_handle.(collect(values(data))) + names = String.(collect(names)) @mxcall(:MXNDArraySave, (char_p, MX_uint, Ptr{MX_handle}, char_pp), filename, length(names), arrays, names) @@ -1047,7 +1018,7 @@ function _outexpr(name::Symbol, x #= the first arg of `sig` =#) end macro _remap(sig::Expr, imp::Expr) - fname = sig.args[1] + fname = (sig.head == :call) ? sig.args[1] : sig.args[1].args[1] # case of `where` opname = string(imp.args[1]) import_expr = _autoimport(fname) @@ -1065,7 +1036,7 @@ macro _remap(sig::Expr, imp::Expr) ndhlds = Expr(:vect, map(x -> :($(x).handle), ndin)...) # handler for `func!` which has side effect on first argument. 
- T, n_output, hdls_ref, retexpr = _outexpr(fname, sig.args[2].args[1]) + T, n_output, hdls_ref, retexpr = _outexpr(fname, _firstarg(sig)) func_body = quote op_handle = _get_cached_libmx_op_handle($opname) @@ -1126,7 +1097,7 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap minimum(arr::NDArray, dims) min(arr; axis = 0 .- dims, keepdims = true) # See https://github.com/dmlc/MXNet.jl/issues/55 -@_remap dot(x::NDArray, y::NDArray) dot(y, x) +@_remap dot(x::NDArray{T,N}, y::NDArray{S,N}) where {T,S,N} dot(y, x) # See https://github.com/dmlc/MXNet.jl/pull/123 @_remap transpose(arr::NDArray) transpose(_only2d(arr)) @@ -1192,7 +1163,7 @@ function _get_ndarray_function_def(name :: String) func_name = Symbol(name) func_def = quote - function $func_name(::Type{NDArray}, args::NDArray...; out=nothing, kwargs...) + function $func_name(::Type{<:NDArray}, args::NDArray...; out=nothing, kwargs...) if out != nothing output_vars = out if isa(output_vars, NDArray) diff --git a/src/util.jl b/src/util.jl index 6877200d87b8..b0f91c824566 100644 --- a/src/util.jl +++ b/src/util.jl @@ -202,3 +202,17 @@ function _sig_checker() end end + +""" +Get first position argument from function sig +""" +function _firstarg(sig::Expr) + if sig.head ∈ (:where, :(::)) + _firstarg(sig.args[1]) + elseif sig.head == :call + i = (sig.args[2] isa Expr && sig.args[2].head == :parameters) ? 
3 : 2 + _firstarg(sig.args[i]) + end +end + +_firstarg(s::Symbol) = s diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 47ce9b08957d..f6d1b1281b08 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -423,7 +423,7 @@ function test_saveload() j_array, nd_array = rand_tensors(dims) mx.save(fname, nd_array) data = mx.load(fname, mx.NDArray) - @test data isa Vector{mx.NDArray} + @test data isa Vector{<:mx.NDArray} @test length(data) == 1 @test copy(data[1]) ≈ j_array @@ -432,7 +432,7 @@ function test_saveload() nd_arrays = mx.NDArray[x[2] for x in arrays] mx.save(fname, nd_arrays) data = mx.load(fname, mx.NDArray) - @test isa(data, Vector{mx.NDArray}) + @test data isa Vector{<:mx.NDArray} @test length(data) == n_arrays for i = 1:n_arrays @test copy(data[i]) ≈ arrays[i][1] @@ -443,7 +443,7 @@ function test_saveload() dict = Dict([(n, v) for (n,v) in zip(names, nd_arrays)]) mx.save(fname, dict) data = mx.load(fname, mx.NDArray) - @test data isa Dict{Symbol, mx.NDArray} + @test data isa Dict{Symbol,<:mx.NDArray} @test length(data) == n_arrays for i = 1:n_arrays @test copy(data[names[i]]) ≈ arrays[i][1] @@ -592,6 +592,10 @@ function test_dot() y = mx.zeros(dims2) z = mx.dot(x, y) @test size(z) == (2, 8) + + x = mx.zeros(1, 2) + y = mx.zeros(1, 2, 3) + @test_throws MethodError dot(x, y) end function test_eltype() diff --git a/test/unittest/util.jl b/test/unittest/util.jl new file mode 100644 index 000000000000..d27b509bd010 --- /dev/null +++ b/test/unittest/util.jl @@ -0,0 +1,25 @@ +module TestUtil + +using Base.Test + +using MXNet + + +function test_firstarg() + info("Util::_firstarg") + @test mx._firstarg(:(f(x, y))) == :x + @test mx._firstarg(:(f(x::mx.NDArray, y))) == :x + @test mx._firstarg(:(f(x::mx.NDArray, y::mx.NDArray))) == :x + @test mx._firstarg(:(f(x::Int, y::mx.NDArray))) == :x + @test mx._firstarg(:(f(x::Int, y::mx.NDArray; other = 42))) == :x + @test mx._firstarg(:(f(x::mx.NDArray{T}, y) where {T})) == :x + @test 
mx._firstarg(:(f(x::mx.NDArray{T,N}, y) where {T,N})) == :x + @test mx._firstarg(:(f(x::mx.NDArray{T,N} where {T,N}, y))) == :x +end # function test_firstarg + + +@testset "Util Test" begin + test_firstarg() +end # @testset "Util" + +end # module TestUtil From 914fab6d3498731103c00985062e478811ded1b7 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 2 Dec 2017 13:10:14 +0800 Subject: [PATCH 570/630] ndarray: minor style changes (#349) --- src/ndarray.jl | 61 +++++++++++++++++--------------------------------- 1 file changed, 21 insertions(+), 40 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 1a2ffa280d58..f750f4fcef1b 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -128,11 +128,11 @@ Base.cconvert(T::Type{MX_handle}, obj::NDArray) = Base.unsafe_convert(T, obj) # NDArray functions exported to the users ################################################################################ """ - context(arr :: NDArray) + context(arr::NDArray) Get the context that this `NDArray` lives on. """ -function context(arr :: NDArray) +function context(arr::NDArray) ref_typeid = Ref{Cint}(0) ref_devid = Ref{Cint}(0) @mxcall(:MXNDArrayGetContext, (MX_handle, Ref{Cint}, Ref{Cint}), @@ -140,7 +140,6 @@ function context(arr :: NDArray) return Context(ref_typeid[], ref_devid[]) end - """ empty(DType, dims[, ctx::Context = cpu()]) empty(DType, dims) @@ -148,26 +147,19 @@ end Allocate memory for an uninitialized `NDArray` with a specified type. """ -empty(::Type{T}, dims::NTuple{N, Int}, ctx::Context = cpu()) where {N,T<:DType} = +empty(::Type{T}, dims::NTuple{N,Int}, ctx::Context = cpu()) where {N,T<:DType} = NDArray{T, N}(_ndarray_alloc(T, dims, ctx, false)) empty(::Type{T}, dims::Int...) where {T<:DType} = empty(T, dims) """ - empty(shape :: Tuple, ctx :: Context) - empty(shape :: Tuple) + empty(dims::Tuple[, ctx::Context = cpu()]) empty(dim1, dim2, ...) Allocate memory for an uninitialized `NDArray` with specific shape of type Float32. 
""" -function empty(shape :: NTuple{N, Int}) where N - empty(shape, cpu()) -end -function empty(shape :: NTuple{N, Int}, ctx :: Context) where N - NDArray(_ndarray_alloc(shape, ctx, false)) -end -function empty(shape :: Int...) - empty(shape) -end +empty(dims::NTuple{N,Int}, ctx::Context = cpu()) where N = + NDArray(_ndarray_alloc(dims, ctx, false)) +empty(dims::Int...) = empty(dims) """ similar(x::NDArray) @@ -184,7 +176,7 @@ Base.similar(x::NDArray{T}) where {T} = empty(T, size(x), context(x)) Create zero-ed `NDArray` with specific shape and type. """ -function zeros(::Type{T}, dims::NTuple{N, Int}, ctx::Context = cpu()) where {N,T<:DType} +function zeros(::Type{T}, dims::NTuple{N,Int}, ctx::Context = cpu()) where {N,T<:DType} arr = empty(T, dims, ctx) arr[:] = zero(T) arr @@ -200,47 +192,36 @@ Create zero-ed `NDArray` with specific shape. """ zeros(dims::NTuple{N, Int}, ctx::Context = cpu()) where N = zeros(MX_float, dims, ctx) - zeros(dims::Int...) = zeros(dims) """ - ones(DType, shape :: Tuple, ctx :: Context) - ones(DType, shape :: Tuple) - ones(DType, dim1, dim2, ...) + ones(DType, dims::Tuple[, ctx::Context = cpu()]) + ones(DType, dim1, dim2...) Create an `NDArray` with specific shape & type, and initialize with 1. """ -function ones(:: Type{T}, shape :: NTuple{N, Int}) where {N,T<:DType} - ones(T, shape, cpu()) -end -function ones(:: Type{T}, shape :: NTuple{N, Int}, ctx :: Context) where {N,T<:DType} - arr = empty(T, shape, ctx) +function ones(::Type{T}, dims::NTuple{N,Int}, ctx::Context = cpu()) where {N,T<:DType} + arr = empty(T, dims, ctx) arr[:] = one(T) - return arr -end -function ones(:: Type{T}, shape :: Int...) where T<:DType - ones(T, shape) + arr end +ones(::Type{T}, dims::Int...) where T<:DType = ones(T, dims) + """ - ones(shape :: Tuple, ctx :: Context) - ones(shape :: Tuple) + ones(dims::Tuple[, ctx::Context = cpu()]) ones(dim1, dim2, ...) Create an `NDArray` with specific shape and initialize with 1. 
""" -function ones(shape :: NTuple{N, Int}) where N - ones(shape, cpu()) -end -function ones(shape :: NTuple{N, Int}, ctx :: Context) where N - arr = empty(shape, ctx) +function ones(dims::NTuple{N,Int}, ctx::Context = cpu()) where N + arr = empty(dims, ctx) arr[:] = 1 - return arr -end -function ones(shape :: Int...) - ones(shape) + arr end +ones(dims::Int...) = ones(dims) + import Base: size, length, ndims, eltype """ From c43d0ddf26b65a4ff55bc1d2f9ce9bc4d82777d4 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 2 Dec 2017 14:26:22 +0800 Subject: [PATCH 571/630] model: fix test cases macro (#355) --- test/unittest/model.jl | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/test/unittest/model.jl b/test/unittest/model.jl index fafda7968e25..86a3a6f131ec 100644 --- a/test/unittest/model.jl +++ b/test/unittest/model.jl @@ -8,21 +8,21 @@ function test_feedforward() info("Model::FeedForward::constructor") let x = @mx.var x m = mx.FeedForward(x) - @assert m.arch === x - @assert length(m.ctx) == 1 + @test m.arch === x + @test length(m.ctx) == 1 end info("Model::FeedForward::constructor::keyword context") let x = @mx.var x m = mx.FeedForward(x, context = mx.cpu()) - @assert m.arch === x - @assert length(m.ctx) == 1 + @test m.arch === x + @test length(m.ctx) == 1 end let x = @mx.var x m = mx.FeedForward(x, context = [mx.cpu(), mx.cpu(1)]) - @assert m.arch === x - @assert length(m.ctx) == 2 + @test m.arch === x + @test length(m.ctx) == 2 end end From 09ee1f4ad067d76d57487afba4d55439602bfc9d Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 3 Dec 2017 00:56:28 +0800 Subject: [PATCH 572/630] ndarray: implement `size(x, dims...)` (#350) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit ```julia julia> x = mx.NDArray([1 2; 3 4; 5 6]) 3×2 mx.NDArray{Int64,2} @ CPU0: 1 2 3 4 5 6 julia> size(x, 1, 2, 3, 4) (3, 2, 1, 1) ``` --- NEWS.md | 16 ++++++++++++++++ src/ndarray.jl | 17 ++++++++++++----- 
test/unittest/ndarray.jl | 10 ++++++++++ 3 files changed, 38 insertions(+), 5 deletions(-) diff --git a/NEWS.md b/NEWS.md index 3e5dce1c6eee..307e8180eb71 100644 --- a/NEWS.md +++ b/NEWS.md @@ -16,6 +16,22 @@ (MXNet.mx.SymbolicNode x, MXNet.mx.SymbolicNode y, MXNet.mx.SymbolicNode z) ``` +### `NDArray` + +* `size(x, dims...)` is supported now. (#TBD) + + ```julia + julia> x = mx.NDArray([1 2; 3 4; 5 6]) + 3×2 mx.NDArray{Int64,2} @ CPU0: + 1 2 + 3 4 + 5 6 + + julia> size(x, 1, 2, 3, 4) + (3, 2, 1, 1) + + ``` + # v0.3.0 (2017.11.16) * Update `libmxnet` to diff --git a/src/ndarray.jl b/src/ndarray.jl index f750f4fcef1b..045b7c28eb1e 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -226,22 +226,29 @@ import Base: size, length, ndims, eltype """ size(x::NDArray) - size(x::NDArray, dim) + size(x::NDArray, dims...) Get the shape of an `NDArray`. The shape is in Julia's column-major convention. See also the notes on NDArray shapes [`NDArray`](@ref). """ -function size(arr :: NDArray) +function size(x::NDArray) ref_ndim = Ref{MX_uint}(0) ref_shape = Ref{Ptr{MX_uint}}(0) @mxcall(:MXNDArrayGetShape, (MX_handle, Ref{MX_uint}, Ref{Ptr{MX_uint}}), - arr, ref_ndim, ref_shape) + x, ref_ndim, ref_shape) tuple(map(Int, flipdim(unsafe_wrap(Array, ref_shape[], ref_ndim[]),1))...) end -function size(arr :: NDArray, dim :: Int) - size(arr)[dim] + +function size(x::NDArray{T,N}, dim::Int) where {T,N} + if dim > N + 1 + else + size(x)[dim] + end end +size(x::NDArray, dims::Int...) 
= map(d -> size(x, d), dims) + """ length(x::NDArray) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index f6d1b1281b08..367de8177126 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -770,6 +770,15 @@ function test_show() end end +function test_size() + info("NDArray::size") + let A = [1 2; 3 4; 5 6], x = mx.NDArray(A) + @test size(A) == size(x) + @test size(A, 1, 2, 3, 4, 5) == size(x, 1, 2, 3, 4, 5) + @inferred size(x, 1, 2, 3, 4, 5) + end +end # function test_size() + ################################################################################ # Run tests ################################################################################ @@ -802,6 +811,7 @@ end test_fill() test_transpose() test_show() + test_size() end end From 8a19651a680b671137d26f4b148c02efcf52c55c Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 3 Dec 2017 00:59:57 +0800 Subject: [PATCH 573/630] ndarray: implement endof (#351) --- src/ndarray.jl | 2 ++ test/unittest/ndarray.jl | 8 ++++++++ 2 files changed, 10 insertions(+) diff --git a/src/ndarray.jl b/src/ndarray.jl index 045b7c28eb1e..f655803beaf4 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -295,6 +295,8 @@ end Base.first(x::NDArray) = _first(x) +Base.endof(x::NDArray) = length(x) + """ slice(arr :: NDArray, start:stop) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 367de8177126..d6259b317c03 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -161,6 +161,13 @@ function test_first() end end # function test_first +function test_endof() + info("NDArray::endof") + let A = [1 2; 3 4; 5 6], x = mx.NDArray(A) + @test endof(A) == endof(x) + end +end # function test_endof + function test_plus() dims = rand_dims() t1, a1 = rand_tensors(dims) @@ -789,6 +796,7 @@ end # function test_size() test_slice() test_linear_idx() test_first() + test_endof() test_plus() test_minus() test_mul() From fd7fb79cfa27dbac515d80b829e88a13c91fc66d Mon Sep 17 00:00:00 2001 
From: Iblis Lin Date: Sun, 3 Dec 2017 01:02:50 +0800 Subject: [PATCH 574/630] ndarray: make _plus type stable (#352) --- src/ndarray.jl | 9 +++++++-- 1 file changed, 7 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index f655803beaf4..91cb7d106ea9 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -571,10 +571,10 @@ function add_to!(dst::NDArray{T}, args::NDArrayOrReal...) where T if isa(arg, Real) _plus_scalar(dst, scalar = convert(T, arg), out = dst) else - _plus(dst, arg, out = dst) + _plus!(dst, arg) end end - return dst + dst end import Base: + @@ -1100,6 +1100,9 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) # remapping to solving type unstablility ################################################################################ +@_remap _plus(x::NDArray, y::NDArray) _plus(x, y) +@_remap _plus!(x::NDArray, y::NDArray) _plus(x, y) + @_remap _minus(x::NDArray, y::NDArray) _minus(x, y) @_remap _minus!(x::NDArray, y::NDArray) _minus(x, y) @@ -1228,6 +1231,8 @@ const _op_import_bl = [ # import black list; do not import these funcs "dot", "transpose", "prod", + + "_plus", "_minus", ] From b9855c484c66f56ec52eef8636a4c34be524a4d3 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 4 Dec 2017 11:45:20 +0800 Subject: [PATCH 575/630] ndarray: type convert of _mul_scalar (#356) Ref: #353 --- src/ndarray.jl | 5 +++-- test/unittest/ndarray.jl | 7 +++++++ 2 files changed, 10 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 91cb7d106ea9..e818dca64178 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -630,13 +630,14 @@ broadcast_(::typeof(-), x::Real, y::NDArray) = x - y Elementwise multiplication into `dst` of either a scalar or an `NDArray` of the same shape. Inplace updating. 
""" -function mul_to!(dst::NDArray{T}, arg::NDArrayOrReal) where T +function mul_to!(dst::NDArray, arg::NDArrayOrReal) @assert dst.writable if isa(arg, Real) - _mul_scalar(dst, scalar = convert(T, arg), out = dst) + _mul_scalar(dst, scalar = arg, out = dst) else _mul(dst, arg, out = dst) end + dst end import Base: * diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index d6259b317c03..7ae60e43d13a 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -329,6 +329,13 @@ function test_mul() y = x .* x @test copy(y) == [1. 4.] end + + info("NDArray::mul::scalar::type convert") + let x = mx.NDArray([1, 2, 3]) + y = x .* π + @test eltype(x) == Int + @test copy(y) == [3, 6, 9] + end end function test_div() From ad57be93073b1ea11411a5bdc4a70e68db56fbbe Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 4 Dec 2017 11:48:25 +0800 Subject: [PATCH 576/630] ndarray: type convertion of _plus_scalar (#360) Ref: #353 --- src/ndarray.jl | 4 ++-- test/unittest/ndarray.jl | 9 +++++++++ 2 files changed, 11 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index e818dca64178..01f99bfccc31 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -565,11 +565,11 @@ end Add a bunch of arguments into `dst`. Inplace updating. """ -function add_to!(dst::NDArray{T}, args::NDArrayOrReal...) where T +function add_to!(dst::NDArray, args::NDArrayOrReal...) 
@assert dst.writable for arg in args if isa(arg, Real) - _plus_scalar(dst, scalar = convert(T, arg), out = dst) + _plus_scalar(dst, scalar = arg, out = dst) else _plus!(dst, arg) end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 7ae60e43d13a..7136b994df75 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -220,6 +220,15 @@ function test_plus() @test copy(x .+ 42) == [43 44; 45 46] @test copy(0 .+ x .+ y .+ 41) == [43 44; 45 46] end + + info("NDArray::plus::scalar::type convert") + let x = mx.NDArray([1, 2, 3]) + y = x .+ 0.5 + @test copy(y) == copy(x) + + y = x .+ 2.9 + @test copy(y) == [3, 4, 5] + end end function test_minus() From 642b17b1c06f81ecf485588f00006b581d53ae41 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 4 Dec 2017 11:53:34 +0800 Subject: [PATCH 577/630] ndarray: type convertion of _rdiv_scalar (#358) Ref: #353 --- src/ndarray.jl | 5 +++-- test/unittest/ndarray.jl | 7 +++++++ 2 files changed, 10 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 01f99bfccc31..013e6b5ec3ff 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -680,9 +680,10 @@ end Elementwise divide a scalar by an `NDArray`. Inplace updating. 
""" -function rdiv_from!(x::Real, y::NDArray{T}) where {T} +function rdiv_from!(x::Real, y::NDArray) @assert y.writable - _rdiv_scalar(y, scalar = convert(T, x), out = y) + _rdiv_scalar(y, scalar = x, out = y) + y end import Base: / diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 7136b994df75..1a66034c3801 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -417,6 +417,13 @@ function test_rdiv() y = 1 ./ Float32[1 2; 3 4] @test copy(x) ≈ y end + + info("NDArray:rdiv::type convert") + let x = mx.NDArray([1, 2, 3]) + y = 5.5 ./ x + @test eltype(y) == Int # this differs from julia + @test copy(y) == [5, 2, 1] + end end # function test_rdiv From ce0e237895bdc58051de8b489893c9823f43a798 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 6 Dec 2017 23:01:42 +0800 Subject: [PATCH 578/630] doc: sort out table for ndarray api (#362) --- docs/src/api.md | 15 ++++++++++++++- docs/src/api/ndarray.md | 27 +++++++++++++++++++++++++++ 2 files changed, 41 insertions(+), 1 deletion(-) diff --git a/docs/src/api.md b/docs/src/api.md index fa48c540721a..4984129863d0 100644 --- a/docs/src/api.md +++ b/docs/src/api.md @@ -1,5 +1,18 @@ # API Documentation ```@contents -Pages = ["api/context.md", "api/model.md", "api/initializers.md", "api/optimizers.md", "api/callbacks.md", "api/metric.md", "api/io.md", "api/ndarray.md", "api/symbolic-node.md", "api/nn-factory.md", "api/executor.md", "api/visualize.md"] +Pages = [ + "api/symbolic-node.md", + "api/ndarray.md", + "api/context.md", + "api/model.md", + "api/initializers.md", + "api/optimizers.md", + "api/callbacks.md", + "api/metric.md", + "api/io.md", + "api/nn-factory.md", + "api/executor.md", + "api/visualize.md", +] ``` diff --git a/docs/src/api/ndarray.md b/docs/src/api/ndarray.md index 4c6832c58969..660bd95fc070 100644 --- a/docs/src/api/ndarray.md +++ b/docs/src/api/ndarray.md @@ -1,5 +1,32 @@ # NDArray API +## Arithmetic Operations + +In the following example `y` can be a `Real` value or 
another `NDArray` + +| API | Example | | +|-----|----------|----------------------------| +| `+` | `x .+ y` | Elementwise summation | +| `-` | `x .- y` | Elementwise minus | +| `*` | `x .* y` | Elementwise multiplication | +| `/` | `x ./ y` | Elementwise division | +| `^` | `x .^ y` | Elementwise power | + + +## Trigonometric functions + +| API | Example | | +|----------------|------------|-----------------------------| +| [`sin`](@ref) | `sin.(x)` | Elementwise sine | +| [`cos`](@ref) | `cos.(x)` | Elementwise cosine | +| [`tan`](@ref) | `tan.(x)` | Elementwise tangent | +| [`asin`](@ref) | `asin.(x)` | Elementwise inverse sine | +| [`acos`](@ref) | `acos.(x)` | Elementwise inverse cosine | +| [`atan`](@ref) | `atan.(x)` | Elementwise inverse tangent | + + +## Reference + ```@autodocs Modules = [MXNet.mx] Pages = ["ndarray.jl"] From f8d4f620e2371ac1cb87a32c5d7037aa947efbb8 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 7 Dec 2017 09:32:12 +0800 Subject: [PATCH 579/630] ndarray: type convertion of _minus_scalar (#354) Ref: #353 --- src/ndarray.jl | 5 +++-- test/unittest/ndarray.jl | 5 +++++ 2 files changed, 8 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 013e6b5ec3ff..0d8845f2ad5f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -598,13 +598,14 @@ broadcast_(::typeof(+), x::Real, y::NDArray) = x + y Subtract a bunch of arguments from `dst`. Inplace updating. 
""" -function sub_from!(dst::NDArray{T}, arg::NDArrayOrReal) where T +function sub_from!(dst::NDArray, arg::NDArrayOrReal) @assert dst.writable if isa(arg, Real) - _minus_scalar(dst, scalar = convert(T, arg), out = dst) + _minus_scalar(dst, scalar = arg, out = dst) else _minus!(dst, arg) end + dst end import Base: - diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 1a66034c3801..f111f9443141 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -281,6 +281,11 @@ function test_minus() @test t6 - scalar_small ≈ copy(a6 .- scalar_small) @test t6 - scalar_large ≈ copy(a6 .- scalar_large) + info("NDArray::minus::scalar::type convert") + let x = mx.NDArray([1, 2, 3]) + @test copy(x .- π) ≈ [-2, -1, 0] + end + info("NDArray::minus::type stablility") let x = mx.zeros(dims), y = mx.ones(dims) @inferred x - y From 14f974849d133de974b694b2f2caf4be0f4408b8 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 8 Dec 2017 10:31:32 +0800 Subject: [PATCH 580/630] ndarray: do not auto-import _full, _ones and _zeros (#359) --- src/ndarray.jl | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 0d8845f2ad5f..8e60ee4e792c 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -737,7 +737,7 @@ end Create an `NDArray` filled with the value `x`, like `Base.fill`. 
""" -function fill(x, dims::NTuple{N, Integer}, ctx::Context=cpu()) where N +function fill(x, dims::NTuple{N,Integer}, ctx::Context=cpu()) where N arr = empty(typeof(x), dims, ctx) arr[:] = x arr @@ -1224,6 +1224,9 @@ function _get_ndarray_function_def(name :: String) end const _op_import_bl = [ # import black list; do not import these funcs + "_full", # we already have `mx.fill` + "_ones", # we already have `mx.ones` + "_zeros", # we already have `mx.zeros` "mean", "reshape", "sum", From daf787c992dc4fa2d09b5a06cb08e509186ea646 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 9 Dec 2017 13:46:06 +0800 Subject: [PATCH 581/630] ndarray: make trigonometric functions dot-call only (#361) - Also, renamed arc* funcs to a* to keep consistent with Base - deprecated non-dot-call --- NEWS.md | 16 +++++++++++ src/MXNet.jl | 1 + src/broadcast.jl | 9 ++++++ src/deprecated.jl | 8 ++++++ src/ndarray.jl | 59 +++++++++++++++++++++++++++++++++------- src/util.jl | 10 ++++++- test/unittest/ndarray.jl | 22 +++++++++++++++ test/unittest/util.jl | 2 ++ 8 files changed, 116 insertions(+), 11 deletions(-) create mode 100644 src/broadcast.jl diff --git a/NEWS.md b/NEWS.md index 307e8180eb71..79df75eee52c 100644 --- a/NEWS.md +++ b/NEWS.md @@ -32,6 +32,22 @@ ``` +## API Changes + +### `NDArray` + +* Please use dot-call on following trigonometric functions. + Also, the `arc*` has been renamed to keep consistent with `Base`. 
+ (#TBD) + + * `sin.(x)` + * `cos.(x)` + * `tan.(x)` + * `arcsin(x)` -> `asin.(x)` + * `arccos(x)` -> `acos.(x)` + * `arctan(x)` -> `atan.(x)` + + # v0.3.0 (2017.11.16) * Update `libmxnet` to diff --git a/src/MXNet.jl b/src/MXNet.jl index d80bbd3d3cdd..631fbf0a2de0 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -26,6 +26,7 @@ include("base.jl") include("context.jl") include("util.jl") +include("broadcast.jl") include("ndarray.jl") include("random.jl") diff --git a/src/broadcast.jl b/src/broadcast.jl new file mode 100644 index 000000000000..a5fdacd829d0 --- /dev/null +++ b/src/broadcast.jl @@ -0,0 +1,9 @@ +using TakingBroadcastSeriously: Broadcasted, unwrap + +for f in :[tan, asin, acos, atan, + sinh, cosh, tanh, asinh, acosh, atanh].args + # copy from TakingBroadcastSeriously + @eval Base.$f(a::Broadcasted...) = Broadcasted(broadcast_($f, unwrap.(a)...)) + @eval Base.$f(a::Broadcasted, b) = Broadcasted(broadcast_($f, unwrap(a), b)) + @eval Base.$f(b, a::Broadcasted) = Broadcasted(broadcast_($f, b, unwrap(a))) +end diff --git a/src/deprecated.jl b/src/deprecated.jl index b2816fad5432..dc19f5663b12 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -8,3 +8,11 @@ # srand (#282) @deprecate srand!(seed_state::Int) srand(seed_state) + +# v0.4 +@deprecate sin(x::NDArray) sin.(x) +@deprecate cos(x::NDArray) cos.(x) +@deprecate tan(x::NDArray) tan.(x) +@deprecate arcsin(x::NDArray) asin.(x) +@deprecate arccos(x::NDArray) acos.(x) +@deprecate arctan(x::NDArray) atan.(x) diff --git a/src/ndarray.jl b/src/ndarray.jl index 8e60ee4e792c..37894882bc33 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -993,7 +993,11 @@ end const _mxsig = Dict{Symbol,Expr}() -function _autoimport(name::Symbol) +function _autoimport(name::Symbol, sig::Expr) + if name == :broadcast_ + name = _broadcast_target(sig) + end + if isdefined(Base, name) :(import Base: $name) else @@ -1010,11 +1014,28 @@ function _outexpr(name::Symbol, x #= the first arg of `sig` =#) end end 
+_broadcast_target(sig::Expr) = sig.args[2].args[].args[end] + +""" +Generate docstring from function signature +""" +function _docsig(fname::Symbol, sig::Expr) + if fname !== :broadcast_ + " $sig" + else + name = _broadcast_target(sig) + sig_ = Expr(:call, Symbol(name, "."), sig.args[3:end]...) + str = " $sig_" + @eval @doc $str $name + "" + end +end + macro _remap(sig::Expr, imp::Expr) fname = (sig.head == :call) ? sig.args[1] : sig.args[1].args[1] # case of `where` opname = string(imp.args[1]) - import_expr = _autoimport(fname) + import_expr = _autoimport(fname, sig) if isa(imp.args[2], Expr) && imp.args[2].head == :parameters ndin = imp.args[3:end] @@ -1055,7 +1076,7 @@ macro _remap(sig::Expr, imp::Expr) $retexpr end - docstr = " $sig" + docstr = _docsig(fname, sig) func_def = Expr(:function, sig, func_body) esc(quote @@ -1099,6 +1120,14 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap prod(arr::NDArray) prod(arr) @_remap prod(arr::NDArray, dims) prod(arr; axis = 0 .- dims, keepdims = true) +# trigonometric functions, remap to keep consistent with Base +@_remap broadcast_(::typeof(sin), x::NDArray) sin(x) +@_remap broadcast_(::typeof(cos), x::NDArray) cos(x) +@_remap broadcast_(::typeof(tan), x::NDArray) tan(x) +@_remap broadcast_(::typeof(asin), x::NDArray) arcsin(x) +@_remap broadcast_(::typeof(acos), x::NDArray) arccos(x) +@_remap broadcast_(::typeof(atan), x::NDArray) arctan(x) + ################################################################################ # remapping to solving type unstablility ################################################################################ @@ -1227,19 +1256,29 @@ const _op_import_bl = [ # import black list; do not import these funcs "_full", # we already have `mx.fill` "_ones", # we already have `mx.ones` "_zeros", # we already have `mx.zeros` - "mean", - "reshape", - "sum", + + # arithmetic + "_plus", + "_minus", + + "dot", "max", "max_axis", + "mean", "min", "min_axis", - "dot", - 
"transpose", "prod", + "reshape", + "sum", + "transpose", - "_plus", - "_minus", + # trigonometric + "sin", + "cos", + "tan", + "arcsin", + "arccos", + "arctan", ] macro _import_ndarray_functions() diff --git a/src/util.jl b/src/util.jl index b0f91c824566..c53fb9a597fa 100644 --- a/src/util.jl +++ b/src/util.jl @@ -210,7 +210,15 @@ function _firstarg(sig::Expr) if sig.head ∈ (:where, :(::)) _firstarg(sig.args[1]) elseif sig.head == :call - i = (sig.args[2] isa Expr && sig.args[2].head == :parameters) ? 3 : 2 + i = if sig.args[2] isa Expr && sig.args[2].head == :parameters + # there are some keyward arguments locate at args[2] + 3 + elseif sig.args[1] === :broadcast_ + # case of broadcasting, skip the first arg `::typeof(...)` + 3 + else + 2 + end _firstarg(sig.args[i]) end end diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index f111f9443141..32fabd3c4bc5 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -814,6 +814,27 @@ function test_size() end end # function test_size() +function check_trigonometric(f) + info("NDArray::$f") + let A = [.1 .2; .3 .4], x = mx.NDArray(A) + B = f.(A) + y = f.(x) + @test copy(y) ≈ B + end + + let A = Float32[.1 .2; .3 .4], x = mx.NDArray(A) + B = f.(A) + y = f.(x) + @test copy(y) ≈ B + end +end # function check_trigonometric + +function test_trigonometric() + for f ∈ [sin, cos, tan, asin, acos, atan] + check_trigonometric(f) + end +end # function test_trigonometric + ################################################################################ # Run tests ################################################################################ @@ -848,6 +869,7 @@ end # function test_size() test_transpose() test_show() test_size() + test_trigonometric() end end diff --git a/test/unittest/util.jl b/test/unittest/util.jl index d27b509bd010..823decffd442 100644 --- a/test/unittest/util.jl +++ b/test/unittest/util.jl @@ -15,6 +15,8 @@ function test_firstarg() @test mx._firstarg(:(f(x::mx.NDArray{T}, y) 
where {T})) == :x @test mx._firstarg(:(f(x::mx.NDArray{T,N}, y) where {T,N})) == :x @test mx._firstarg(:(f(x::mx.NDArray{T,N} where {T,N}, y))) == :x + @test mx._firstarg(:(broadcast_(::typeof(asin), x::mx.NDArray))) == :x + @test mx._firstarg(:(broadcast_(::typeof(asin), x::mx.NDArray, y::mx.NDArray))) == :x end # function test_firstarg From 233fcfc5a89d69037290964c38066bbe0bda6a87 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 9 Dec 2017 14:26:02 +0800 Subject: [PATCH 582/630] ndarray: change internal api of plus to help autograd (#364) address https://github.com/dmlc/MXNet.jl/pull/274#issuecomment-349951876 --- src/ndarray.jl | 28 +++++++++++++--------------- 1 file changed, 13 insertions(+), 15 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 37894882bc33..c9b17924f998 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -587,8 +587,10 @@ Summation. Multiple arguments of either scalar or `NDArray` could be added together. Note at least the first or second argument needs to be an `NDArray` to avoid ambiguity of built-in summation. """ -+(x::NDArray, ys::NDArrayOrReal...) = add_to!(copy(x, context(x)), ys...) -+(x::Real, y::NDArray, zs::NDArrayOrReal...) = add_to!(copy(y, context(y)), x, zs...) 
++(x::NDArray) = x ++(x::NDArray, y::NDArray) = _plus(x, y) ++(x::NDArray, y::Real) = _plus_scalar(x, scalar = y) ++(y::Real, x::NDArray) = _plus_scalar(x, scalar = y) broadcast_(::typeof(+), x::NDArray, y::NDArrayOrReal) = x + y broadcast_(::typeof(+), x::Real, y::NDArray) = x + y @@ -1205,20 +1207,16 @@ function _get_ndarray_function_def(name :: String) args = MX_handle[] end - if length(output_vars) > 0 - output_handles = map((x) -> Base.cconvert(MX_handle, x), output_vars) - # XXX: Julia 0.4 has bug: [Array{MX_handle}] == Array{MX_handle} - output_handles_pp = Array{Array{MX_handle}}(1) - output_handles_pp[1] = Base.cconvert(Ptr{MX_handle}, output_handles) + output_handles_pp = if length(output_vars) > 0 + [map(x -> x.handle, output_vars)] else - output_handles_pp = [Base.convert(Ptr{MX_handle}, 0)] + [Ptr{MX_handle}(C_NULL)] end num_outputs_p = [convert(Cint, num_outputs)] kw_keys_str = String[string(x[1]) for x in kwargs] kw_vals_str = String[dump_mx_param(x[2]) for x in kwargs] - #op_handle = _get_cached_libmx_op_handle($(QuoteNode(name))) op_handle = _get_cached_libmx_op_handle($(name)) @mxcall(:MXImperativeInvoke, (MX_handle, Cint, Ptr{MX_handle}, @@ -1229,13 +1227,13 @@ function _get_ndarray_function_def(name :: String) length(kwargs), kw_keys_str, kw_vals_str) if out == nothing - handle_array = unsafe_wrap(Array, output_handles_pp[], num_outputs_p[]) - handle_array = [MX_NDArrayHandle(x) for x in handle_array] - arrays = [NDArray(hdr) for hdr in handle_array] - if length(arrays) == 1 - return arrays[1] + n = num_outputs_p[] + hdls = unsafe_wrap(Array{MX_handle}, output_handles_pp[], n) + xs = NDArray[NDArray(MX_NDArrayHandle(x)) for x in hdls] + if n == 1 + return xs[] else - return arrays + return xs end else return out From eb819b03055fb4ba984ff9cbb0a0c78ec98eb2a2 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 9 Dec 2017 14:28:40 +0800 Subject: [PATCH 583/630] ndarray: change internal api of mul/div to help autograd (#366) address 
https://github.com/dmlc/MXNet.jl/pull/274#issuecomment-349951876 --- src/ndarray.jl | 28 +++++++++++++--------------- 1 file changed, 13 insertions(+), 15 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index c9b17924f998..28374943a6c9 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -650,12 +650,12 @@ import Base: * Currently only multiplication a scalar with an `NDArray` is implemented. """ -*(x:: NDArray, y::Real) = x .* y -*(x::Real, y::NDArray) = y .* x +*(x::NDArray, y::Real) = _mul_scalar(x, scalar = y) +*(y::Real, x::NDArray) = _mul_scalar(x, scalar = y) -broadcast_(::typeof(*), x::NDArray, y::NDArrayOrReal) = - mul_to!(copy(x, context(x)), y) -broadcast_(::typeof(*), x::Real, y::NDArray) = y .* x +broadcast_(::typeof(*), x::NDArray, y::Real) = x * y +broadcast_(::typeof(*), y::Real, x::NDArray) = x * y +broadcast_(::typeof(*), x::NDArray, y::NDArray) = _mul(x, y) """ *(A::NDArray, B::NDArray) @@ -703,25 +703,23 @@ of the same shape. * Matrix division (solving linear systems) is not implemented yet. 
""" -/(x::NDArray, y::Real) = x ./ y +/(x::NDArray, y::Real) = _div_scalar(x, scalar = y) -broadcast_(::typeof(/), x::NDArray, y::NDArrayOrReal) = - div_from!(copy(x, context(x)), y) - -broadcast_(::typeof(/), x::Real, y::NDArray) = - rdiv_from!(x, copy(y, context(y))) +broadcast_(::typeof(/), x::NDArray, y::NDArray) = _div(x, y) +broadcast_(::typeof(/), x::NDArray, y::Real) = _div_scalar(x, scalar = y) +broadcast_(::typeof(/), y::Real, x::NDArray) = _rdiv_scalar(x, scalar = y) import Base: ^ # document of `.^` is merged into SymbolicNode's broadcast_(::typeof(^), x::NDArray, y::NDArray) = _power(x, y) -broadcast_(::typeof(^), x::NDArray, s::Real) = _power_scalar(x, scalar=s) -broadcast_(::typeof(^), s::Real, x::NDArray) = _rpower_scalar(x, scalar=s) +broadcast_(::typeof(^), x::NDArray, s::Real) = _power_scalar(x, scalar = s) +broadcast_(::typeof(^), s::Real, x::NDArray) = _rpower_scalar(x, scalar = s) broadcast_(::typeof(^), ::Irrational{:e}, x::NDArray) = exp(x) -broadcast_(::typeof(^), x::NDArray, s::Irrational) = _power_scalar(x, scalar=s) -broadcast_(::typeof(^), s::Irrational, x::NDArray) = _rpower_scalar(x, scalar=s) +broadcast_(::typeof(^), x::NDArray, s::Irrational) = _power_scalar(x, scalar = s) +broadcast_(::typeof(^), s::Irrational, x::NDArray) = _rpower_scalar(x, scalar = s) """ fill!(arr::NDArray, x) From 2ca5565b1b3a8a4cc219ab92b03029711731ccd1 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 9 Dec 2017 14:28:55 +0800 Subject: [PATCH 584/630] ndarray: change internal api of minus to help autograd (#365) address https://github.com/dmlc/MXNet.jl/pull/274#issuecomment-349951876 Although this patch cannot pass `@inferred`, but `code_warntype` give me this: ```julia end::MXNet.mx.NDArray{_,_} where _ where _ ``` And seems it doesn't hurt performance. 
--- src/ndarray.jl | 7 ++++--- test/unittest/ndarray.jl | 6 ------ 2 files changed, 4 insertions(+), 9 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 28374943a6c9..7854a6ec9a4c 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -620,9 +620,10 @@ import Base: - Subtraction `x - y`, of scalar types or `NDArray`. Or create the negative of `x`. """ --(x::NDArray) = _mul_scalar(x, scalar=-one(eltype(x))) --(x::NDArray, y::NDArrayOrReal) = sub_from!(copy(x, context(x)), y) --(x::Real, y::NDArray) = -y .+ x +-(x::NDArray) = _mul_scalar(x, scalar = -one(eltype(x))) +-(x::NDArray, y::NDArray) = _minus(x, y) +-(x::NDArray, y::Real) = _minus_scalar(x, scalar = y) +-(y::Real, x::NDArray) = _rminus_scalar(x, scalar = y) broadcast_(::typeof(-), x::NDArray, y::NDArrayOrReal) = x - y broadcast_(::typeof(-), x::Real, y::NDArray) = x - y diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 32fabd3c4bc5..9f69503f7f13 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -285,12 +285,6 @@ function test_minus() let x = mx.NDArray([1, 2, 3]) @test copy(x .- π) ≈ [-2, -1, 0] end - - info("NDArray::minus::type stablility") - let x = mx.zeros(dims), y = mx.ones(dims) - @inferred x - y - @inferred x .- y - end end function test_mul() From 12198f08e42fdcadab6ef183f5691ffe586f8641 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 11 Dec 2017 03:12:06 +0800 Subject: [PATCH 585/630] ndarray: copy(AbstractArray, context) (#367) julia> copy(1:4, mx.cpu()) 4 mx.NDArray{Int64,1} @ CPU0: 1 2 3 4 julia> copy(1.:4, mx.cpu()) 4 mx.NDArray{Float64,1} @ CPU0: 1.0 2.0 3.0 4.0 --- NEWS.md | 18 ++++++++++++++++++ src/ndarray.jl | 11 +++++------ test/unittest/ndarray.jl | 11 +++++++++++ 3 files changed, 34 insertions(+), 6 deletions(-) diff --git a/NEWS.md b/NEWS.md index 79df75eee52c..2ed915e80e56 100644 --- a/NEWS.md +++ b/NEWS.md @@ -32,6 +32,24 @@ ``` +* `copy(AbstractArray, context)` is implemented now. 
(#TBD) + + ```julia + julia> copy(1:4, mx.cpu()) + 4 mx.NDArray{Int64,1} @ CPU0: + 1 + 2 + 3 + 4 + + julia> copy(1.:4, mx.cpu()) + 4 mx.NDArray{Float64,1} @ CPU0: + 1.0 + 2.0 + 3.0 + 4.0 + ``` + ## API Changes ### `NDArray` diff --git a/src/ndarray.jl b/src/ndarray.jl index 7854a6ec9a4c..756e5de35419 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -401,9 +401,7 @@ which furthur translates into create a **copy** of the sub-array for Julia `Array`, while for `NDArray`, this is a *slice* that shares the memory. """ -function getindex(arr::NDArray, ::Colon) - return arr -end +getindex(arr::NDArray, ::Colon) = arr """ Shortcut for [`slice`](@ref). @@ -411,9 +409,7 @@ Shortcut for [`slice`](@ref). copy of the sub-array, while here we simply call `slice`, which shares the underlying memory. """ -function getindex(arr::NDArray, idx::UnitRange{Int}) - slice(arr, idx) -end +getindex(arr::NDArray, idx::UnitRange{Int}) = slice(arr, idx) getindex(arr::NDArray) = _first(arr) @@ -503,6 +499,9 @@ copy(x::NDArray{T,D}, ctx::Context) where {T,D} = copy(x::Array{T}, ctx::Context) where {T<:DType} = copy!(empty(T, size(x), ctx), x) +copy(x::AbstractArray, ctx::Context) = + copy!(empty(eltype(x), size(x), ctx), collect(x)) + """ convert(::Type{Array{<:Real}}, x::NDArray) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 9f69503f7f13..398912bc0201 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -44,6 +44,17 @@ function test_copy() array2 = copy(array, mx.cpu()) tensor2 = copy(array2) @test tensor ≈ tensor2 + + info("NDArray::copy::AbstractArray") + let x = copy(1:4, mx.cpu()) + @test eltype(x) == Int + @test copy(x) == [1, 2, 3, 4] + end + + let x = copy(1.:4, mx.cpu()) + @test eltype(x) == Float64 + @test copy(x) ≈ [1., 2, 3, 4] + end end function test_deepcopy() From 2d7cdc6a558e34ad061a57418e79b5f1551cea73 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 11 Dec 2017 03:21:30 +0800 Subject: [PATCH 586/630] Reexporting NDArray and 
SymbolicNode (#306) * Reexporting NDArray and SymbolicNode * Executor * context and empty * exporting more * context * fix test --- NEWS.md | 57 +++++++++++++++++++++++++++++++ REQUIRE | 1 + deps/build.jl | 1 - src/MXNet.jl | 85 +++++++++++++++++++++++++++++++++++++++++++--- src/context.jl | 11 ++---- src/initializer.jl | 5 +-- src/io.jl | 14 ++++---- src/metric.jl | 8 ++--- src/optimizer.jl | 6 ++-- 9 files changed, 158 insertions(+), 30 deletions(-) diff --git a/NEWS.md b/NEWS.md index 2ed915e80e56..bb08c1f9d7d2 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,5 +1,62 @@ # v0.4.0 (#TBD) +* Following material from `mx` module got exported (#TBD): + * `NDArray` + * `context()` + * `empty()` + + * `SymbolicNode` + * `Variable` + * `@var` + + * `Context` + * `cpu()` + * `gpu()` + + * `AbstractModel` + * `FeedForward` + * `predict()` + + * `MLP` + + * `Executor` + * `bind()` + * `simple_bind()` + * `forward()` + * `backward()` + + * `AbstractEvalMetric` + * `ACE` + * `Accuracy` + * `MSE` + * `MultiACE` + * `MultiMetric` + * `NMSE` + * `SeqMetric` + + * `KVStore` + + * `AbstractInitializer` + * `UniformInitializer` + * `NormalInitializer` + * `XavierInitializer` + + * `AbstractOptimizer` + * `AdaDelta` + * `AdaGrad` + * `ADAM` + * `AdaMax` + * `Nadam` + * `RMSProp` + * `SGD` + + * `AbstractDataProvider` + * `AbstractDataBatch` + * `ArrayDataProvider` + * `ArrayDataBatch` + + * `to_graphviz()` + ## New APIs ### `SymbolicNode` diff --git a/REQUIRE b/REQUIRE index 22caea9072b7..5a76dc543b25 100644 --- a/REQUIRE +++ b/REQUIRE @@ -4,3 +4,4 @@ BinDeps JSON MacroTools TakingBroadcastSeriously +Reexport diff --git a/deps/build.jl b/deps/build.jl index 8b4c254cbb39..b09e5f44242e 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -1,4 +1,3 @@ -using Compat import JSON ################################################################################ diff --git a/src/MXNet.jl b/src/MXNet.jl index 631fbf0a2de0..3583c140b64c 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -2,15 +2,13 @@ 
__precompile__() module MXNet +using Reexport + # we put everything in the namespace mx, because there are a lot of # functions with the same names as built-in utilities like "zeros", etc. export mx module mx -using Compat -import Compat.String -import Compat.view - import Base.Iterators: filter using Formatting @@ -22,6 +20,83 @@ import TakingBroadcastSeriously: broadcast_ import Base: round, ceil, floor, cos, sin, abs, sign, exp, sqrt, exp, log, norm, transpose +############################################################################### +# exports +############################################################################### + +# symbolic-node.jl +export SymbolicNode, + Variable, + @var + +# ndarray.jl +export NDArray, + context, + empty + +# executor.jl +export Executor, + bind, + simple_bind, + forward, + backward + +# context.jl +export Context, + cpu, + gpu + +# model.jl +export AbstractModel, + FeedForward, + predict + +# nn-factory.jl +export MLP + +# metric.jl +export AbstractEvalMetric, + ACE, + Accuracy, + MSE, + MultiACE, + MultiMetric, + NMSE, + SeqMetric + +# kvstore.jl +export KVStore + +# initializer.jl +export AbstractInitializer, + UniformInitializer, + NormalInitializer, + XavierInitializer + +# optimizer.jl +export AbstractOptimizer, + AdaDelta, + AdaGrad, + ADAM, + AdaMax, + Nadam, + RMSProp, + SGD + +# io.jl +export AbstractDataProvider, + AbstractDataBatch, + DataBatch, + ArrayDataProvider, + ArrayDataBatch + +# visualize.jl +export to_graphviz + +############################################################################### +# includes +############################################################################### + include("base.jl") include("context.jl") @@ -53,4 +128,6 @@ include("deprecated.jl") end # mx +@reexport using .mx + end # module MXNet diff --git a/src/context.jl b/src/context.jl index d627e7b5e7f7..2b83eebe97a7 100644 --- a/src/context.jl +++ b/src/context.jl @@ -12,9 +12,8 @@ end Context(dev_type :: 
Union{CONTEXT_TYPE, Int}, dev_id :: Int = 0) = Context(convert(CONTEXT_TYPE, dev_type), dev_id) -function Base.show(io :: IO, ctx :: Context) +Base.show(io::IO, ctx::Context) = print(io, "$(ctx.device_type)$(ctx.device_id)") -end """ cpu(dev_id) @@ -25,9 +24,7 @@ operations when no context is specified. # Arguments * `dev_id::Int = 0`: the CPU id. """ -function cpu(dev_id::Int=0) - return Context(CPU, dev_id) -end +cpu(dev_id::Int = 0) = Context(CPU, dev_id) """ gpu(dev_id) @@ -37,6 +34,4 @@ Get a GPU context with a specific id. The K GPUs on a node is typically numbered # Arguments * `dev_id :: Int = 0` the GPU device id. """ -function gpu(dev_id::Int=0) - return Context(GPU, dev_id) -end +gpu(dev_id::Int = 0) = return Context(GPU, dev_id) diff --git a/src/initializer.jl b/src/initializer.jl index f741d3e5a279..157958586642 100644 --- a/src/initializer.jl +++ b/src/initializer.jl @@ -118,7 +118,7 @@ struct NormalInitializer <: AbstractInitializer σ :: AbstractFloat end """ - NormalIninitializer(; mu=0, sigma=0.01) + NormalInitializer(; mu=0, sigma=0.01) Construct a `NormalInitializer` with mean `mu` and variance `sigma`. """ @@ -156,7 +156,8 @@ struct XavierInitializer <: AbstractInitializer magnitude :: Float64 end -XavierInitializer(; distribution = xv_uniform, regularization = xv_avg, magnitude = 3.0) = XavierInitializer(distribution, regularization, magnitude) +XavierInitializer(; distribution = xv_uniform, regularization = xv_avg, magnitude = 3.0) = + XavierInitializer(distribution, regularization, magnitude) function _init_weight(self :: XavierInitializer, name :: Base.Symbol, array :: NDArray) dims = size(array) diff --git a/src/io.jl b/src/io.jl index 597ea8a90c6e..c8dbee9b8e1a 100644 --- a/src/io.jl +++ b/src/io.jl @@ -25,7 +25,7 @@ abstract type AbstractDataProvider end Returns the mini-batch size of the provided data. All the provided data should have the same mini-batch size (i.e. the last dimension). 
""" -function get_batch_size end +get_batch_size """ provide_data(provider) -> Vector{Tuple{Base.Symbol, Tuple}} @@ -36,7 +36,7 @@ function get_batch_size end Returns a vector of (name, shape) pairs describing the names of the data it provides, and the corresponding shapes. """ -function provide_data end +provide_data """ provide_label(provider) -> Vector{Tuple{Base.Symbol, Tuple}} @@ -46,7 +46,7 @@ function provide_data end Returns a vector of (name, shape) pairs describing the names of the labels it provides, and the corresponding shapes. """ -function provide_label end +provide_label """ AbstractDataProviderState @@ -81,7 +81,7 @@ abstract type AbstractDataBatch end Returns the number of samples in this batch. This number should be greater than 0, but less than or equal to the batch size. This is used to indicate at the end of the data set, there might not be enough samples for a whole mini-batch. """ -function count_samples end +count_samples """ get_data(provider, batch) -> Vector{NDArray} @@ -94,7 +94,7 @@ Returns a vector of data in this batch, should be in the same order as declared The last dimension of each `NDArray` should always match the batch_size, even when `count_samples` returns a value less than the batch size. In this case, the data provider is free to pad the remaining contents with any value. """ -function get_data end +get_data """ get_label(provider, batch) -> Vector{NDArray} @@ -105,7 +105,7 @@ function get_data end Returns a vector of labels in this batch. Similar to [`get_data`](@ref). 
""" -function get_label end +get_label """ DataBatch @@ -547,7 +547,7 @@ function _get_iter_name(hdr :: MX_handle) return Symbol(unsafe_string(ref_name[])) end -const _iter_creator_cache = Dict{Symbol, MX_handle}() +const _iter_creator_cache = Dict{Symbol,MX_handle}() function _populate_iter_creator_cache!() empty!(_iter_creator_cache) h_creators = _get_iter_creators() diff --git a/src/metric.jl b/src/metric.jl index 3998af8efb8c..489df2ddd8b2 100644 --- a/src/metric.jl +++ b/src/metric.jl @@ -106,7 +106,7 @@ To calculate both mean-squared error [`Accuracy`](@ref) and log-loss [`ACE`](@re mx.fit(..., eval_metric = mx.MultiMetric([mx.Accuracy(), mx.ACE()])) ``` """ -mutable struct MultiMetric <: mx.AbstractEvalMetric +mutable struct MultiMetric <: AbstractEvalMetric metrics :: Vector{mx.AbstractEvalMetric} end @@ -122,7 +122,7 @@ function reset!(metric :: MultiMetric) nothing end -get(metric :: MultiMetric) = mapreduce(get, append!, metric.metrics) +get(metric::MultiMetric) = mapreduce(get, append!, metric.metrics) """ SeqMetric(metrics::Vector{AbstractEvalMetric}) @@ -136,8 +136,8 @@ and log-loss [`ACE`](@ref) for the second output: mx.fit(..., eval_metric = mx.SeqMetric([mx.Accuracy(), mx.ACE()])) ``` """ -mutable struct SeqMetric <: mx.AbstractEvalMetric - metrics :: Vector{mx.AbstractEvalMetric} +mutable struct SeqMetric <: AbstractEvalMetric + metrics :: Vector{AbstractEvalMetric} end function update!(metric::SeqMetric, labels::VecOfNDArray, preds::VecOfNDArray) diff --git a/src/optimizer.jl b/src/optimizer.jl index 89df56ba7050..8d46a9e407a1 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -62,7 +62,6 @@ function get_learning_rate end ################################################################################ # The learning rate module module LearningRate -using Compat import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate """ @@ -138,7 +137,6 @@ end 
################################################################################ # The Momentum module module Momentum -using Compat import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum """ @@ -226,9 +224,9 @@ store all the states needed for each weights. * `optimizer::AbstractOptimizer`: the underlying optimizer. """ -function get_updater(optimizer :: AbstractOptimizer) +function get_updater(optimizer::AbstractOptimizer) states = Dict{Int,Any}() - function updater(index :: Int, grad :: NDArray, weight :: NDArray) + function updater(index::Int, grad::NDArray, weight::NDArray) if !haskey(states, index) states[index] = create_state(optimizer, index, weight) end From db095288615a64b84318acd84571c938eb46af16 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 11 Dec 2017 03:23:46 +0800 Subject: [PATCH 587/630] example: fix parametric NDArray in lstm example (#370) and fix some depwarns fix #368 --- examples/char-lstm/config.jl | 43 +++++++++++++++++----------------- examples/char-lstm/lstm.jl | 4 ++-- examples/char-lstm/sampler.jl | 6 ++--- examples/char-lstm/seq-data.jl | 8 +++---- examples/char-lstm/train.jl | 8 +++---- 5 files changed, 34 insertions(+), 35 deletions(-) diff --git a/examples/char-lstm/config.jl b/examples/char-lstm/config.jl index 974989167ad1..b5961549675f 100644 --- a/examples/char-lstm/config.jl +++ b/examples/char-lstm/config.jl @@ -1,24 +1,23 @@ -const DROPOUT = 0 -const BATCH_SIZE = 32 -const SEQ_LENGTH = 32 -const DIM_HIDDEN = 256 -const DIM_EMBED = 256 -const LSTM_N_LAYER = 2 -const N_EPOCH = 21 -const BASE_LR = 0.01 -const WEIGHT_DECAY = 0.00001 -const CLIP_GRADIENT = 1 -const NAME = :ptb -const N_GPU = 4 -const USE_GPU = true -const DATA_TR_RATIO = 0.9 -const CKPOINT_PREFIX = joinpath(dirname(@__FILE__), "checkpoints/$NAME") +const DROPOUT = 0 +const BATCH_SIZE = 32 +const SEQ_LENGTH = 32 +const DIM_HIDDEN = 256 +const DIM_EMBED = 256 +const LSTM_N_LAYER = 2 +const N_EPOCH = 21 +const BASE_LR = 0.01 +const WEIGHT_DECAY = 
0.00001 +const CLIP_GRADIENT = 1 +const NAME = :ptb +const N_GPU = 1 +const USE_GPU = true +const DATA_TR_RATIO = 0.9 +const CKPOINT_PREFIX = joinpath(@__DIR__, "checkpoints/$NAME") -const BATCH_SIZE_SMP= 10 -const SAMPLE_LENGTH = 100 -const SAMPLE_START = 'a' - -const UNKNOWN_CHAR = Char(0) -const INPUT_FILE = joinpath(dirname(@__FILE__), "input.txt") -const VOCAB_FILE = joinpath(dirname(@__FILE__), "vocab.dat") +const BATCH_SIZE_SMP = 10 +const SAMPLE_LENGTH = 100 +const SAMPLE_START = 'a' +const UNKNOWN_CHAR = Char(0) +const INPUT_FILE = joinpath(@__DIR__, "input.txt") +const VOCAB_FILE = joinpath(@__DIR__, "vocab.dat") diff --git a/examples/char-lstm/lstm.jl b/examples/char-lstm/lstm.jl index d930240ba1a2..de6748df9420 100644 --- a/examples/char-lstm/lstm.jl +++ b/examples/char-lstm/lstm.jl @@ -123,12 +123,12 @@ mutable struct NLL <: mx.AbstractEvalMetric NLL() = new(0.0, 0) end -function mx.update!(metric :: NLL, labels :: Vector{mx.NDArray}, preds :: Vector{mx.NDArray}) +function mx.update!(metric::NLL, labels::Vector{<:mx.NDArray}, preds::Vector{<:mx.NDArray}) @assert length(labels) == length(preds) nll = 0.0 for (label, pred) in zip(labels, preds) @mx.nd_as_jl ro=(label, pred) begin - nll -= sum(log(max(broadcast_getindex(pred, round(Int,label+1), 1:length(label)), 1e-20))) + nll -= sum(log.(max.(broadcast_getindex(pred, round.(Int,label+1), 1:length(label)), 1e-20))) end end diff --git a/examples/char-lstm/sampler.jl b/examples/char-lstm/sampler.jl index ad34f344cbcd..df4647f4f893 100644 --- a/examples/char-lstm/sampler.jl +++ b/examples/char-lstm/sampler.jl @@ -1,6 +1,6 @@ -include(joinpath(dirname(@__FILE__), "config.jl")) -include(joinpath(dirname(@__FILE__), "lstm.jl")) -include(joinpath(dirname(@__FILE__), "seq-data.jl")) +include(joinpath(@__DIR__, "config.jl")) +include(joinpath(@__DIR__, "lstm.jl")) +include(joinpath(@__DIR__, "seq-data.jl")) using StatsBase using MXNet diff --git a/examples/char-lstm/seq-data.jl b/examples/char-lstm/seq-data.jl 
index 0aac5609dac5..1456ae94a1a3 100644 --- a/examples/char-lstm/seq-data.jl +++ b/examples/char-lstm/seq-data.jl @@ -60,7 +60,7 @@ end #--/provide #--eachbatch-part1 -function mx.eachbatch(p :: CharSeqProvider) +function mx.eachbatch(p::CharSeqProvider) data_all = [mx.zeros(shape) for (name, shape) in mx.provide_data(p)] label_all = [mx.zeros(shape) for (name, shape) in mx.provide_label(p)] @@ -73,7 +73,7 @@ function mx.eachbatch(p :: CharSeqProvider) #--eachbatch-part2 #... - function _text_iter() + function _text_iter(c::Channel) text = p.text n_batch = floor(Int, length(text) / p.batch_size / p.seq_len) @@ -100,11 +100,11 @@ function mx.eachbatch(p :: CharSeqProvider) copy!(label_all[i], label_jl[i]) end - produce(batch) + put!(c, batch) end end - return Task(_text_iter) + return Channel(_text_iter) end #--/eachbatch-part2 diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index 30578603cafc..000534f64d7b 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -1,6 +1,6 @@ -include(joinpath(dirname(@__FILE__), "config.jl")) -include(joinpath(dirname(@__FILE__), "lstm.jl")) -include(joinpath(dirname(@__FILE__), "seq-data.jl")) +include(joinpath(@__DIR__, "config.jl")) +include(joinpath(@__DIR__, "lstm.jl")) +include(joinpath(@__DIR__, "seq-data.jl")) # build vocabulary vocab = build_vocabulary(INPUT_FILE, VOCAB_FILE) @@ -29,7 +29,7 @@ data_val = CharSeqProvider(text_val, BATCH_SIZE, SEQ_LENGTH, vocab, NAME, if USE_GPU context = [mx.gpu(i) for i = 0:N_GPU-1] else - context = [mx.cpu()] + context = mx.cpu() end #--train From 27c66ecb61314d1b77810f6929a6f0a0d85061b4 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 12 Dec 2017 10:33:06 +0800 Subject: [PATCH 588/630] sym: overload `bind` (#372) fix this on REPL: WARNING: both mx and Base export "bind"; uses of it in module MXNet must be qualified --- src/executor.jl | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/executor.jl b/src/executor.jl index 
cd4a9256eeca..c99517b6d76b 100644 --- a/src/executor.jl +++ b/src/executor.jl @@ -1,3 +1,5 @@ +import Base: bind + """ Executor From bfb1cc4fe5de6f42b3dc215680118e66e5d04803 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 15 Dec 2017 11:50:37 +0800 Subject: [PATCH 589/630] ndarray: remap hyperbolic function (#374) --- NEWS.md | 10 ++++++++++ src/deprecated.jl | 7 +++++++ src/ndarray.jl | 16 ++++++++++++++++ test/unittest/ndarray.jl | 27 +++++++++++++++++++++++++++ 4 files changed, 60 insertions(+) diff --git a/NEWS.md b/NEWS.md index bb08c1f9d7d2..703cb216a001 100644 --- a/NEWS.md +++ b/NEWS.md @@ -122,6 +122,16 @@ * `arccos(x)` -> `acos.(x)` * `arctan(x)` -> `atan.(x)` +* Please use dot-call on following hyperbolic functions. + Also, the `arc*` has been renamed to keep consistent with `Base`. + (#TBD) + + * `sinh.(x)` + * `cosh.(x)` + * `tanh.(x)` + * `arcsinh(x)` -> `asinh.(x)` + * `arccosh(x)` -> `acosh.(x)` + * `arctanh(x)` -> `atanh.(x)` # v0.3.0 (2017.11.16) diff --git a/src/deprecated.jl b/src/deprecated.jl index dc19f5663b12..8a8df0a56789 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -16,3 +16,10 @@ @deprecate arcsin(x::NDArray) asin.(x) @deprecate arccos(x::NDArray) acos.(x) @deprecate arctan(x::NDArray) atan.(x) + +@deprecate sinh(x::NDArray) sinh.(x) +@deprecate cosh(x::NDArray) cosh.(x) +@deprecate tanh(x::NDArray) tanh.(x) +@deprecate arcsinh(x::NDArray) asinh.(x) +@deprecate arccosh(x::NDArray) acosh.(x) +@deprecate arctanh(x::NDArray) atanh.(x) diff --git a/src/ndarray.jl b/src/ndarray.jl index 756e5de35419..900285ae5782 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1128,6 +1128,14 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap broadcast_(::typeof(acos), x::NDArray) arccos(x) @_remap broadcast_(::typeof(atan), x::NDArray) arctan(x) +# hyperbolic funcs, remap to keep consistent with Base +@_remap broadcast_(::typeof(sinh), x::NDArray) sinh(x) +@_remap broadcast_(::typeof(cosh), x::NDArray) cosh(x) 
+@_remap broadcast_(::typeof(tanh), x::NDArray) tanh(x) +@_remap broadcast_(::typeof(asinh), x::NDArray) arcsinh(x) +@_remap broadcast_(::typeof(acosh), x::NDArray) arccosh(x) +@_remap broadcast_(::typeof(atanh), x::NDArray) arctanh(x) + ################################################################################ # remapping to solving type unstablility ################################################################################ @@ -1275,6 +1283,14 @@ const _op_import_bl = [ # import black list; do not import these funcs "arcsin", "arccos", "arctan", + + # hyperbolic + "sinh", + "cosh", + "tanh", + "arcsinh", + "arccosh", + "arctanh", ] macro _import_ndarray_functions() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 398912bc0201..0608d4fa6c41 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -840,6 +840,32 @@ function test_trigonometric() end end # function test_trigonometric +function check_hyperbolic(f, A) + info("NDArray::$f") + let x = NDArray(A) + B = f.(A) + y = f.(x) + @test copy(y) ≈ B + end + + let A = Float32.(A), x = NDArray(A) + B = f.(A) + y = f.(x) + @test copy(y) ≈ B + end +end # function check_hyperbolic + +function test_hyperbolic() + for f ∈ [sinh, cosh, tanh, asinh, acosh, atanh] + A = if f == acosh + [1.1, 1.2, 1.3, 1.4] + else + [.1, .2, .3, .4] + end + check_hyperbolic(f, A) + end +end # function test_hyperbolic + ################################################################################ # Run tests ################################################################################ @@ -875,6 +901,7 @@ end # function test_trigonometric test_show() test_size() test_trigonometric() + test_hyperbolic() end end From 66096167c66ca788c31effbb687f456834b67dba Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 15 Dec 2017 13:28:38 +0800 Subject: [PATCH 590/630] ndarray: support transpose on 1D array (#375) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 
Python doesn't have this functionality, so I implement it via `reshape`. ```julia julia> x = NDArray(Float32[1, 2, 3, 4]) 4 mx.NDArray{Float32,1} @ CPU0: 1.0 2.0 3.0 4.0 julia> x' 1×4 mx.NDArray{Float32,2} @ CPU0: 1.0 2.0 3.0 4.0 ``` --- NEWS.md | 15 +++++++++++++++ src/ndarray.jl | 3 ++- src/util.jl | 5 ----- test/unittest/ndarray.jl | 8 +++++++- 4 files changed, 24 insertions(+), 7 deletions(-) diff --git a/NEWS.md b/NEWS.md index 703cb216a001..30b204aef24d 100644 --- a/NEWS.md +++ b/NEWS.md @@ -107,6 +107,21 @@ 4.0 ``` +* Transposing a column `NDArray` to a row `NDArray` is supported now. (#TBD) + + ```julia + julia> x = NDArray(Float32[1, 2, 3, 4]) + 4 mx.NDArray{Float32,1} @ CPU0: + 1.0 + 2.0 + 3.0 + 4.0 + + julia> x' + 1×4 mx.NDArray{Float32,2} @ CPU0: + 1.0 2.0 3.0 4.0 + ``` + ## API Changes ### `NDArray` diff --git a/src/ndarray.jl b/src/ndarray.jl index 900285ae5782..b86158e88842 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1114,7 +1114,8 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap dot(x::NDArray{T,N}, y::NDArray{S,N}) where {T,S,N} dot(y, x) # See https://github.com/dmlc/MXNet.jl/pull/123 -@_remap transpose(arr::NDArray) transpose(_only2d(arr)) +@_remap transpose(arr::NDArray{T,1}) where T reshape(arr; shape = (1, length(arr)), reverse = true) +@_remap transpose(arr::NDArray{T,2}) where T transpose(arr) @_remap permutedims(arr::NDArray, axes) transpose(arr; axes = length(axes) .- tuple(axes...)) @_remap prod(arr::NDArray) prod(arr) diff --git a/src/util.jl b/src/util.jl index c53fb9a597fa..c729bc7cd9ae 100644 --- a/src/util.jl +++ b/src/util.jl @@ -163,11 +163,6 @@ function _format_signature(narg::Int, arg_names::Ref{char_pp}) return join([unsafe_string(name) for name in arg_names] , ", ") end -@inline function _only2d(x) - @assert ndims(x) == 2 - x -end - """ libmxnet operators signature checker. 
diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 0608d4fa6c41..a397d7899d54 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -775,7 +775,13 @@ function test_fill() end # function test_fill function test_transpose() - info("NDArray::transpose") + info("NDArray::transpose::1D") + let A = rand(Float32, 4), x = NDArray(A) + @test size(x) == (4,) + @test size(x') == (1, 4) + end + + info("NDArray::transpose::2D") let A = rand(Float32, 2, 3), x = mx.NDArray(A) @test size(x) == (2, 3) @test size(x') == (3, 2) From 881759f1bea5451d5eab9e86b88cba6f1ef42cdf Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 15 Dec 2017 13:40:01 +0800 Subject: [PATCH 591/630] example: fix MSE init (#376) --- examples/regression-example.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/regression-example.jl b/examples/regression-example.jl index e820d54001ec..38541c2b7d0c 100644 --- a/examples/regression-example.jl +++ b/examples/regression-example.jl @@ -63,7 +63,7 @@ optimizer = mx.ADAM() trainprovider, evalprovider = data_source(#= batchsize =# 200) mx.fit(model, optimizer, trainprovider, initializer = mx.NormalInitializer(0.0, 0.1), - eval_metric = mx.MSE{mx.NDArray{Float32,1}}(), + eval_metric = mx.MSE(), eval_data = evalprovider, n_epoch = 20, callbacks = [mx.speedometer()]) @@ -71,7 +71,7 @@ mx.fit(model, optimizer, trainprovider, trainprovider, evalprovider = data_source(#= batchsize =# samplesize) mx.fit(model, optimizer, trainprovider, initializer = mx.NormalInitializer(0.0, 0.1), - eval_metric = mx.MSE{mx.NDArray{Float32,1}}(), + eval_metric = mx.MSE(), eval_data = evalprovider, n_epoch = 500, # previous setting is batchsize = 200, epoch = 20 # implies we did (5000 / 200) * 20 times update in previous `fit` From 5908d97477d4b76c3a894e81981f98a6c9efbe57 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 15 Dec 2017 13:46:55 +0800 Subject: [PATCH 592/630] base: cleanup stale code in _defstruct_impl (#377) 
--- src/base.jl | 10 +--------- 1 file changed, 1 insertion(+), 9 deletions(-) diff --git a/src/base.jl b/src/base.jl index e75dc3b6ac65..0334260f886a 100644 --- a/src/base.jl +++ b/src/base.jl @@ -218,21 +218,13 @@ function _defstruct_impl(is_immutable, name, fields) if isa(name, Symbol) name = esc(name) super_name = :Any - elseif VERSION >= v"0.5-" + else @assert(isa(name, Expr) && name.head == :(<:) && length(name.args) == 2 && isa(name.args[1], Symbol) && isa(name.args[2], Symbol), "name must be of form 'Name <: SuperType'") super_name = esc(name.args[2]) name = esc(name.args[1]) - else - @assert(isa(name, Expr) && name.head == :comparison && - length(name.args) == 3 && name.args[2] == :(<:) && - isa(name.args[1], Symbol) && isa(name.args[3], Symbol), - "name must be of form 'Name <: SuperType'") - - super_name = esc(name.args[3]) - name = esc(name.args[1]) end field_defs = Vector{Expr}(length(fields)) # :(field2 :: Int) From a941f3aec70828682f44ae21f41543a971677fc3 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 15 Dec 2017 13:47:12 +0800 Subject: [PATCH 593/630] ndarray: add modulo operator (#373) * ndarray: add modulo operator * add news --- NEWS.md | 11 +++++++++++ src/broadcast.jl | 3 ++- src/ndarray.jl | 27 +++++++++++++++++++++++---- test/unittest/ndarray.jl | 32 ++++++++++++++++++++++++++++++++ 4 files changed, 68 insertions(+), 5 deletions(-) diff --git a/NEWS.md b/NEWS.md index 30b204aef24d..a7942b0ed469 100644 --- a/NEWS.md +++ b/NEWS.md @@ -107,6 +107,17 @@ 4.0 ``` +* modulo operator. (#TBD) + + ```julia + x = NDArray(...) + y = NDArray(...) + + x .% y + x .% 2 + 2 .% x + ``` + * Transposing a column `NDArray` to a row `NDArray` is supported now. 
(#TBD) ```julia diff --git a/src/broadcast.jl b/src/broadcast.jl index a5fdacd829d0..cdde7f46b2c9 100644 --- a/src/broadcast.jl +++ b/src/broadcast.jl @@ -1,6 +1,7 @@ using TakingBroadcastSeriously: Broadcasted, unwrap -for f in :[tan, asin, acos, atan, +for f in :[%, + tan, asin, acos, atan, sinh, cosh, tanh, asinh, acosh, atanh].args # copy from TakingBroadcastSeriously @eval Base.$f(a::Broadcasted...) = Broadcasted(broadcast_($f, unwrap.(a)...)) diff --git a/src/ndarray.jl b/src/ndarray.jl index b86158e88842..d62a72c39684 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -709,17 +709,32 @@ broadcast_(::typeof(/), x::NDArray, y::NDArray) = _div(x, y) broadcast_(::typeof(/), x::NDArray, y::Real) = _div_scalar(x, scalar = y) broadcast_(::typeof(/), y::Real, x::NDArray) = _rdiv_scalar(x, scalar = y) +import Base: % + +""" + .%(x::NDArray, y::NDArray) + .%(x::NDArray, y::Real) + .%(x::Real, y::NDArray) + +Elementwise modulo for `NDArray`. +""" +%(x::NDArray, y::Real) = _mod_scalar(x, scalar = y) + +broadcast_(::typeof(%), x::NDArray, y::NDArray) = _mod(x, y) +broadcast_(::typeof(%), x::NDArray, y::Real) = _mod_scalar(x, scalar = y) +broadcast_(::typeof(%), y::Real, x::NDArray) = _rmod_scalar(x, scalar = y) + import Base: ^ # document of `.^` is merged into SymbolicNode's broadcast_(::typeof(^), x::NDArray, y::NDArray) = _power(x, y) -broadcast_(::typeof(^), x::NDArray, s::Real) = _power_scalar(x, scalar = s) -broadcast_(::typeof(^), s::Real, x::NDArray) = _rpower_scalar(x, scalar = s) +broadcast_(::typeof(^), x::NDArray, s::Real) = _power_scalar(x, scalar = s) +broadcast_(::typeof(^), s::Real, x::NDArray) = _rpower_scalar(x, scalar = s) broadcast_(::typeof(^), ::Irrational{:e}, x::NDArray) = exp(x) -broadcast_(::typeof(^), x::NDArray, s::Irrational) = _power_scalar(x, scalar = s) -broadcast_(::typeof(^), s::Irrational, x::NDArray) = _rpower_scalar(x, scalar = s) +broadcast_(::typeof(^), x::NDArray, s::Irrational) = _power_scalar(x, scalar = s) 
+broadcast_(::typeof(^), s::Irrational, x::NDArray) = _rpower_scalar(x, scalar = s) """ fill!(arr::NDArray, x) @@ -1147,6 +1162,9 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap _minus(x::NDArray, y::NDArray) _minus(x, y) @_remap _minus!(x::NDArray, y::NDArray) _minus(x, y) +@_remap _mod(x::NDArray, y::NDArray) _mod(x, y) +@_remap _mod!(x::NDArray, y::NDArray) _mod(x, y) + ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -1265,6 +1283,7 @@ const _op_import_bl = [ # import black list; do not import these funcs # arithmetic "_plus", "_minus", + "_mod", "dot", "max", diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index a397d7899d54..7c74536a8a18 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -437,6 +437,37 @@ function test_rdiv() end # function test_rdiv +function test_mod() + info("NDArray::mod") + const A = [1 2; 3 4] + const B = [1 1; 3 3] + + let x = NDArray(A), y = NDArray(B) + C = A .% B + D = B .% A + + w = x .% y + z = y .% x + + @test copy(w) ≈ C + @test copy(z) ≈ D + end + + let x = NDArray(A) + C = A .% 2 + y = x .% 2 + @test copy(y) ≈ C + end + + info("NDArray::rmod") + let x = NDArray(A) + C = 11 .% A + y = 11 .% x + @test copy(y) ≈ C + end +end # function test_mod + + function test_gd() dims = rand_dims() tw, aw = rand_tensors(dims) @@ -888,6 +919,7 @@ end # function test_hyperbolic test_mul() test_div() test_rdiv() + test_mod() test_gd() test_saveload() test_clip() From 8135a635b06bf36df1511fa238bc15bfa7cc6e75 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 15 Dec 2017 13:48:03 +0800 Subject: [PATCH 594/630] ndarray: type convertion of _div_scalar (#357) Ref: #353 - and handle the case of integer NDArray divided by zero --- src/ndarray.jl | 12 ++++++++++-- test/unittest/ndarray.jl | 13 +++++++++++++ 2 files 
changed, 23 insertions(+), 2 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index d62a72c39684..33b94c05e559 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -669,13 +669,21 @@ Matrix (2D NDArray) multiplication. Elementwise divide a scalar or an `NDArray` of the same shape from `dst`. Inplace updating. """ -function div_from!(dst::NDArray{T}, arg::NDArrayOrReal) where {T} +function div_from!(dst::NDArray, arg::NDArrayOrReal) @assert dst.writable if isa(arg, Real) - _div_scalar(dst, scalar = convert(T, arg), out = dst) + _div_scalar(dst, scalar = arg, out = dst) else _div(dst, arg, out = dst) end + dst +end + +function div_from!(dst::NDArray{T}, arg::Real) where {T<:Integer} + @assert dst.writable + @assert(round(T, arg) != zero(T), "Integer divided by zero") + _div_scalar(dst, scalar = arg, out = dst) + dst end """ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 7c74536a8a18..8bd87c65ec9e 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -396,6 +396,19 @@ function test_div() t6, a6 = rand_tensors(Float16, dims) scalar_large = 1e4 @test t6 ./ scalar_large ≈ copy(a6 ./ scalar_large) + + info("NDArray::div::scalar::type convert") + let x = mx.NDArray([1, 2, 3]) + y = x ./ 1.1 + @test eltype(y) == Int + @test copy(y) == [1, 2, 3] + + y = x ./ 2 + @test eltype(y) == Int # this differs from julia + @test copy(y) == [0, 1, 1] + + @test_throws AssertionError x ./ 0.5 + end end From 1e20f50b9ce859e19a657c8820244d159ca7cca6 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 15 Dec 2017 16:14:26 +0800 Subject: [PATCH 595/630] ndarray: protect from dividing by zero for non-inplace op (#378) --- src/ndarray.jl | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/ndarray.jl b/src/ndarray.jl index 33b94c05e559..42c69266e210 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -717,6 +717,11 @@ broadcast_(::typeof(/), x::NDArray, y::NDArray) = _div(x, y) broadcast_(::typeof(/), x::NDArray, y::Real) = _div_scalar(x, 
scalar = y) broadcast_(::typeof(/), y::Real, x::NDArray) = _rdiv_scalar(x, scalar = y) +function broadcast_(::typeof(/), x::NDArray{T}, y::Real) where {T<:Integer} + @assert(round(T, y) != zero(T), "Integer divided by zero") + _div_scalar(x, scalar = y) +end + import Base: % """ From d92122546f02703e99364e09c4448b990b42b0b3 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 16 Dec 2017 23:39:39 +0800 Subject: [PATCH 596/630] doc/ndarray: add ref table for hyperbolic function (#382) --- docs/src/api/ndarray.md | 14 +++++++++++++- 1 file changed, 13 insertions(+), 1 deletion(-) diff --git a/docs/src/api/ndarray.md b/docs/src/api/ndarray.md index 660bd95fc070..9582ff24a7ef 100644 --- a/docs/src/api/ndarray.md +++ b/docs/src/api/ndarray.md @@ -13,7 +13,7 @@ In the following example `y` can be a `Real` value or another `NDArray` | `^` | `x .^ y` | Elementwise power | -## Trigonometric functions +## Trigonometric Functions | API | Example | | |----------------|------------|-----------------------------| @@ -25,6 +25,18 @@ In the following example `y` can be a `Real` value or another `NDArray` | [`atan`](@ref) | `atan.(x)` | Elementwise inverse tangent | +## Hyperbolic Functions + +| API | Example | | +|-----------------|-------------|----------------------------------------| +| [`sinh`](@ref) | `sinh.(x)` | Elementwise hyperbolic sine | +| [`cosh`](@ref) | `cosh.(x)` | Elementwise hyperbolic cosine | +| [`tanh`](@ref) | `tanh.(x)` | Elementwise hyperbolic tangent | +| [`asinh`](@ref) | `asinh.(x)` | Elementwise inverse hyperbolic sine | +| [`acosh`](@ref) | `acosh.(x)` | Elementwise inverse hyperbolic cosine | +| [`atanh`](@ref) | `atanh.(x)` | Elementwise inverse hyperbolic tangent | + + ## Reference ```@autodocs From 450759868007dc2bed1024a19e5bfa17f1d305d3 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 17 Dec 2017 06:01:01 +0800 Subject: [PATCH 597/630] ndarray: `cat`, `hcat`, `vcat` (#380) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 
Content-Transfer-Encoding: 8bit e.g. `hcat` ```julia julia> x 4 mx.NDArray{Float64,1} @ CPU0: 1.0 2.0 3.0 4.0 julia> y 4 mx.NDArray{Float64,1} @ CPU0: 2.0 4.0 6.0 8.0 julia> [x y] 4×2 mx.NDArray{Float64,2} @ CPU0: 1.0 2.0 2.0 4.0 3.0 6.0 4.0 8.0 ``` --- NEWS.md | 28 +++++++++++++++++- src/ndarray.jl | 26 +++++++++++++++++ test/unittest/ndarray.jl | 62 ++++++++++++++++++++++++++++++++++++++++ 3 files changed, 115 insertions(+), 1 deletion(-) diff --git a/NEWS.md b/NEWS.md index a7942b0ed469..70d8626f7259 100644 --- a/NEWS.md +++ b/NEWS.md @@ -117,7 +117,33 @@ x .% 2 2 .% x ``` - + +* `cat`, `vcat`, `hcat` is implemented. (#TBD) + + E.g. `hcat` + ```julia + julia> x + 4 mx.NDArray{Float64,1} @ CPU0: + 1.0 + 2.0 + 3.0 + 4.0 + + julia> y + 4 mx.NDArray{Float64,1} @ CPU0: + 2.0 + 4.0 + 6.0 + 8.0 + + julia> [x y] + 4×2 mx.NDArray{Float64,2} @ CPU0: + 1.0 2.0 + 2.0 4.0 + 3.0 6.0 + 4.0 8.0 + ``` + * Transposing a column `NDArray` to a row `NDArray` is supported now. (#TBD) ```julia diff --git a/src/ndarray.jl b/src/ndarray.jl index 42c69266e210..139e40ef1e59 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -522,6 +522,32 @@ function deepcopy(arr::NDArray) NDArray(MX_NDArrayHandle(out_ref[])) end +""" + hcat(x::NDArray...) +""" +Base.hcat(xs::NDArray{T}...) where T = cat(2, xs...) + +""" + vcat(x::NDArray...) +""" +Base.vcat(xs::NDArray{T}...) where T = cat(1, xs...) + +""" + cat(dim, xs::NDArray...) + +Concate the `NDArray`s which have the same element type along the `dim`. +Building a diagonal matrix is not supported yet. +""" +function Base.cat(dim::Int, xs::NDArray{T}...) where T + ns = ndims.(xs) + d = Base.max(dim, maximum(ns)) + xs′ = map(zip(ns, xs)) do i + n, x = i + (d > n) ? reshape(x, -2, Base.ones(Int, d - n)...) 
: x + end + concat(xs′..., dim = d - dim) +end + """ @inplace diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 8bd87c65ec9e..a24126cf194b 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -179,6 +179,67 @@ function test_endof() end end # function test_endof +function test_cat() + function check_cat(f, A, B = 2A) + C = [A B] + D = [A; B] + x = NDArray(A) + y = NDArray(B) + z = NDArray(C) + d = NDArray(D) + + if f == :hcat + @test copy([x y]) == [A B] + @test copy([x y 3y x]) == [A B 3B A] + @test copy([z y x]) == [C B A] + elseif f == :vcat + @test copy([x; y]) == [A; B] + @test copy([x; y; 3y; x]) == [A; B; 3B; A] + @test copy([x; d]) == [A; D] + @test copy([d; x]) == [D; A] + else + @assert false + end + end + + let A = [1, 2, 3, 4] + info("NDArray::hcat::1D") + check_cat(:hcat, A) + + info("NDArray::vcat::1D") + check_cat(:vcat, A) + end + + let A = [1 2; 3 4] + info("NDArray::hcat::2D") + check_cat(:hcat, A) + + info("NDArray::vcat::2D") + check_cat(:vcat, A) + end + + let A = rand(4, 3, 2) + info("NDArray::hcat::3D") + check_cat(:hcat, A) + + info("NDArray::vcat::3D") + check_cat(:vcat, A) + end + + let A = rand(4, 3, 2, 2) + info("NDArray::hcat::4D") + check_cat(:hcat, A) + + info("NDArray::vcat::4D") + check_cat(:vcat, A) + end + + let A = [1, 2, 3, 4] + info("NDArray::cat::3D/1D") + check_cat(:vcat, reshape(A, 4, 1, 1), 2A) + end +end # function test_cat + function test_plus() dims = rand_dims() t1, a1 = rand_tensors(dims) @@ -927,6 +988,7 @@ end # function test_hyperbolic test_linear_idx() test_first() test_endof() + test_cat() test_plus() test_minus() test_mul() From 39ecb32463497d0750cdbf73ae534cc64a32181e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 17 Dec 2017 06:02:02 +0800 Subject: [PATCH 598/630] base: improve MXError display (#379) --- src/base.jl | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/base.jl b/src/base.jl index 0334260f886a..8f14d44c6b3d 100644 --- a/src/base.jl +++ b/src/base.jl 
@@ -3,6 +3,8 @@ struct MXError <: Exception msg :: AbstractString end +Base.show(io::IO, e::MXError) = print(io, e.msg) + ################################################################################ # Common types used in MXNet API ################################################################################ From cb443b79778b42bbc4b88ff2a87e4bbf377cda07 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 18 Dec 2017 20:16:25 +0800 Subject: [PATCH 599/630] ndarray: porting Python's autograd (#274) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Ref: https://github.com/apache/incubator-mxnet/blob/065adb3702c110af7b537799be3ec9c16c27a72b/python/mxnet/autograd.py * API ported * attach_grad * grad * mark_variables * get_symbol * record * pause * train_mode * predict_mode * backward * An example ```julia x = NDArray([1 2; 3 4]) mx.attach_grad!(x) y = mx.record() do mx.square(x) end mx.backward!(y) mx.getgrad(x) # 2×2 Array{Int64,2}: # 2 4 # 6 8 ``` --- NEWS.md | 2 + src/MXNet.jl | 1 + src/autograd.jl | 387 ++++++++++++++++++++++++++++++++++++++ src/base.jl | 2 +- src/ndarray.jl | 4 +- test/unittest/autograd.jl | 386 +++++++++++++++++++++++++++++++++++++ test/unittest/ndarray.jl | 2 +- 7 files changed, 780 insertions(+), 4 deletions(-) create mode 100644 src/autograd.jl create mode 100644 test/unittest/autograd.jl diff --git a/NEWS.md b/NEWS.md index 70d8626f7259..4540cba50fef 100644 --- a/NEWS.md +++ b/NEWS.md @@ -75,6 +75,8 @@ ### `NDArray` +* A port of Python's `autograd` for `NDArray` (#274) + * `size(x, dims...)` is supported now. 
(#TBD) ```julia diff --git a/src/MXNet.jl b/src/MXNet.jl index 3583c140b64c..352d20aad150 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -105,6 +105,7 @@ include("broadcast.jl") include("ndarray.jl") include("random.jl") +include("autograd.jl") include("name.jl") include("symbolic-node.jl") diff --git a/src/autograd.jl b/src/autograd.jl new file mode 100644 index 000000000000..4584decb0a52 --- /dev/null +++ b/src/autograd.jl @@ -0,0 +1,387 @@ +# Autograd for NDArray +# this is a port of Python's autograd module +# https://github.com/apache/incubator-mxnet/blob/master/python/mxnet/autograd.py + +############################################################################### +# Private util functions +############################################################################### + +""" + _set_recording(state::Bool)::Bool + +Set status to recording/not recording. When recording, graph will be constructed +for gradient computation. + +## Parameters + +* `state::Bool` + +## Returns + +Previous state before this set +""" +function _set_recording(state::Bool)::Bool + prev = Ref{Cint}(C_NULL) + @mxcall(:MXAutogradSetIsRecording, (Cint, Ref{Cint}), state, prev) + prev[] +end + +_set_recording(::Void) = nothing + +""" +Set status to training/predicting. +For example, Dropout will drop inputs randomly when +`train_mode = true` while simply passing through if `train_mode = false`. + +## Parameters +* `train_mode::Bool` + +## Returns + +Previous state before this set. +""" +function _set_training(train_mode::Bool)::Bool + prev = Ref{Cint}(C_NULL) + @mxcall(:MXAutogradSetIsTraining, (Cint, Ref{Cint}), train_mode, prev) + prev[] +end + +_set_training(::Void) = nothing + +############################################################################### +# Public API +############################################################################### + +""" + is_recording()::Bool + +Get status on recording/not recording. 
+""" +function is_recording()::Bool + state = Ref{Cint}(C_NULL) + @mxcall(:MXAutogradIsRecording, (Ref{Cint},), state) + state[] +end + +""" + is_training()::Bool + +Get status on training/predicting. +""" +function is_training()::Bool + state = Ref{Cint}(C_NULL) + @mxcall(:MXAutogradIsTraining, (Ref{Cint},), state) + state[] +end + +@inline function _record(f, is_record::Union{Void,Bool}, train_mode::Union{Void,Bool}) + # Port from Python's `_RecordingStateScope` context manager + # __enter__ + prev_is_record = _set_recording(is_record) + prev_train_mode = _set_training(train_mode) + + try + f() + finally + # __exit__ + if is_record != nothing && prev_is_record != is_record + _set_recording(prev_is_record) + end + if train_mode != nothing && prev_train_mode != train_mode + _set_training(prev_train_mode) + end + end +end + +""" + record(f, train_mode = true) + record(train_mode = true) do + ... + end + +Returns an autograd recording scope context to be used in `do` block +and captures code that needs gradients to be calculated. + +Parameter `train_mode::Bool` controls whether the forward pass is in training +or predicting mode. +This controls the behavior of some layers such as `Dropout`, `BatchNorm`. + +!!! note + When forwarding with `train_mode = false`, the corresponding backward + should also use `train_mode = false`, otherwise gradient is undefined. + +```julia +x = mx.NDArray([1 2; 3 4]) +∇ = mx.attach_grad!(x) +y = mx.record() do + 2x +end +mx.backward!(y) + +julia> ∇ +2×2 mx.NDArray{Int64,2} @ CPU0: + 2 2 + 2 2 +``` +""" +record(f, train_mode::Bool = true) = _record(f, true, train_mode) + +""" + pause(f, train_mode = false) + pause(train_mode = false) do + ... + end + +Create a scope context for codes that do not need gradients to be calculated. + +```julia +record() do + ... + pause() do + # testing, IO, gradient updates... 
+ end +end +``` +""" +pause(f, train_mode::Bool = false) = _record(f, false, train_mode) + +""" + train_mode(f) + train_mode() do + ... + end + +Create a scope context in which forward pass behavior is set to training mode, +without changing the recording states. + +```julia +y = model(x) +train_mode() do + z = mx.Dropout(y) + ... +end +``` +""" +train_mode(f) = _record(f, nothing, true) + +""" + predict_mode(f) + predict_mode() do + ... + end + +Create a scope context in which forward pass behavior is set to inference mode, +without changing the recording states. + +```julia +record() do + y = model(x) + predict_mode() do + y = sampling(y) + end +end +``` +""" +predict_mode(f) = _record(f, nothing, false) + +""" + backward!(head, head_grad; retain_graph = false, train_mode = true) + backward!(heads, head_grads; retain_graph = false, train_mode = true) + +Compute the gradients of heads w.r.t previously marked variables. + +## Parameters + +- `head::NDArray`: output NDArray + +- `head_grad::NDArray` or `Void`: gradient coefficient with respect to head. + +- `heads::Vector{NDArray}`: a list of output NDArray + +- `head_grads::Vector`: a list of gradient coefficient with respect to heads. + the element should be `NDArray` or `Void` + +- `retain_graph::Bool`: whether to keep the graph after backward. e.g: + If you want to differentiate the same graph twice, + you need to pass `retain_graph=true`. + +- `train_mode::Bool`: whether to do backward for training or predicting. +""" +backward!(head::NDArray, head_grad::NDArray; kws...) = + backward!([head], [head_grad]; kws...) + +backward!(head::NDArray, head_grad::Void = nothing; kws...) = + backward!([head], head_grad; kws...) 
+ +function backward!(heads::VecOfNDArray, head_grad::Void; + retain_graph::Bool = false, train_mode::Bool = true) + @mxcall( + :MXAutogradBackwardEx, + (MX_uint, + Ptr{MX_handle}, + Ptr{MX_handle}, + MX_uint, + Ptr{MX_handle}, + Cint, + Cint, + Cint, + Ptr{MX_handle}, + Ptr{MX_handle}), + length(heads), + map(x -> x.handle, heads), + C_NULL, + 0, + C_NULL, + retain_graph, + false, # create_graph + train_mode, + C_NULL, + C_NULL) +end + +function backward!(heads::VecOfNDArray, head_grads::Vector; + retain_graph::Bool = false, train_mode::Bool = true) + output_handles = map(x -> x.handle, heads) + ograd_handles = map(head_grads) do x + if x isa NDArray + x.handle + elseif x isa Void + MX_handle(C_NULL) + else + throw(ArgumentError("element of head_grads should be NDArray or Void")) + end + end + @assert length(output_handles) == length(ograd_handles) + @mxcall( + :MXAutogradBackwardEx, + (MX_uint, + Ptr{MX_handle}, + Ptr{MX_handle}, + MX_uint, + Ptr{MX_handle}, + Cint, + Cint, + Cint, + Ptr{MX_handle}, + Ptr{MX_handle}), + length(output_handles), + output_handles, + ograd_handles, + 0, + C_NULL, + retain_graph, + false, # create_graph + train_mode, + C_NULL, + C_NULL) +end + +""" + getgrad(arr::NDArray) + +Returns the gradient buffer attached to this `NDArray`. +If the gradient buffer isn't attached yet, return `nothing`. +""" +function getgrad(arr::NDArray) + out = Ref{MX_handle}(C_NULL) + @mxcall(:MXNDArrayGetGrad, (MX_handle, Ref{MX_handle}), arr.handle, out) + (out[] == C_NULL) ? nothing : NDArray(MX_NDArrayHandle(out[])) +end + +""" + attach_grad!(x::NDArray, grad_req::Symbol = :write) + +Attach a gradient buffer to this `NDArray`, +so that [`backward!`](@ref) can compute gradient with respect to it. 
+ +## Parameters + +- `x::NDArray` +- `grad_req::Symbol` (default is `:write`) + +## Return + +The attached gradient buffer + +## See also + +- [`getgrad`](@ref) +""" +function attach_grad!(x::NDArray, grad_req::Symbol = :write) + # TODO: support storage type (stype in Python) + # TODO: make sure it works with gpu array + grad = zeros_like(x) + _mark_variables!([x], [grad], grad_req) + grad +end + +""" + mark_variables!(var, grad, grad_req) + mark_variables!(vars, grads, grad_reqs) + +Mark `NDArrays` as variables to compute gradient for autograd. + +## Parameters + +- `var::NDArray` +- `grad::NDArray` +- `grad_req::Symbol`: `:nop`, `:write`, `:inplace` or `:add` +- `vars::Vector{NDArray}` +- `grads::Vector{NDArray}` +- `grad_req::Vector{Symbol}` +""" +mark_variables!(var::NDArray, grad::NDArray, grad_reqs::Symbol = :write) = + _mark_variables!([var], [grad], grad_reqs) + +mark_variables!(var::VecOfNDArray, grads::VecOfNDArray, grad_reqs = :write) = + _mark_variables!(var, grads, grad_reqs) + +@inline function _getgrad_req(x::Symbol)::GRAD_REQ + val = get(grad_req_map, x, false) + if val == false + throw(ArgumentError("invalid grad_reqs $x")) + end + val +end + +@inline _getgrad_reqs(x::Symbol, n::Int) = + map((_) -> MX_uint(_getgrad_req(x)), Base.OneTo(n)) + +@inline function _getgrad_reqs(xs::Vector{Symbol}, n::Int) + if length(xs) != n + throw(ArgumentError("number of variables and grad_reqs not matched")) + end + map(MX_uint ∘ _getgrad_req, xs) +end + +@inline function _mark_variables!(vars::VecOfNDArray, grads::VecOfNDArray, + grad_reqs = :write) + n = length(vars) + if n != length(grads) + throw(ArgumentError("number of variables and gradients not matched")) + end + + var_hdls = map(x -> x.handle, vars) + grad_hdls = map(x -> x.handle, grads) + grad_reqs = _getgrad_reqs(grad_reqs, n) + + @mxcall(:MXAutogradMarkVariables, + (MX_uint, Ref{MX_handle}, Ptr{MX_uint}, Ref{MX_handle}), + length(vars), var_hdls, grad_reqs, grad_hdls) +end + +""" + symbol(x::NDArray) + 
+Retrieve recorded computation history as `SymbolicNode`, + where `x` is a `NDArray` representing the head of computation graph. + """ +function symbol(x::NDArray) + ref = Ref{MX_handle}(C_NULL) + @mxcall(:MXAutogradGetSymbol, (MX_handle, Ref{MX_handle}), x, ref) + SymbolicNode(MX_SymbolHandle(ref[])) +end + +############################################################################### +# TODO: User-defined differentiable function +############################################################################### diff --git a/src/base.jl b/src/base.jl index 8f14d44c6b3d..b8f73eb4e6bc 100644 --- a/src/base.jl +++ b/src/base.jl @@ -20,7 +20,7 @@ const char_pp = Ptr{char_p} ################################################################################ # OpReqType in include/mxnet/op_attr_types.h @enum GRAD_REQ GRAD_NOP=0 GRAD_WRITE=1 GRAD_INPLACE=2 GRAD_ADD=3 -const grad_req_map = Dict{Symbol, GRAD_REQ}( +const grad_req_map = Dict{Symbol,GRAD_REQ}( :nop => GRAD_NOP, # no operation, do not write anything :write => GRAD_WRITE, # write gradient to provided space :inplace => GRAD_INPLACE, # perform an inplace write diff --git a/src/ndarray.jl b/src/ndarray.jl index 139e40ef1e59..de5d6ba4fba4 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -306,10 +306,10 @@ dimension. For example, given an `NDArray` of shape (2,3,4), `slice(array, 2:3)` a `NDArray` of shape (2,3,2), sharing the data with the original array. This operation is used in data parallelization to split mini-batch into sub-batches for different devices. 
""" -function slice(arr :: NDArray, ::Colon) +function slice(arr::NDArray, ::Colon) arr end -function slice(arr :: NDArray, slice::UnitRange{Int}) +function slice(arr::NDArray, slice::UnitRange{Int}) dim1 = size(arr)[end] @assert(1 <= slice.start <= slice.stop <= dim1) if slice.start == 1 && slice.stop == dim1 diff --git a/test/unittest/autograd.jl b/test/unittest/autograd.jl new file mode 100644 index 000000000000..12c1022bd208 --- /dev/null +++ b/test/unittest/autograd.jl @@ -0,0 +1,386 @@ +module TestAutoGrad + +using Base.Test + +using MXNet + + +function checkgradient(f, x, y, ∇) + ∇x = mx.attach_grad!(x) + y′ = mx.record(f) + @test copy(y′) ≈ y + @test copy(∇x) |> sum == 0 + mx.backward!(y′) + @test copy(mx.getgrad(x)) ≈ ∇ +end # function checkgradient + + +function test_getgrad() + info("AutoGrad::getgrad") + + info("AutoGrad::getgrad::unattached") + @test nothing == mx.getgrad(mx.zeros(10)) + + info("AutoGrad::getgrad::attached") + x = mx.NDArray([1 2; 3 4]) + grad = mx.attach_grad!(x) + @test eltype(grad) ≡ Int + @test copy(grad) == [0 0; 0 0] + + grad[:] = 42 + @test copy(mx.getgrad(x)) == [42 42; 42 42] +end + + +function test_mark_variables!() + info("AutoGrad::mark_variables!") + x = mx.zeros(4) + ẋ = mx.zeros(4) + y = mx.zeros(4) + ẏ = mx.zeros(4) + mx.mark_variables!([x, y], [ẋ, ẏ], [:nop, :nop]) + ẋ[:] = 42 + ẏ[:] = 24 + + @test copy(mx.getgrad(x)) == [42, 42, 42, 42] + @test copy(mx.getgrad(y)) == [24, 24, 24, 24] + + info("AutoGrad::mark_variables!::invalid grad_reqs") + x = mx.zeros(4) + y = mx.zeros(4) + @test_throws ArgumentError mx.mark_variables!(x, y, :magic) + @test_throws ArgumentError mx.mark_variables!([x], [y], [:magic]) + + info("AutoGrad::mark_variables!::args length mismatch") + x = mx.zeros(4) + y = mx.zeros(4) + z = mx.zeros(4) + @test_throws ArgumentError mx.mark_variables!([x], [y, z]) + @test_throws ArgumentError mx.mark_variables!([x], [y], [:write, :nop]) +end + + +function test_record() + let x = mx.NDArray([1 2; 3 4]) + 
info("AutoGrad::record::backward!") + + y = [1 4; 9 16] + ∇ = [2 4; 6 8] # gradient is 2x + checkgradient(x, y, ∇) do + mx.square(x) + end + end + + let x = mx.NDArray([1 2; 3 4]) + info("AutoGrad::record::symbol") + + mx.attach_grad!(x) + y = mx.record() do + mx.square(x) + end + + @test copy(y) == [1 4; 9 16] + + @test isa(mx.symbol(y), mx.SymbolicNode) + end + + let x = mx.NDArray([1 2; 3 4]) + info("AutoGrad::record::backward!(retain_graph=true)") + + mx.attach_grad!(x) + y = mx.record() do + mx.square(x) + end + + @test copy(y) == [1 4; 9 16] + + mx.backward!(y, retain_graph=true) + # gradient is 2x + @test copy(mx.getgrad(x)) == [2 4; 6 8] + + @test isa(mx.symbol(y), mx.SymbolicNode) + end + + mx._record(nothing, nothing) do # no error with edage case + @test true + end +end # function test_record + + +function test_is_recording() + info("AutoGrad::is_recording") + mx.record() do + @test mx.is_recording() + end +end # function test_is_recording + + +function test_is_training() + info("AutoGrad::is_training") + mx.record() do + @test mx.is_training() + end + + mx.record(false) do + @test !mx.is_training() + end +end # function test_is_training + + +function test_pause() + info("AutoGrad::pause") + let x = mx.NDArray([1 2; 3 4]) + ∇ = mx.attach_grad!(x) + y = mx.record() do + y = mx.square(x) + mx.pause() do + z = mx.square(y) + @test copy(z) == [1 16; 81 256] + end + y + end + + @test copy(y) == [1 4; 9 16] + + mx.backward!(y) + @test copy(∇) == [2 4; 6 8] + end +end # function test_pause + + +function test_train_mode() + info("AutoGrad::train_mode") + let x = mx.NDArray(Float32[1 2; 3 4]) + y = mx.train_mode() do + mx.Dropout(x, p = 1) + end + + @test all(isnan.(copy(y))) + end +end # function test_train_mode + + +function test_predict_mode() + info("AutoGrad::predict_mode") + let x = mx.NDArray(Float32[1 2; 3 4]) + y = mx.predict_mode() do + mx.Dropout(x, p = 1) + end + + @test copy(y) ≈ Float32[1 2; 3 4] + end +end # function test_train_mode + + +function 
test_backward!() + info("AutoGrad::backward!::with head_grad") + let x = mx.NDArray(Float32[1 2; 3 4]), A = Float32[.2 .4; 0 .1] + ∇ = mx.attach_grad!(x) + y = mx.record() do + mx.square(x) + end + mx.backward!(y, mx.NDArray(A)) + @test copy(∇) ≈ [2 4; 6 8] .* A + end + + info("AutoGrad::backward!::with head_grads") + let x = mx.NDArray(Float32[1 2; 3 4]) + ∇ = mx.attach_grad!(x) + mx.record() do + x′ = mx.square(x) + y = mx.square(x) + z = mx.square(x) .+ 42 + mx.backward!([x′, y, z], [nothing, + mx.NDArray(Float32[.01 .01; 1 1]), + mx.NDArray(Float32[1 1; .1 .1])]) + end + ans = [4.02 8.04 + 12.6 16.8] + @test copy(∇) ≈ ans + end + + info("AutoGrad::backward!::ArgumentError") + let x = mx.NDArray([42]) + @test_throws ArgumentError mx.backward!([x], [24]) + end +end # function test_backward! + + +function test_symbol() + info("AutoGrad::symbol") + + let x = mx.zeros(4) + mx.attach_grad!(x) + @test isa(mx.symbol(x), mx.SymbolicNode) + end +end + + +function test_add() + info("AutoGrad::add") + + info("AutoGrad::add::x") + let x = mx.NDArray([1 2; 3 4]) + y = [1 2; 3 4] + ∇ = [1 1; 1 1] # gradient is 1 + checkgradient(x, y, ∇) do + x + end + end + + info("AutoGrad::add::+x") + let x = mx.NDArray([1 2; 3 4]) + y = [1 2; 3 4] + ∇ = [1 1; 1 1] # gradient is 1 + checkgradient(x, y, ∇) do + +x + end + end + + info("AutoGrad::add::x .+ 42") + let x = mx.NDArray([1 2; 3 4]) + y = [43 44; 45 46] + ∇ = [1 1; 1 1] # gradient is 1 + checkgradient(x, y, ∇) do + x .+ 42 + end + end + + info("AutoGrad::add::42 .+ x") + let x = mx.NDArray([1 2; 3 4]) + y = [43 44; 45 46] + ∇ = [1 1; 1 1] + checkgradient(x, y, ∇) do + 42 .+ x + end + end + + # TODO: info("AutoGrad::add::x .+ y") +end # function test_add + + +function test_sub() + info("AutoGrad::sub") + + info("AutoGrad::sub::-x") + let x = mx.NDArray([1 2; 3 4]) + y = [-1 -2; -3 -4] + ∇ = [-1 -1; -1 -1] # gradient is -1 + checkgradient(x, y, ∇) do + -x + end + end + + info("AutoGrad::sub::x .- 42") + let x = mx.NDArray([1 2; 3 4]) 
+ y = [-41 -40; -39 -38] + ∇ = [1 1; 1 1] + checkgradient(x, y, ∇) do + x .- 42 + end + end + + info("AutoGrad::sub::42 .- x") + let x = mx.NDArray([1 2; 3 4]) + y = [41 40; 39 38] + ∇ = -[1 1; 1 1] + checkgradient(x, y, ∇) do + 42 .- x + end + end + + # TODO: info("AutoGrad::add::x .- y") +end # function test_sub + + +function test_mul() + info("AutoGrad::mul") + + info("AutoGrad::mul::2x .* x") + let x = mx.NDArray([1 2; 3 4]) + y = [2 8; 18 32] + ∇ = [4 8; 12 16] # 4x + checkgradient(x, y, ∇) do + 2x .* x + end + end + + info("AutoGrad::mul::x * 2 .* x") + let x = mx.NDArray([1 2; 3 4]) + y = [2 8; 18 32] + ∇ = [4 8; 12 16] # 4x + checkgradient(x, y, ∇) do + x * 2 .* x + end + end +end + + +function test_div() + info("AutoGrad::div") + + info("AutoGrad::div::x ./ 2") + let x = mx.NDArray(Float32[1 2; 3 4]) + y = Float32[.5 1; 1.5 2] + ∇ = [.5 .5; .5 .5] + checkgradient(x, y, ∇) do + x ./ 2 + end + end + + info("AutoGrad::rdiv::2 ./ x") + let A = Float32[1 2; 3 4], x = mx.NDArray(A) + y = 2 ./ A + ∇ = @. 
-2 / A^2 # -2 / x² + checkgradient(x, y, ∇) do + 2 ./ x + end + end +end # function test_div + + +function test_power() + info("AutoGrad::power") + + info("AutoGrad::power::x.^3") + let A = Float32[1 2; 3 4] + x = mx.NDArray(A) + y = A.^3 + ∇ = 3(A.^2) + checkgradient(x, y, ∇) do + x.^3 + end + end + + info("AutoGrad::power::x.^.5") + let A = Float32[1 2; 3 4] + x = mx.NDArray(A) + y = A.^.5 + ∇ = .5(A.^-.5) + checkgradient(x, y, ∇) do + x.^.5 + end + end +end + + +@testset "AutoGrad Test" begin + test_getgrad() + test_mark_variables!() + test_record() + test_is_recording() + test_is_training() + test_pause() + test_train_mode() + test_predict_mode() + test_backward!() + test_symbol() + test_add() + test_sub() + test_mul() + test_div() + test_power() +end + + +end # model TestAutoGrad diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index a24126cf194b..ef4fb1f2373c 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -502,7 +502,7 @@ function test_rdiv() @test copy(x) ≈ y end - info("NDArray:rdiv::type convert") + info("NDArray::rdiv::type convert") let x = mx.NDArray([1, 2, 3]) y = 5.5 ./ x @test eltype(y) == Int # this differs from julia From 883cdd39dd96a884fde758ce94a4d0106b5e0307 Mon Sep 17 00:00:00 2001 From: Nicu Stiurca Date: Mon, 18 Dec 2017 17:56:30 -0600 Subject: [PATCH 600/630] build: make appending lib to MXNET_HOME optional (#386) The MXNet shared libraries are not necessarily in a lib subdirectory. 
--- deps/build.jl | 5 +++-- src/base.jl | 1 + 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index b09e5f44242e..ff4441227cac 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -8,10 +8,11 @@ libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "master") curr_win = "20171019" # v0.12.0 if haskey(ENV, "MXNET_HOME") - info("MXNET_HOME environment detected: $(ENV["MXNET_HOME"])") + MXNET_HOME = ENV["MXNET_HOME"] + info("MXNET_HOME environment detected: $MXNET_HOME") info("Trying to load existing libmxnet...") lib = Libdl.find_library("libmxnet.$(Libdl.dlext)", - ["$(ENV["MXNET_HOME"])/lib"]) + [joinpath(MXNET_HOME, "lib"), MXNET_HOME]) if !isempty(lib) info("Existing libmxnet detected at $lib, skip building...") libmxnet_detected = true diff --git a/src/base.jl b/src/base.jl index b8f73eb4e6bc..271e35607880 100644 --- a/src/base.jl +++ b/src/base.jl @@ -32,6 +32,7 @@ const grad_req_map = Dict{Symbol,GRAD_REQ}( ################################################################################ const MXNET_LIB = Libdl.find_library("libmxnet.$(Libdl.dlext)", [joinpath(get(ENV, "MXNET_HOME", ""), "lib"), + get(ENV, "MXNET_HOME", ""), Pkg.dir("MXNet", "deps", "usr", "lib")]) if isempty(MXNET_LIB) # touch this file, so that after the user properly build libmxnet, the precompiled From bfeba817bac0216e1cb19e147acc5665bfb732cd Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 21 Dec 2017 09:50:58 +0800 Subject: [PATCH 601/630] ndarray: support matrix/tensor multiplication (#384) --- NEWS.md | 20 ++++++++++++++++++++ src/ndarray.jl | 8 ++++---- test/unittest/ndarray.jl | 23 ++++++++++++++++++++++- 3 files changed, 46 insertions(+), 5 deletions(-) diff --git a/NEWS.md b/NEWS.md index 4540cba50fef..efd3299e337c 100644 --- a/NEWS.md +++ b/NEWS.md @@ -161,6 +161,26 @@ 1.0 2.0 3.0 4.0 ``` +* Matrix/tensor multiplication is supported now. 
(#TBD) + + ```julia + julia> x + 2×3 mx.NDArray{Float32,2} @ CPU0: + 1.0 2.0 3.0 + 4.0 5.0 6.0 + + julia> y + 3 mx.NDArray{Float32,1} @ CPU0: + -1.0 + -2.0 + -3.0 + + julia> x * y + 2 mx.NDArray{Float32,1} @ CPU0: + -14.0 + -32.0 + ``` + ## API Changes ### `NDArray` diff --git a/src/ndarray.jl b/src/ndarray.jl index de5d6ba4fba4..ef2293486f07 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -674,7 +674,7 @@ import Base: * """ .*(x, y) -Currently only multiplication a scalar with an `NDArray` is implemented. +Elementwise multiplication for `NDArray`. """ *(x::NDArray, y::Real) = _mul_scalar(x, scalar = y) *(y::Real, x::NDArray) = _mul_scalar(x, scalar = y) @@ -686,9 +686,9 @@ broadcast_(::typeof(*), x::NDArray, y::NDArray) = _mul(x, y) """ *(A::NDArray, B::NDArray) -Matrix (2D NDArray) multiplication. +Matrix/tensor multiplication. """ -*(x::NDArray{T,2}, y::NDArray{S,2}) where {T,S} = dot(x, y) +*(x::NDArray{T}, y::NDArray{T}) where T = x ⋅ y """ div_from!(dst::NDArray, arg::NDArrayOrReal) @@ -1165,7 +1165,7 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap minimum(arr::NDArray, dims) min(arr; axis = 0 .- dims, keepdims = true) # See https://github.com/dmlc/MXNet.jl/issues/55 -@_remap dot(x::NDArray{T,N}, y::NDArray{S,N}) where {T,S,N} dot(y, x) +@_remap dot(x::NDArray, y::NDArray) dot(y, x) # See https://github.com/dmlc/MXNet.jl/pull/123 @_remap transpose(arr::NDArray{T,1}) where T reshape(arr; shape = (1, length(arr)), reverse = true) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index ef4fb1f2373c..e7b70d2e3884 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -740,7 +740,28 @@ function test_dot() x = mx.zeros(1, 2) y = mx.zeros(1, 2, 3) - @test_throws MethodError dot(x, y) + @test_throws mx.MXError dot(x, y) # dimension mismatch + + info("NDArray::matrix mul") + let + A = [1. 
2 3; 4 5 6] + B = [-1., -2, -3] + x = NDArray(A) + y = NDArray(B) + z = x * y + @test copy(z) == A * B + @test size(z) == (2,) + end + + let + A = [1. 2 3; 4 5 6] + B = [-1. -2; -3 -4; -5 -6] + x = NDArray(A) + y = NDArray(B) + z = x * y + @test copy(z) == A * B + @test size(z) == (2, 2) + end end function test_eltype() From 378789509632e51d5ca98f64bc131d5f062efb50 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 21 Dec 2017 12:48:02 +0800 Subject: [PATCH 602/630] ndarray: remap expand_dims (#381) --- NEWS.md | 1 + src/MXNet.jl | 3 ++- src/ndarray.jl | 39 +++++++++++++++++++++++++--- test/unittest/ndarray.jl | 55 ++++++++++++++++++++++++++++++---------- 4 files changed, 80 insertions(+), 18 deletions(-) diff --git a/NEWS.md b/NEWS.md index efd3299e337c..fe8f7d613687 100644 --- a/NEWS.md +++ b/NEWS.md @@ -4,6 +4,7 @@ * `NDArray` * `context()` * `empty()` + * `expand_dims()` * `SymbolicNode` * `Variable` diff --git a/src/MXNet.jl b/src/MXNet.jl index 352d20aad150..734abfd76650 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -32,7 +32,8 @@ export SymbolicNode, # ndarray.jl export NDArray, context, - empty + empty, + expand_dims # executor.jl export Executor, diff --git a/src/ndarray.jl b/src/ndarray.jl index ef2293486f07..274c306c7441 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1045,7 +1045,8 @@ end # Mapping NDArray functions to Base-like API ################################################################################ -const _mxsig = Dict{Symbol,Expr}() +const _ndsig = Dict{Symbol,Expr}() +const _nddoc = Dict{Symbol,Any}() function _autoimport(name::Symbol, sig::Expr) if name == :broadcast_ @@ -1074,6 +1075,9 @@ _broadcast_target(sig::Expr) = sig.args[2].args[].args[end] Generate docstring from function signature """ function _docsig(fname::Symbol, sig::Expr) + s = get(_nddoc, fname, "") + !isempty(s) && return s + if fname !== :broadcast_ " $sig" else @@ -1141,14 +1145,14 @@ macro _remap(sig::Expr, imp::Expr) end macro _remap(sig::Expr, imp::Symbol) 
- imp = _mxsig[imp] + imp = _ndsig[imp] esc(quote @_remap($sig, $imp) end) end -_mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) +_ndsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap reshape(arr::NDArray, dim...; reverse = false) reshape @_remap reshape(arr::NDArray, dim; reverse = false) reshape @@ -1175,6 +1179,34 @@ _mxsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap prod(arr::NDArray) prod(arr) @_remap prod(arr::NDArray, dims) prod(arr; axis = 0 .- dims, keepdims = true) +_nddoc[:expand_dims] = +""" + expand_dims(x::NDArray, dim) + +Insert a new axis into `dim`. + +```julia +julia> x +4 mx.NDArray{Float64,1} @ CPU0: + 1.0 + 2.0 + 3.0 + 4.0 + +julia> mx.expand_dims(x, 1) +1×4 mx.NDArray{Float64,2} @ CPU0: + 1.0 2.0 3.0 4.0 + +julia> mx.expand_dims(x, 2) +4×1 mx.NDArray{Float64,2} @ CPU0: + 1.0 + 2.0 + 3.0 + 4.0 +``` +""" +@_remap expand_dims(x::NDArray, dim) expand_dims(x; axis = -dim) + # trigonometric functions, remap to keep consistent with Base @_remap broadcast_(::typeof(sin), x::NDArray) sin(x) @_remap broadcast_(::typeof(cos), x::NDArray) cos(x) @@ -1318,6 +1350,7 @@ const _op_import_bl = [ # import black list; do not import these funcs "_full", # we already have `mx.fill` "_ones", # we already have `mx.ones` "_zeros", # we already have `mx.zeros` + "expand_dims", # arithmetic "_plus", diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index e7b70d2e3884..6b258fe99646 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -779,27 +779,53 @@ function test_eltype() end function test_reshape() - info("NDArray::reshape") - A = rand(2, 3, 4) + info("NDArray::reshape") + A = rand(2, 3, 4) - B = reshape(mx.NDArray(A), 4, 3, 2) - @test size(B) == (4, 3, 2) - @test copy(B)[3, 1, 1] == A[1, 2, 1] + B = reshape(NDArray(A), 4, 3, 2) + @test size(B) == (4, 3, 2) + @test copy(B)[3, 1, 1] == A[1, 2, 1] - C = reshape(mx.NDArray(A), (4, 3, 2)) - @test size(C) == (4, 3, 2) - 
@test copy(C)[3, 1, 1] == A[1, 2, 1] + C = reshape(NDArray(A), (4, 3, 2)) + @test size(C) == (4, 3, 2) + @test copy(C)[3, 1, 1] == A[1, 2, 1] - info("NDArray::reshape::reverse") - A = mx.zeros(10, 5, 4) + info("NDArray::reshape::reverse") + A = mx.zeros(10, 5, 4) - B = reshape(A, -1, 0) - @test size(B) == (40, 5) + B = reshape(A, -1, 0) + @test size(B) == (40, 5) - C = reshape(A, -1, 0, reverse=true) - @test size(C) == (50, 4) + C = reshape(A, -1, 0, reverse=true) + @test size(C) == (50, 4) end +function test_expand_dims() + info("NDArray::expand_dims") + let A = [1, 2, 3, 4], x = NDArray(A) + @test size(x) == (4,) + + y = expand_dims(x, 1) + @test size(y) == (1, 4) + + y = expand_dims(x, 2) + @test size(y) == (4, 1) + end + + let A = [1 2; 3 4; 5 6], x = NDArray(A) + @test size(x) == (3, 2) + + y = expand_dims(x, 1) + @test size(y) == (1, 3, 2) + + y = expand_dims(x, 2) + @test size(y) == (3, 1, 2) + + y = expand_dims(x, 3) + @test size(y) == (3, 2, 1) + end +end # test_expand_dims + function test_sum() info("NDArray::sum") @@ -1025,6 +1051,7 @@ end # function test_hyperbolic test_nd_as_jl() test_dot() test_reshape() + test_expand_dims() test_sum() test_mean() test_maximum() From 813bfdcfe68cf651f875f43ea9e2aff30c010102 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 22 Dec 2017 01:42:46 +0800 Subject: [PATCH 603/630] random: Base-like APIs for rand, rand!, randn, randn! (#383) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * random: Base-like APIs for rand, rand!, randn, randn! 
and deprecate the original APIs ```julia julia> mx.rand(2, 3) 2×3 mx.NDArray{Float32,2} @ CPU0: 0.631961 0.324175 0.0762663 0.285366 0.395292 0.074995 julia> mx.rand(2, 3, low = low, high = high) 2×3 mx.NDArray{Float32,2} @ CPU0: 7.83884 7.85793 7.64791 7.68646 8.56082 8.42189 ``` ```julia julia> mx.randn(2, 3) 2×3 mx.NDArray{Float32,2} @ CPU0: 0.962853 0.424535 -0.320123 0.478113 1.72886 1.72287 julia> mx.randn(2, 3, μ = 100) 2×3 mx.NDArray{Float32,2} @ CPU0: 99.5635 100.483 99.888 99.9889 100.533 100.072 ``` * fix depwarn --- NEWS.md | 26 +++++++++++++++++ src/deprecated.jl | 26 +++++++++++++++++ src/initializer.jl | 14 ++++----- src/random.jl | 64 ++++++++++++++++++++--------------------- test/unittest/random.jl | 8 +++--- 5 files changed, 93 insertions(+), 45 deletions(-) diff --git a/NEWS.md b/NEWS.md index fe8f7d613687..c47fcacacb05 100644 --- a/NEWS.md +++ b/NEWS.md @@ -208,6 +208,32 @@ * `arccosh(x)` -> `acosh.(x)` * `arctanh(x)` -> `atanh.(x)` +* `rand`, `rand!`, `randn`, `randn!` is more Base-like now (#TBD). 
+ + ```julia + julia> mx.rand(2, 3) + 2×3 mx.NDArray{Float32,2} @ CPU0: + 0.631961 0.324175 0.0762663 + 0.285366 0.395292 0.074995 + + julia> mx.rand(2, 3; low = 1, high = 10) + 2×3 mx.NDArray{Float32,2} @ CPU0: + 7.83884 7.85793 7.64791 + 7.68646 8.56082 8.42189 + ``` + + ```julia + julia> mx.randn(2, 3) + 2×3 mx.NDArray{Float32,2} @ CPU0: + 0.962853 0.424535 -0.320123 + 0.478113 1.72886 1.72287 + + julia> mx.randn(2, 3, μ = 100) + 2×3 mx.NDArray{Float32,2} @ CPU0: + 99.5635 100.483 99.888 + 99.9889 100.533 100.072 + ``` + # v0.3.0 (2017.11.16) * Update `libmxnet` to diff --git a/src/deprecated.jl b/src/deprecated.jl index 8a8df0a56789..0167d57c4b83 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -23,3 +23,29 @@ @deprecate arcsinh(x::NDArray) asinh.(x) @deprecate arccosh(x::NDArray) acosh.(x) @deprecate arctanh(x::NDArray) atanh.(x) + +# @deprecate make `randn` exported accidentially +# so we make the depwarn manually +function randn(μ, σ, dims::NTuple{N,Int}, ctx::Context = cpu()) where N + warn("mx.randn(μ, σ, dims, ctx = cpu()) is deprecated, use " * + "mx.randn(dims...; μ = μ, σ = σ, context = ctx) instead.") + mx.randn(dims...; μ = μ, σ = σ, context = ctx) +end + +function randn!(μ, σ, x::NDArray) + warn("mx.randn!(μ, σ, x::NDArray) is deprecated, use " * + "mx.randn!(x; μ = μ, σ = σ) instead.") + randn!(x; μ = μ, σ = σ) +end + +function rand!(low::Real, high::Real, x::NDArray) + warn("rand!(low, high, x::NDArray) is deprecated, use " * + "rand!(x, low = low, high = high) instead.") + rand!(x, low = low, high = high) +end + +function rand(low::Real, high::Real, dims::NTuple{N,Int}, context::Context = cpu()) where N + warn("rand!(low, high, dims, x::NDArray, context = cpu()) is deprecated, use " * + "rand!(dims..., x; low = low, high = high, context = cpu()) instead.") + rand(dims...; low = low, high = high, context = context) +end diff --git a/src/initializer.jl b/src/initializer.jl index 157958586642..188c5deb6255 100644 --- a/src/initializer.jl 
+++ b/src/initializer.jl @@ -104,9 +104,8 @@ Construct a `UniformInitializer` with the specified scale. """ UniformInitializer() = UniformInitializer(0.07) -function _init_weight(self :: UniformInitializer, name :: Base.Symbol, array :: NDArray) - rand!(-self.scale, self.scale, array) -end +_init_weight(i::UniformInitializer, name::Symbol, x::NDArray) = + rand!(x, low = -i.scale, high = i.scale) """ NormalInitializer @@ -124,9 +123,8 @@ Construct a `NormalInitializer` with mean `mu` and variance `sigma`. """ NormalInitializer(; mu=0, sigma=0.01) = NormalInitializer(mu, sigma) -function _init_weight(self :: NormalInitializer, name :: Base.Symbol, array :: NDArray) - randn!(self.μ, self.σ, array) -end +_init_weight(i::NormalInitializer, name::Symbol, x::NDArray) = + randn!(x, μ = i.μ, σ = i.σ) """ XavierInitializer @@ -175,8 +173,8 @@ function _init_weight(self :: XavierInitializer, name :: Base.Symbol, array :: N σ = √(self.magnitude / factor) if self.distribution == xv_uniform - rand!(-σ, σ, array) + rand!(array, low = -σ, high = σ) elseif self.distribution == xv_normal - randn!(0.0, σ, array) + randn!(array; μ = 0.0, σ = σ) end end diff --git a/src/random.jl b/src/random.jl index 3c5f1dcb564b..1f612e310fe8 100644 --- a/src/random.jl +++ b/src/random.jl @@ -1,68 +1,66 @@ """ - rand!(low, high, arr::NDArray) + rand!(x::NDArray; low = 0, high = 1) Draw random samples from a uniform distribution. Samples are uniformly distributed over the half-open interval [low, high) (includes low, but excludes high). 
-# Examples - ```julia -julia> mx.rand(0, 1, mx.zeros(2, 2)) |> copy -2×2 Array{Float32,2}: - 0.405374 0.321043 - 0.281153 0.713927 +julia> mx.rand!(empty(2, 3)) +2×3 mx.NDArray{Float32,2} @ CPU0: + 0.385748 0.839275 0.444536 + 0.0879585 0.215928 0.104636 + +julia> mx.rand!(empty(2, 3), low = 1, high = 10) +2×3 mx.NDArray{Float32,2} @ CPU0: + 6.6385 4.18888 2.07505 + 8.97283 2.5636 1.95586 ``` """ -function rand!(low::Real, high::Real, out::NDArray) - _random_uniform(NDArray, low=low, high=high, shape=size(out), out=out) -end +rand!(x::NDArray; low = 0, high = 1) = + _random_uniform(NDArray, low = low, high = high, shape = size(x), out = x) """ - rand(low, high, shape, context=cpu()) + rand(dims...; low = 0, high = 1, context = cpu()) Draw random samples from a uniform distribution. Samples are uniformly distributed over the half-open interval [low, high) (includes low, but excludes high). -# Examples - ```julia -julia> mx.rand(0, 1, (2, 2)) |> copy -2×2 Array{Float32,2}: - 0.405374 0.321043 - 0.281153 0.713927 +julia> mx.rand(2, 2) +2×2 mx.NDArray{Float32,2} @ CPU0: + 0.487866 0.825691 + 0.0234245 0.794797 + +julia> mx.rand(2, 2; low = 1, high = 10) +2×2 mx.NDArray{Float32,2} @ CPU0: + 5.5944 5.74281 + 9.81258 3.58068 ``` """ -function rand(low::Real, high::Real, shape::NTuple{N, Int}, ctx::Context=cpu()) where N - out = empty(shape, ctx) - rand!(low, high, out) -end +rand(dims::Int...; low = 0, high = 1, context = cpu()) = + rand!(empty(dims, context), low = low, high = high) """ - randn!(mean, std, arr::NDArray) + randn!(x::NDArray; μ = 0, σ = 1) Draw random samples from a normal (Gaussian) distribution. 
""" -function randn!(mean::Real, stdvar::Real, out::NDArray) - _random_normal(NDArray, loc=mean, scale=stdvar, shape=size(out), out=out) -end +randn!(x::NDArray; μ = 0, σ = 1) = + _random_normal(NDArray, loc = μ, scale = σ, shape = size(x), out = x) """ - randn(mean, std, shape, context=cpu()) + randn(dims...; μ = 0, σ = 1, context = cpu()) Draw random samples from a normal (Gaussian) distribution. """ -function randn(mean::Real, stdvar::Real, shape::NTuple{N,Int}, ctx::Context=cpu()) where N - out = empty(shape, ctx) - randn!(mean, stdvar, out) -end +randn(dims::Int...; μ = 0, σ = 1, context = cpu()) = + randn!(empty(dims, context), μ = μ, σ = σ) """ srand(seed::Int) Set the random seed of libmxnet """ -function srand(seed_state::Int) - @mxcall(:MXRandomSeed, (Cint,), seed_state) -end +srand(seed_state::Int) = @mxcall(:MXRandomSeed, (Cint,), seed_state) diff --git a/test/unittest/random.jl b/test/unittest/random.jl index 30995ecf79bf..34b9d3625c0d 100644 --- a/test/unittest/random.jl +++ b/test/unittest/random.jl @@ -9,11 +9,11 @@ function test_uniform() low = -10; high = 10 seed = 123 mx.srand(seed) - ret1 = mx.rand(low, high, dims) + ret1 = mx.rand(dims..., low = low, high = high) mx.srand(seed) ret2 = mx.empty(dims) - mx.rand!(low, high, ret2) + mx.rand!(ret2, low = low, high = high) @test copy(ret1) == copy(ret2) @test abs(mean(copy(ret1)) - (high+low)/2) < 0.1 @@ -26,11 +26,11 @@ function test_gaussian() μ = 10; σ = 2 seed = 456 mx.srand(seed) - ret1 = mx.randn(μ, σ, dims) + ret1 = mx.randn(dims..., μ = μ, σ = σ) mx.srand(seed) ret2 = mx.empty(dims) - mx.randn!(μ, σ, ret2) + mx.randn!(ret2, μ = μ, σ = σ) @test copy(ret1) == copy(ret2) @test abs(mean(copy(ret1)) - μ) < 0.1 From d3cdbf6702fd8250456ffd7cbda94028948ad24e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 28 Dec 2017 10:50:13 +0800 Subject: [PATCH 604/630] ndarray: remap activation functions (#387) * sigmoid * relu * softmax * log_softmax --- NEWS.md | 15 +++++++ docs/src/api/ndarray.md | 11 
++++++ src/MXNet.jl | 8 +++- src/broadcast.jl | 7 ++++ src/deprecated.jl | 5 +++ src/ndarray.jl | 84 +++++++++++++++++++++++++++++++++++++--- test/unittest/ndarray.jl | 68 ++++++++++++++++++++++++++++++++ 7 files changed, 191 insertions(+), 7 deletions(-) diff --git a/NEWS.md b/NEWS.md index c47fcacacb05..63ca201b56b2 100644 --- a/NEWS.md +++ b/NEWS.md @@ -5,6 +5,11 @@ * `context()` * `empty()` * `expand_dims()` + * `σ()` + * `sigmoid()` + * `relu()` + * `softmax()` + * `log_softmax()` * `SymbolicNode` * `Variable` @@ -208,6 +213,16 @@ * `arccosh(x)` -> `acosh.(x)` * `arctanh(x)` -> `atanh.(x)` +* Please use dot-call on following activation functions. + And the `dim` of `softmax` and `log_softmax` has been fixed + as Julia column-based style. + (#TBD) + + * `σ.(x)` + * `relu.(x)` + * `softmax.(x, [dim = ndims(x)])` + * `log_softmax.(x, [dim = ndims(x)])` + * `rand`, `rand!`, `randn`, `randn!` is more Base-like now (#TBD). ```julia diff --git a/docs/src/api/ndarray.md b/docs/src/api/ndarray.md index 9582ff24a7ef..76fb6a39b621 100644 --- a/docs/src/api/ndarray.md +++ b/docs/src/api/ndarray.md @@ -37,6 +37,17 @@ In the following example `y` can be a `Real` value or another `NDArray` | [`atanh`](@ref) | `atanh.(x)` | Elementwise inverse hyperbolic tangent | +## Activation Functions + +| API | Example | | +|-----------------------|-------------------|-------------------------| +| [`σ`](@ref) | `σ.(x)` | Sigmoid function | +| [`sigmoid`](@ref) | `sigmoid.(x)` | Sigmoid function | +| [`relu`](@ref) | `relu.(x)` | ReLU function | +| [`softmax`](@ref) | `softmax.(x)` | Softmax function | +| [`log_softmax`](@ref) | `log_softmax.(x)` | Softmax followed by log | + + ## Reference ```@autodocs diff --git a/src/MXNet.jl b/src/MXNet.jl index 734abfd76650..8b0b8b8a0761 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -33,7 +33,13 @@ export SymbolicNode, export NDArray, context, empty, - expand_dims + expand_dims, + # activation funcs + σ, + sigmoid, + relu, + softmax, + log_softmax 
# executor.jl export Executor, diff --git a/src/broadcast.jl b/src/broadcast.jl index cdde7f46b2c9..5d15adf385cc 100644 --- a/src/broadcast.jl +++ b/src/broadcast.jl @@ -8,3 +8,10 @@ for f in :[%, @eval Base.$f(a::Broadcasted, b) = Broadcasted(broadcast_($f, unwrap(a), b)) @eval Base.$f(b, a::Broadcasted) = Broadcasted(broadcast_($f, b, unwrap(a))) end + +for f in :[σ, sigmoid, relu, softmax, log_softmax].args + # copy from TakingBroadcastSeriously + @eval $f(a::Broadcasted...) = Broadcasted(broadcast_($f, unwrap.(a)...)) + @eval $f(a::Broadcasted, b) = Broadcasted(broadcast_($f, unwrap(a), b)) + @eval $f(b, a::Broadcasted) = Broadcasted(broadcast_($f, b, unwrap(a))) +end diff --git a/src/deprecated.jl b/src/deprecated.jl index 0167d57c4b83..6b24411b4125 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -49,3 +49,8 @@ function rand(low::Real, high::Real, dims::NTuple{N,Int}, context::Context = cpu "rand!(dims..., x; low = low, high = high, context = cpu()) instead.") rand(dims...; low = low, high = high, context = context) end + +@deprecate sigmoid(x::NDArray) sigmoid.(x) +@deprecate relu(x::NDArray) relu.(x) +@deprecate softmax(x::NDArray; axis = ndims(x)) softmax.(x, axis) +@deprecate log_softmax(x::NDArray; axis = ndims(x)) log_softmax.(x, axis) diff --git a/src/ndarray.jl b/src/ndarray.jl index 274c306c7441..cb8e3eb6f813 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1075,16 +1075,21 @@ _broadcast_target(sig::Expr) = sig.args[2].args[].args[end] Generate docstring from function signature """ function _docsig(fname::Symbol, sig::Expr) - s = get(_nddoc, fname, "") - !isempty(s) && return s - if fname !== :broadcast_ + s = get(_nddoc, fname, "") + !isempty(s) && return s " $sig" else name = _broadcast_target(sig) - sig_ = Expr(:call, Symbol(name, "."), sig.args[3:end]...) 
- str = " $sig_" - @eval @doc $str $name + str = get(_nddoc, name, "") + _nddoc[name] = false # change to false, denote docstring has been set up + if isempty(str) + sig_ = Expr(:call, Symbol(name, "."), sig.args[3:end]...) + str = " $sig_" + end + if str ≠ false + @eval @doc $str $name + end "" end end @@ -1223,6 +1228,67 @@ julia> mx.expand_dims(x, 2) @_remap broadcast_(::typeof(acosh), x::NDArray) arccosh(x) @_remap broadcast_(::typeof(atanh), x::NDArray) arctanh(x) +# activation functions +_nddoc[:σ] = _nddoc[:sigmoid] = doc""" + σ.(x::NDArray) + sigmoid.(x::NDArray) + +Computes sigmoid of x element-wise. + +```math +σ(x) = \frac{1}{(1 + exp(-x))} +``` + +The storage type of `sigmoid` output is always dense. +""" +@_remap broadcast_(::typeof(σ), x::NDArray) sigmoid(x) +@_remap broadcast_(::typeof(sigmoid), x::NDArray) sigmoid(x) + +_nddoc[:relu] = doc""" + relu.(x::NDArray) + +Computes rectified linear. + +```math +\max(x, 0) +``` +""" +@_remap broadcast_(::typeof(relu), x::NDArray) relu(x) + +_nddoc[:softmax] = doc""" + softmax.(x::NDArray, [dim = ndims(x)]) + +Applies the softmax function. + +The resulting array contains elements in the range `(0, 1)` +and the elements along the given axis sum up to 1. + +```math +softmax(\mathbf{z})_j = \frac{e^{z_j}}{\sum_{k=1}^K e^{z_k}} +``` +""" +@_remap broadcast_(::typeof(softmax), x::NDArray) softmax(x; axis = -ndims(x)) +@_remap broadcast_(::typeof(softmax), x::NDArray, dim::Int) softmax(x; axis = -dim) + +_nddoc[:log_softmax] = """ + log_softmax.(x::NDArray, [dim = ndims(x)]) + +Computes the log softmax of the input. +This is equivalent to computing softmax followed by log. 
+ +julia> x +2×3 mx.NDArray{Float64,2} @ CPU0: + 1.0 2.0 0.1 + 0.1 2.0 1.0 + +julia> mx.log_softmax.(x) +2×3 mx.NDArray{Float64,2} @ CPU0: + -1.41703 -0.41703 -2.31703 + -2.31703 -0.41703 -1.41703 +""" +@_remap broadcast_(::typeof(log_softmax), x::NDArray) log_softmax(x; axis = -ndims(x)) +@_remap broadcast_(::typeof(log_softmax), x::NDArray, dim::Int) log_softmax(x; axis = -dim) + ################################################################################ # remapping to solving type unstablility ################################################################################ @@ -1383,6 +1449,12 @@ const _op_import_bl = [ # import black list; do not import these funcs "arcsinh", "arccosh", "arctanh", + + # activation + "sigmoid", + "relu", + "softmax", + "log_softmax", ] macro _import_ndarray_functions() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 6b258fe99646..58c5796eb00d 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -1024,6 +1024,73 @@ function test_hyperbolic() end end # function test_hyperbolic +function test_act_funcs() + info("NDArray::σ/sigmoid") + let + A = Float32[.1, .2, -.3, -.4] + B = @. 
1 / (1 + e^(-A)) + x = NDArray(A) + y = σ.(x) + @test copy(y) ≈ B + + z = sigmoid.(x) + @test copy(z) ≈ B + end + + info("NDArray::relu") + let + A = [1, 2, -3, -4] + B = max.(A, 0) + x = NDArray(A) + y = relu.(x) + @test copy(y) ≈ B + end + + info("NDArray::softmax::1D") + let + A = Float32[1, 2, 3, 4] + B = exp.(A) ./ sum(exp.(A)) + x = NDArray(A) + y = softmax.(x) + @test copy(y) ≈ B + end + + info("NDArray::softmax::2D") + let + A = Float32[1 2; 3 4] + B = exp.(A) ./ sum(exp.(A), 1) + x = NDArray(A) + y = softmax.(x, 1) + @test copy(y) ≈ B + + C = exp.(A) ./ sum(exp.(A), 2) + z = softmax.(x, 2) + @test copy(z) ≈ C + end + + info("NDArray::log_softmax::1D") + let + A = Float32[1, 2, 3, 4] + B = log.(exp.(A) ./ sum(exp.(A))) + x = NDArray(A) + y = log_softmax.(x) + @test copy(y) ≈ B + end + + info("NDArray::log_softmax::2D") + let + A = Float32[1 2; 3 4] + B = log.(exp.(A) ./ sum(exp.(A), 1)) + x = NDArray(A) + y = log_softmax.(x, 1) + @test copy(y) ≈ B + + C = log.(exp.(A) ./ sum(exp.(A), 2)) + z = log_softmax.(x, 2) + @test copy(z) ≈ C + end +end # function test_act_funcs + ################################################################################ # Run tests ################################################################################ @@ -1063,6 +1130,7 @@ end # function test_hyperbolic test_size() test_trigonometric() test_hyperbolic() + test_act_funcs() end end From 9d606639c882d8d2e58040a3aabc4f944615fef7 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 31 Dec 2017 00:36:21 +0800 Subject: [PATCH 605/630] ndarray: refine signature of `clip` (#391) Before: `clip(x, a_min = -4, a_max = 4)` After: `clip(x, -4, 4)` The `a_min` and `a_max` is a required but they are keyword argument. So this commit change them to positional arguments and make sure will fill them. 
--- NEWS.md | 10 ++++++++++ src/MXNet.jl | 2 ++ src/deprecated.jl | 2 ++ src/ndarray.jl | 36 ++++++++++++++++++++++++++++++++++++ src/optimizer.jl | 26 +++++++++++++------------- test/unittest/ndarray.jl | 9 ++++++++- 6 files changed, 71 insertions(+), 14 deletions(-) diff --git a/NEWS.md b/NEWS.md index 63ca201b56b2..aa08666b751f 100644 --- a/NEWS.md +++ b/NEWS.md @@ -2,6 +2,8 @@ * Following material from `mx` module got exported (#TBD): * `NDArray` + * `clip()` + * `clip!()` * `context()` * `empty()` * `expand_dims()` @@ -249,6 +251,14 @@ 99.9889 100.533 100.072 ``` +* Signature of `clip` changed, it doesn't require any keyword argument now. + (#TBD) + + Before: `clip(x, a_min = -4, a_max = 4)` + After: `clip(x, -4, 4)` + +---- + # v0.3.0 (2017.11.16) * Update `libmxnet` to diff --git a/src/MXNet.jl b/src/MXNet.jl index 8b0b8b8a0761..e4c23f299dc1 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -31,6 +31,8 @@ export SymbolicNode, # ndarray.jl export NDArray, + clip, + clip!, context, empty, expand_dims, diff --git a/src/deprecated.jl b/src/deprecated.jl index 6b24411b4125..9a24aa815148 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -54,3 +54,5 @@ end @deprecate relu(x::NDArray) relu.(x) @deprecate softmax(x::NDArray; axis = ndims(x)) softmax.(x, axis) @deprecate log_softmax(x::NDArray; axis = ndims(x)) log_softmax.(x, axis) + +@deprecate clip(x; a_min = 0, a_max = 0) clip(x, a_min, a_max) diff --git a/src/ndarray.jl b/src/ndarray.jl index cb8e3eb6f813..5583e545ae11 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1184,6 +1184,41 @@ _ndsig[:reshape] = :(reshape(arr; shape = dim, reverse = !reverse)) @_remap prod(arr::NDArray) prod(arr) @_remap prod(arr::NDArray, dims) prod(arr; axis = 0 .- dims, keepdims = true) +_nddoc[:clip] = _nddoc[:clip!] = +""" + clip(x::NDArray, min, max) + clip!(x::NDArray, min, max) + +Clips (limits) the values in `NDArray`. +Given an interval, values outside the interval are clipped to the interval edges. 
+Clipping `x` between `min` and `max` would be: + +```julia +clip(x, min_, max_) = max(min(x, max_), min_) +``` + +```jldoctest +julia> x = NDArray(1:9); + +julia> mx.clip(x, 2, 8)' +1×9 mx.NDArray{Int64,2} @ CPU0: + 2 2 3 4 5 6 7 8 8 +``` + +The storage type of clip output depends on storage types of inputs and the +`min`, `max` parameter values: + +- clip(default) = default +- clip(row_sparse, min <= 0, max >= 0) = row_sparse +- clip(csr, min <= 0, max >= 0) = csr +- clip(row_sparse, min < 0, max < 0) = default +- clip(row_sparse, min > 0, max > 0) = default +- clip(csr, min < 0, max < 0) = csr +- clip(csr, min > 0, max > 0) = csr +""" +@_remap clip(x::NDArray, min::Real, max::Real) clip(x; a_min = min, a_max = max) +@_remap clip!(x::NDArray, min::Real, max::Real) clip(x; a_min = min, a_max = max) + _nddoc[:expand_dims] = """ expand_dims(x::NDArray, dim) @@ -1416,6 +1451,7 @@ const _op_import_bl = [ # import black list; do not import these funcs "_full", # we already have `mx.fill` "_ones", # we already have `mx.ones` "_zeros", # we already have `mx.zeros` + "clip", "expand_dims", # arithmetic diff --git a/src/optimizer.jl b/src/optimizer.jl index 8d46a9e407a1..7a647332231b 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -243,29 +243,29 @@ Base class for all optimizer options. abstract type AbstractOptimizerOptions end """ - normalized_gradient(opts, state, weight, grad) + normalized_gradient(opts, state, W, ∇) -* `opts::AbstractOptimizerOptions`: options for the optimizer, should contain the field -`grad_clip` and `weight_decay`. -* `state::OptimizationState`: the current optimization state. -* `weight::NDArray`: the trainable weights. -* `grad::NDArray`: the original gradient of the weights. +Get the properly normalized gradient (re-scaled and clipped if necessary). - Get the properly normalized gradient (re-scaled and clipped if necessary). 
+* `opts::AbstractOptimizerOptions`: options for the optimizer, + should contain the field `grad_clip` and `weight_decay`. +* `state::OptimizationState`: the current optimization state. +* `W::NDArray`: the trainable weights. +* `∇::NDArray`: the original gradient of the weights. """ function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState, - weight::NDArray, grad::NDArray) - grad_scale = 1.0 / state.batch_size + W::NDArray, ∇::NDArray) + scale = 1.0 / state.batch_size + ∇ = ∇ * scale - grad = grad_scale * grad if opts.grad_clip > 0 - grad = clip(grad, a_min=-opts.grad_clip, a_max=opts.grad_clip) + ∇ = clip(∇, -opts.grad_clip, opts.grad_clip) end if opts.weight_decay > 0 - @inplace grad += opts.weight_decay * weight + @inplace ∇ += opts.weight_decay * W end - return grad + ∇ end include("optimizers/sgd.jl") diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 58c5796eb00d..df357f6c4c33 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -604,12 +604,19 @@ function test_clip() j_array, nd_array = rand_tensors(dims) clip_up = maximum(abs.(j_array)) / 2 clip_down = 0 - clipped = mx.clip(nd_array, a_min=clip_down, a_max=clip_up) + clipped = clip(nd_array, clip_down, clip_up) # make sure the original array is not modified @test copy(nd_array) ≈ j_array @test all(clip_down .<= copy(clipped) .<= clip_up) + + info("NDArray::clip!") + let + x = NDArray(1.0:20) + clip!(x, 5, 15) + @test all(5 .<= copy(x) .<= 15) + end end function test_power() From a4143e93daf550e8ef014aefcd335a63f3565694 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 1 Jan 2018 12:06:53 +0800 Subject: [PATCH 606/630] Bump :copyright: (#397) --- LICENSE.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/LICENSE.md b/LICENSE.md index a34c4a0f662e..5ecf95ac60bc 100644 --- a/LICENSE.md +++ b/LICENSE.md @@ -1,6 +1,6 @@ The MXNet.jl package is licensed under version 2.0 of the Apache License: -> Copyright (c) 2015: +> 
Copyright (c) 2015-2018: > * Chiyuan Zhang > > Apache License From ae425bfd8463cea26b043adc175962b314b519ce Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 1 Jan 2018 23:40:19 +0800 Subject: [PATCH 607/630] doc: append 'Defined in' into operator docstring (#393) e.g. ``` sum(arr::NDArray) Defined in src/operator/tensor/broadcast_reduce_op_value.cc:L85 ``` --- src/ndarray.jl | 18 +++++++++++++----- src/util.jl | 19 ++++++++++++++++++- test/unittest/util.jl | 7 +++++++ 3 files changed, 38 insertions(+), 6 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 5583e545ae11..1e6eeee81f94 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -1074,11 +1074,9 @@ _broadcast_target(sig::Expr) = sig.args[2].args[].args[end] """ Generate docstring from function signature """ -function _docsig(fname::Symbol, sig::Expr) +function _docsig(fname::Symbol, sig::Expr, opname::String) if fname !== :broadcast_ - s = get(_nddoc, fname, "") - !isempty(s) && return s - " $sig" + get(_nddoc, fname, " $sig") * "\n" * _getdocdefine(opname) else name = _broadcast_target(sig) str = get(_nddoc, name, "") @@ -1088,6 +1086,16 @@ function _docsig(fname::Symbol, sig::Expr) str = " $sig_" end if str ≠ false + # append "Defined in ..." 
+ def = _getdocdefine(opname) + str = if str isa Markdown.MD + str = Markdown.MD(copy(str.content), copy(str.meta)) + push!(str, Markdown.Paragraph(def)) + str + else + str * def + end + @eval @doc $str $name end "" @@ -1139,7 +1147,7 @@ macro _remap(sig::Expr, imp::Expr) $retexpr end - docstr = _docsig(fname, sig) + docstr = _docsig(fname, sig, opname) func_def = Expr(:function, sig, func_body) esc(quote diff --git a/src/util.jl b/src/util.jl index c729bc7cd9ae..c4f5e63244dd 100644 --- a/src/util.jl +++ b/src/util.jl @@ -92,7 +92,7 @@ function _get_cached_libmx_op_handle(name :: String) end end -function _get_libmx_op_description(name :: String, handle :: MX_OpHandle) +function _get_libmx_op_description(name::String, handle::MX_OpHandle) # get operator information (human readable) ref_real_name = Ref{char_p}(0) ref_desc = Ref{char_p}(0) @@ -163,6 +163,23 @@ function _format_signature(narg::Int, arg_names::Ref{char_pp}) return join([unsafe_string(name) for name in arg_names] , ", ") end +""" +Extract the line of `Defined in ...` + +julia> mx._getdocdefine("sgd_update") +"Defined in src/operator/optimizer_op.cc:L53" +``` +""" +function _getdocdefine(name::String) + op = _get_libmx_op_handle(name) + str = _get_libmx_op_description(name, op)[1] + lines = split(str, '\n') + for m ∈ match.(r"^Defined in .*$", lines) + m != nothing && return m.match + end + "" +end + """ libmxnet operators signature checker. 
diff --git a/test/unittest/util.jl b/test/unittest/util.jl index 823decffd442..0e6107ca0acc 100644 --- a/test/unittest/util.jl +++ b/test/unittest/util.jl @@ -5,6 +5,12 @@ using Base.Test using MXNet +function test_getdocdefine() + info("Util::_getdocdefine") + @test contains(mx._getdocdefine("sgd_update"), "Defined in") +end # function test_getdocdefine + + function test_firstarg() info("Util::_firstarg") @test mx._firstarg(:(f(x, y))) == :x @@ -22,6 +28,7 @@ end # function test_firstarg @testset "Util Test" begin test_firstarg() + test_getdocdefine() end # @testset "Util" end # module TestUtil From 930090b8b94c8158ffcbc210b36ab93d810798e5 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 2 Jan 2018 08:51:51 +0800 Subject: [PATCH 608/630] ndarray: fix 1D NDArray display (#399) --- src/ndarray.jl | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 1e6eeee81f94..78adf381f29c 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -113,10 +113,11 @@ function Base.show(io::IO, x::NDArray) end # for REPL -function Base.show(io::IO, ::MIME{Symbol("text/plain")}, x::NDArray) +function Base.show(io::IO, ::MIME{Symbol("text/plain")}, x::NDArray{T, N}) where {T, N} type_ = split(string(typeof(x)), '.', limit=2)[end] - println(io, "$(join(size(x), "×")) $(type_) @ $(context(x)):") - Base.showarray(io, try_get_shared(x, sync = :read), false, header=false) + size_ = N == 1 ? "$(length(x))-element" : join(size(x), "×") + println(io, "$size_ $type_ @ $(context(x)):") + Base.showarray(io, try_get_shared(x, sync = :read), false, header = false) end Base.unsafe_convert(::Type{MX_handle}, obj::NDArray) = From a1cef7f84a69fe7b8dc6cf6d10f32775121043e1 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 2 Jan 2018 10:46:39 +0800 Subject: [PATCH 609/630] ndarray: fix type conversion in setindex! 
(#398) Make this case work ```julia x = mx.NDArray([1, 2, 3]); x[:] = 1.1 ``` --- src/ndarray.jl | 2 +- test/unittest/ndarray.jl | 8 ++++++++ 2 files changed, 9 insertions(+), 1 deletion(-) diff --git a/src/ndarray.jl b/src/ndarray.jl index 78adf381f29c..14e07979e768 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -356,7 +356,7 @@ end function setindex!(arr::NDArray, val::Real, ::Colon) @assert arr.writable - _set_value(out=arr, src=convert(eltype(arr), val)) + _set_value(out = arr, src = dump_mx_param(val)) end function setindex!(arr::NDArray, val::Array{T}, ::Colon) where T<:Real diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index df357f6c4c33..62fa4f9188f0 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -157,6 +157,14 @@ function test_linear_idx() x[24] = 42 @test copy(x[24]) == [42] end + + info("NDArray::setindex!::type convert") + let + x = NDArray([1, 2, 3]) + @test eltype(x) == Int + x[:] = π + @test copy(x) == [3, 3, 3] + end end # function test_linear_idx function test_first() From 86ffb5d77693a279f254aa17bc344bba8abee2b9 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 4 Jan 2018 12:21:10 +0800 Subject: [PATCH 610/630] ndarray: inplace modulo operators (#389) ```julia mod_from!(x, y) mod_from!(x, 2) rmod_from!(2, x) ``` --- NEWS.md | 10 ++++++++- src/ndarray.jl | 40 +++++++++++++++++++++++++++++++--- test/unittest/ndarray.jl | 47 ++++++++++++++++++++++++++++++++++++++++ 3 files changed, 93 insertions(+), 4 deletions(-) diff --git a/NEWS.md b/NEWS.md index aa08666b751f..431d69a6057a 100644 --- a/NEWS.md +++ b/NEWS.md @@ -117,7 +117,7 @@ 4.0 ``` -* modulo operator. (#TBD) +* Modulo operator. (#TBD) ```julia x = NDArray(...) @@ -128,6 +128,14 @@ 2 .% x ``` +* Inplace modulo operator, `mod_from!` and `rmod_from!`. (#TBD) + + ```julia + mod_from!(x, y) + mod_from!(x, 2) + rmod_from!(2, x) + ``` + * `cat`, `vcat`, `hcat` is implemented. (#TBD) E.g. 
`hcat` diff --git a/src/ndarray.jl b/src/ndarray.jl index 14e07979e768..c75c2e1c366f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -749,6 +749,24 @@ function broadcast_(::typeof(/), x::NDArray{T}, y::Real) where {T<:Integer} _div_scalar(x, scalar = y) end +""" + mod_from!(x::NDArray, y::NDArray) + mod_from!(x::NDArray, y::Real) + +Elementwise modulo for `NDArray`. +Inplace updating. +""" +mod_from!(x::NDArray, y::NDArray) = _mod!(x, y) +mod_from!(x::NDArray, y::Real) = _mod_scalar!(x, y) + +""" + rmod_from!(y::Real, x::NDArray) + +Elementwise modulo for `NDArray`. +Inplace updating. +""" +rmod_from!(y::Real, x::NDArray) = _rmod_scalar!(x, y) + import Base: % """ @@ -761,8 +779,8 @@ Elementwise modulo for `NDArray`. %(x::NDArray, y::Real) = _mod_scalar(x, scalar = y) broadcast_(::typeof(%), x::NDArray, y::NDArray) = _mod(x, y) -broadcast_(::typeof(%), x::NDArray, y::Real) = _mod_scalar(x, scalar = y) -broadcast_(::typeof(%), y::Real, x::NDArray) = _rmod_scalar(x, scalar = y) +broadcast_(::typeof(%), x::NDArray, y::Real) = _mod_scalar(x, y) +broadcast_(::typeof(%), y::Real, x::NDArray) = _rmod_scalar(x, y) import Base: ^ @@ -1061,8 +1079,13 @@ function _autoimport(name::Symbol, sig::Expr) end end +_isinplace(name::Symbol) = endswith(string(name), "!") + +_writable(name::Symbol, x) = + _isinplace(name) ? :(@assert $x.writable "this NDArray isn't writable") : :() + function _outexpr(name::Symbol, x #= the first arg of `sig` =#) - if endswith(string(name), "!") # `func!` + if _isinplace(name) # `func!` Ptr, 1, :([[MX_handle(x.handle)]]), :($x) else retexpr = :(NDArray(MX_NDArrayHandle(unsafe_load(hdls_ref[], 1)))) @@ -1124,7 +1147,10 @@ macro _remap(sig::Expr, imp::Expr) # handler for `func!` which has side effect on first argument. 
T, n_output, hdls_ref, retexpr = _outexpr(fname, _firstarg(sig)) + assert_expr = _writable(fname, _firstarg(sig)) + func_body = quote + $assert_expr op_handle = _get_cached_libmx_op_handle($opname) n_output = Ref(Cint($n_output)) hdls_ref = $hdls_ref @@ -1346,6 +1372,12 @@ julia> mx.log_softmax.(x) @_remap _mod(x::NDArray, y::NDArray) _mod(x, y) @_remap _mod!(x::NDArray, y::NDArray) _mod(x, y) +@_remap _mod_scalar(x::NDArray, y::Real) _mod_scalar(x; scalar = y) +@_remap _mod_scalar!(x::NDArray, y::Real) _mod_scalar(x; scalar = y) + +@_remap _rmod_scalar(x::NDArray, y::Real) _rmod_scalar(x; scalar = y) +@_remap _rmod_scalar!(x::NDArray, y::Real) _rmod_scalar(x; scalar = y) + ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -1467,6 +1499,8 @@ const _op_import_bl = [ # import black list; do not import these funcs "_plus", "_minus", "_mod", + "_mod_scalar", + "_rmod_scalar", "dot", "max", diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 62fa4f9188f0..b52ecc722b97 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -535,6 +535,7 @@ function test_mod() @test copy(z) ≈ D end + info("NDArray::mod::scalar") let x = NDArray(A) C = A .% 2 y = x .% 2 @@ -547,6 +548,52 @@ function test_mod() y = 11 .% x @test copy(y) ≈ C end + + info("NDArray::mod_from!") + let + x = NDArray(A) + y = NDArray(B) + C = A .% B + mx.mod_from!(x, y) + @test copy(x) ≈ C + end + + let + x = NDArray(A) + y = NDArray(B) + C = B .% A + mx.mod_from!(y, x) + + @test copy(y) ≈ C + end + + info("NDArray::mod_from!::scalar") + let + x = NDArray(A) + C = A .% 2 + mx.mod_from!(x, 2) + @test copy(x) ≈ C + end + + info("NDArray::rmod_from!") + let + x = NDArray(A) + C = 11 .% A + mx.rmod_from!(11, x) + @test copy(x) ≈ C + end + + info("NDArray::mod_from!::writable") + let + x = NDArray(A) + y = 
NDArray(B) + x.writable = false + y.writable = false + @test_throws AssertionError mx.mod_from!(x, y) + @test_throws AssertionError mx.mod_from!(y, x) + @test_throws AssertionError mx.mod_from!(x, 2) + @test_throws AssertionError mx.rmod_from!(2, x) + end end # function test_mod From 30852dd2a60179fa7b43c0a551852a24f14732d6 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 4 Jan 2018 12:22:59 +0800 Subject: [PATCH 611/630] ndarray: support modulo operation in macro inplace (#390) * ndarray: inplace modulo operators ```julia mod_from!(x, y) mod_from!(x, 2) rmod_from!(2, x) ``` * ndarray: support modulo operation for macro inplace Blocker: #389 * update doc --- NEWS.md | 1 + docs/src/api/ndarray.md | 1 + src/MXNet.jl | 1 + src/ndarray.jl | 23 +++++++++++++---------- test/unittest/ndarray.jl | 9 +++++++++ 5 files changed, 25 insertions(+), 10 deletions(-) diff --git a/NEWS.md b/NEWS.md index 431d69a6057a..b6264f412761 100644 --- a/NEWS.md +++ b/NEWS.md @@ -7,6 +7,7 @@ * `context()` * `empty()` * `expand_dims()` + * `@inplace` * `σ()` * `sigmoid()` * `relu()` diff --git a/docs/src/api/ndarray.md b/docs/src/api/ndarray.md index 76fb6a39b621..5877d8257758 100644 --- a/docs/src/api/ndarray.md +++ b/docs/src/api/ndarray.md @@ -11,6 +11,7 @@ In the following example `y` can be a `Real` value or another `NDArray` | `*` | `x .* y` | Elementwise multiplication | | `/` | `x ./ y` | Elementwise division | | `^` | `x .^ y` | Elementwise power | +| `%` | `x .% y` | Elementwise modulo | ## Trigonometric Functions diff --git a/src/MXNet.jl b/src/MXNet.jl index e4c23f299dc1..bd27c715b61d 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -36,6 +36,7 @@ export NDArray, context, empty, expand_dims, + @inplace, # activation funcs σ, sigmoid, diff --git a/src/ndarray.jl b/src/ndarray.jl index c75c2e1c366f..c9cea4fe3597 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -572,18 +572,21 @@ will translate into which will do inplace adding of the contents of `b` into `a`. 
""" -macro inplace(stmt) - if stmt.head == :+= || stmt.head == :.+= - Expr(:call, :add_to!, esc(stmt.args[1]), esc(stmt.args[2])) - elseif stmt.head == :-= || stmt.head == :.-= - Expr(:call, :sub_from!, esc(stmt.args[1]), esc(stmt.args[2])) - elseif stmt.head == :.*= - Expr(:call, :mul_to!, esc(stmt.args[1]), esc(stmt.args[2])) - elseif stmt.head == :./= - Expr(:call, :div_from!, esc(stmt.args[1]), esc(stmt.args[2])) +macro inplace(ex) + f = if ex.head == :+= || ex.head == :.+= + :add_to! + elseif ex.head == :-= || ex.head == :.-= + :sub_from! + elseif ex.head == :.*= + :mul_to! + elseif ex.head == :./= + :div_from! + elseif ex.head == :.%= + :mod_from! else - error("unsupported inplace translation for $stmt") + error("unsupported inplace translation for $ex") end + Expr(:call, f, esc(ex.args[1]), esc(ex.args[2])) end """ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index b52ecc722b97..df7238dc73a4 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -594,6 +594,15 @@ function test_mod() @test_throws AssertionError mx.mod_from!(x, 2) @test_throws AssertionError mx.rmod_from!(2, x) end + + info("NDArray::mod::inplace") + let + x = NDArray(A) + y = NDArray(B) + C = A .% B + @inplace x .%= y + @test copy(x) ≈ C + end end # function test_mod From 0ef59668f695c777ae094fdf437cf1b9165af3a0 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 4 Jan 2018 12:38:10 +0800 Subject: [PATCH 612/630] ndarray: add Base.ones(::NDArray) and Base.zeros (#363) For creating NDArray with same type and dims --- NEWS.md | 4 ++++ src/ndarray.jl | 38 +++++++++++++++----------------------- test/unittest/ndarray.jl | 22 ++++++++++++++++++++++ 3 files changed, 41 insertions(+), 23 deletions(-) diff --git a/NEWS.md b/NEWS.md index b6264f412761..f49184dfdda7 100644 --- a/NEWS.md +++ b/NEWS.md @@ -118,6 +118,10 @@ 4.0 ``` +* `Base.ones(x::NDArray)` for creating an one-ed `NDArray`. (#TBD) + +* `Base.zeros(x::NDArray)` for creating a zero-ed `NDArray`. 
(#TBD) + * Modulo operator. (#TBD) ```julia diff --git a/src/ndarray.jl b/src/ndarray.jl index c9cea4fe3597..94f21f00e943 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -172,8 +172,9 @@ Note that the returned `NDArray` is uninitialized. Base.similar(x::NDArray{T}) where {T} = empty(T, size(x), context(x)) """ - zeros(DType, dims[, ctx::Context = cpu()]) - zeros(DType, dims...) + zeros([DType], dims, [ctx::Context = cpu()]) + zeros([DType], dims...) + zeros(x::NDArray) Create zero-ed `NDArray` with specific shape and type. """ @@ -185,19 +186,17 @@ end zeros(::Type{T}, dims::Int...) where {T<:DType} = zeros(T, dims) -""" - zeros(dims[, ctx::Context = cpu()]) - zeros(dims...) - -Create zero-ed `NDArray` with specific shape. -""" -zeros(dims::NTuple{N, Int}, ctx::Context = cpu()) where N = +zeros(dims::NTuple{N,Int}, ctx::Context = cpu()) where N = zeros(MX_float, dims, ctx) zeros(dims::Int...) = zeros(dims) +zeros(x::NDArray)::typeof(x) = zeros_like(x) +Base.zeros(x::NDArray)::typeof(x) = zeros_like(x) + """ - ones(DType, dims::Tuple[, ctx::Context = cpu()]) - ones(DType, dim1, dim2...) + ones([DType], dims, [ctx::Context = cpu()]) + ones([DType], dims...) + ones(x::NDArray) Create an `NDArray` with specific shape & type, and initialize with 1. """ @@ -209,20 +208,13 @@ end ones(::Type{T}, dims::Int...) where T<:DType = ones(T, dims) -""" - ones(dims::Tuple[, ctx::Context = cpu()]) - ones(dim1, dim2, ...) - -Create an `NDArray` with specific shape and initialize with 1. -""" -function ones(dims::NTuple{N,Int}, ctx::Context = cpu()) where N - arr = empty(dims, ctx) - arr[:] = 1 - arr -end - +ones(dims::NTuple{N,Int}, ctx::Context = cpu()) where N = + ones(MX_float, dims, ctx) ones(dims::Int...) 
= ones(dims) +ones(x::NDArray)::typeof(x) = ones_like(x) +Base.ones(x::NDArray)::typeof(x) = ones_like(x) + import Base: size, length, ndims, eltype """ diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index df7238dc73a4..ac80fc519d13 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -29,6 +29,27 @@ function test_constructor() end # function test_constructor +function test_ones_zeros_like() + info("NDArray::Base.zeros") + let x = mx.rand(1, 10, (1, 3, 2, 4)) + y = zeros(x) + @test sum(copy(y)) == 0 + + y = mx.zeros(x) + @test sum(copy(y)) == 0 + end + + info("NDArray::Base.ones") + let x = mx.rand(1, 10, (1, 3, 2, 4)) + y = ones(x) + @test sum(copy(y)) == 1 * 3 * 2 * 4 + + y = mx.ones(x) + @test sum(copy(y)) == 1 * 3 * 2 * 4 + end +end # function test_ones_zeros_like + + function test_copy() dims = rand_dims() tensor = rand(mx.MX_float, dims) @@ -1167,6 +1188,7 @@ end # function test_act_funcs ################################################################################ @testset "NDArray Test" begin test_constructor() + test_ones_zeros_like() test_assign() test_copy() test_slice() From 49399fc9d351ddcb1e08e910b0b39d67d314d714 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 7 Jan 2018 14:29:11 +0800 Subject: [PATCH 613/630] ndarray: broadcasting along dimension on arith operators (#401) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * `+` * `-` * `*` * `/` * `%` * `^` ```julia julia> x = NDArray([1 2 3; 4 5 6]) 2×3 mx.NDArray{Int64,2} @ CPU0: 1 2 3 4 5 6 julia> y = NDArray([1; 10]) 2-element mx.NDArray{Int64,1} @ CPU0: 1 10 julia> x .+ y 2×3 mx.NDArray{Int64,2} @ CPU0: 2 3 4 14 15 16 ``` --- NEWS.md | 28 +++++++++++ src/deprecated.jl | 40 +++++++++++++++ src/ndarray.jl | 72 ++++++++++++++++++++++---- test/unittest/ndarray.jl | 106 ++++++++++++++++++++++++++++++++++++++- 4 files changed, 234 insertions(+), 12 deletions(-) diff --git a/NEWS.md b/NEWS.md index 
f49184dfdda7..ee00a6260396 100644 --- a/NEWS.md +++ b/NEWS.md @@ -206,6 +206,34 @@ ### `NDArray` +* Broadcasting along dimension supported on following operators (#TBD): + + * `+` + * `-` + * `*` + * `/` + * `%` + * `^` + + ```julia + julia> x = NDArray([1 2 3; + 4 5 6]) + 2×3 mx.NDArray{Int64,2} @ CPU0: + 1 2 3 + 4 5 6 + + julia> y = NDArray([1; + 10]) + 2-element mx.NDArray{Int64,1} @ CPU0: + 1 + 10 + + julia> x .+ y + 2×3 mx.NDArray{Int64,2} @ CPU0: + 2 3 4 + 14 15 16 + ``` + * Please use dot-call on following trigonometric functions. Also, the `arc*` has been renamed to keep consistent with `Base`. (#TBD) diff --git a/src/deprecated.jl b/src/deprecated.jl index 9a24aa815148..aa12e264f729 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -56,3 +56,43 @@ end @deprecate log_softmax(x::NDArray; axis = ndims(x)) log_softmax.(x, axis) @deprecate clip(x; a_min = 0, a_max = 0) clip(x, a_min, a_max) + +function broadcast_plus(x::NDArray, y::NDArray) + warn("broadcast_plus(x, y) is deprecated, use x .+ y instead.") + x .+ y +end + +function broadcast_add(x::NDArray, y::NDArray) + warn("broadcast_add(x, y) is deprecated, use x .+ y instead.") + x .+ y +end + +function broadcast_sub(x::NDArray, y::NDArray) + warn("broadcast_sub(x, y) is deprecated, use x .- y instead.") + x .- y +end + +function broadcast_minus(x::NDArray, y::NDArray) + warn("broadcast_minus(x, y) is deprecated, use x .- y instead.") + x .- y +end + +function broadcast_mul(x::NDArray, y::NDArray) + warn("broadcast_mul(x, y) is deprecated, use x .* y instead.") + x .* y +end + +function broadcast_div(x::NDArray, y::NDArray) + warn("broadcast_div(x, y) is deprecated, use x ./ y instead.") + x ./ y +end + +function broadcast_mod(x::NDArray, y::NDArray) + warn("broadcast_mod(x, y) is deprecated, use x .% y instead.") + x .% y +end + +function broadcast_power(x::NDArray, y::NDArray) + warn("broadcast_power(x, y) is deprecated, use x.^y instead.") + x.^y +end diff --git a/src/ndarray.jl b/src/ndarray.jl 
index 94f21f00e943..9aab4ebcaf9a 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -613,8 +613,12 @@ added together. Note at least the first or second argument needs to be an +(x::NDArray, y::Real) = _plus_scalar(x, scalar = y) +(y::Real, x::NDArray) = _plus_scalar(x, scalar = y) -broadcast_(::typeof(+), x::NDArray, y::NDArrayOrReal) = x + y -broadcast_(::typeof(+), x::Real, y::NDArray) = x + y +broadcast_(::typeof(+), x::NDArray, y::Real) = x + y +broadcast_(::typeof(+), x::Real, y::NDArray) = x + y + +broadcast_(::typeof(+), x::NDArray{T,N}, y::NDArray{T,N}) where {T,N} = x + y +broadcast_(::typeof(+), x::NDArray{T,N}, y::NDArray{T,M}) where {T,N,M} = + _broadcast_add(x, y) """ sub_from!(dst::NDArray, args::NDArrayOrReal...) @@ -646,8 +650,12 @@ Or create the negative of `x`. -(x::NDArray, y::Real) = _minus_scalar(x, scalar = y) -(y::Real, x::NDArray) = _rminus_scalar(x, scalar = y) -broadcast_(::typeof(-), x::NDArray, y::NDArrayOrReal) = x - y -broadcast_(::typeof(-), x::Real, y::NDArray) = x - y +broadcast_(::typeof(-), x::NDArray, y::Real) = x - y +broadcast_(::typeof(-), x::Real, y::NDArray) = x - y + +broadcast_(::typeof(-), x::NDArray{T,N}, y::NDArray{T,N}) where {T,N} = x - y +broadcast_(::typeof(-), x::NDArray{T,N}, y::NDArray{T,M}) where {T,N,M} = + _broadcast_minus(x, y) """ mul_to!(dst::NDArray, arg::NDArrayOrReal) @@ -675,9 +683,13 @@ Elementwise multiplication for `NDArray`. 
*(x::NDArray, y::Real) = _mul_scalar(x, scalar = y) *(y::Real, x::NDArray) = _mul_scalar(x, scalar = y) -broadcast_(::typeof(*), x::NDArray, y::Real) = x * y -broadcast_(::typeof(*), y::Real, x::NDArray) = x * y -broadcast_(::typeof(*), x::NDArray, y::NDArray) = _mul(x, y) +broadcast_(::typeof(*), x::NDArray, y::Real) = x * y +broadcast_(::typeof(*), y::Real, x::NDArray) = x * y + +broadcast_(::typeof(*), x::NDArray{T,N}, y::NDArray{T,N}) where {T,N} = + _mul(x, y) +broadcast_(::typeof(*), x::NDArray{T,N}, y::NDArray{T,M}) where {T,N,M} = + _broadcast_mul(x, y) """ *(A::NDArray, B::NDArray) @@ -735,10 +747,14 @@ of the same shape. """ /(x::NDArray, y::Real) = _div_scalar(x, scalar = y) -broadcast_(::typeof(/), x::NDArray, y::NDArray) = _div(x, y) broadcast_(::typeof(/), x::NDArray, y::Real) = _div_scalar(x, scalar = y) broadcast_(::typeof(/), y::Real, x::NDArray) = _rdiv_scalar(x, scalar = y) +broadcast_(::typeof(/), x::NDArray{T,N}, y::NDArray{T,N}) where {T,N} = + _div(x, y) +broadcast_(::typeof(/), x::NDArray{T,N}, y::NDArray{T,M}) where {T,N,M} = + _broadcast_div(x, y) + function broadcast_(::typeof(/), x::NDArray{T}, y::Real) where {T<:Integer} @assert(round(T, y) != zero(T), "Integer divided by zero") _div_scalar(x, scalar = y) @@ -773,15 +789,18 @@ Elementwise modulo for `NDArray`. 
""" %(x::NDArray, y::Real) = _mod_scalar(x, scalar = y) -broadcast_(::typeof(%), x::NDArray, y::NDArray) = _mod(x, y) broadcast_(::typeof(%), x::NDArray, y::Real) = _mod_scalar(x, y) broadcast_(::typeof(%), y::Real, x::NDArray) = _rmod_scalar(x, y) +broadcast_(::typeof(%), x::NDArray{T,N}, y::NDArray{T,N}) where {T,N} = + _mod(x, y) +broadcast_(::typeof(%), x::NDArray{T,N}, y::NDArray{T,M}) where {T,N,M} = + _broadcast_mod(x, y) + import Base: ^ # document of `.^` is merged into SymbolicNode's -broadcast_(::typeof(^), x::NDArray, y::NDArray) = _power(x, y) broadcast_(::typeof(^), x::NDArray, s::Real) = _power_scalar(x, scalar = s) broadcast_(::typeof(^), s::Real, x::NDArray) = _rpower_scalar(x, scalar = s) @@ -789,6 +808,11 @@ broadcast_(::typeof(^), ::Irrational{:e}, x::NDArray) = exp(x) broadcast_(::typeof(^), x::NDArray, s::Irrational) = _power_scalar(x, scalar = s) broadcast_(::typeof(^), s::Irrational, x::NDArray) = _rpower_scalar(x, scalar = s) +broadcast_(::typeof(^), x::NDArray{T,N}, y::NDArray{T,N}) where {T,N} = + _power(x, y) +broadcast_(::typeof(^), x::NDArray{T,N}, y::NDArray{T,M}) where {T,N,M} = + _broadcast_power(x, y) + """ fill!(arr::NDArray, x) @@ -1373,6 +1397,24 @@ julia> mx.log_softmax.(x) @_remap _rmod_scalar(x::NDArray, y::Real) _rmod_scalar(x; scalar = y) @_remap _rmod_scalar!(x::NDArray, y::Real) _rmod_scalar(x; scalar = y) +@_remap _broadcast_add(x::NDArray, y::NDArray) broadcast_add(x, y) +@_remap _broadcast_add!(x::NDArray, y::NDArray) broadcast_add(x, y) + +@_remap _broadcast_minus(x::NDArray, y::NDArray) broadcast_minus(x, y) +@_remap _broadcast_minus!(x::NDArray, y::NDArray) broadcast_minus(x, y) + +@_remap _broadcast_mul(x::NDArray, y::NDArray) broadcast_mul(x, y) +@_remap _broadcast_mul!(x::NDArray, y::NDArray) broadcast_mul(x, y) + +@_remap _broadcast_div(x::NDArray, y::NDArray) broadcast_div(x, y) +@_remap _broadcast_div!(x::NDArray, y::NDArray) broadcast_div(x, y) + +@_remap _broadcast_mod(x::NDArray, y::NDArray) 
broadcast_mod(x, y) +@_remap _broadcast_mod!(x::NDArray, y::NDArray) broadcast_mod(x, y) + +@_remap _broadcast_power(x::NDArray, y::NDArray) broadcast_power(x, y) +@_remap _broadcast_power!(x::NDArray, y::NDArray) broadcast_power(x, y) + ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -1529,6 +1571,16 @@ const _op_import_bl = [ # import black list; do not import these funcs "relu", "softmax", "log_softmax", + + # broadcast + "broadcast_add", + "broadcast_plus", + "broadcast_minus", + "broadcast_sub", + "broadcast_mul", + "broadcast_div", + "broadcast_mod", + "broadcast_power", ] macro _import_ndarray_functions() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index ac80fc519d13..f18b9d20f123 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -8,8 +8,8 @@ using ..Main: rand_dims ################################################################################ # Test Implementations ################################################################################ -rand_tensors(dims::NTuple{N, Int}) where {N} = rand_tensors(mx.MX_float, dims) -function rand_tensors(::Type{T}, dims::NTuple{N, Int}) where {N, T} +rand_tensors(dims::NTuple{N,Int}) where {N} = rand_tensors(mx.MX_float, dims) +function rand_tensors(::Type{T}, dims::NTuple{N,Int}) where {N,T} tensor = rand(T, dims) array = copy(tensor, mx.cpu()) return (tensor, array) @@ -330,6 +330,23 @@ function test_plus() y = x .+ 2.9 @test copy(y) == [3, 4, 5] end + + info("NDArray::broadcast_add") + let + A = [1 2 3; + 4 5 6] + B = [1, + 2] + x = NDArray(A) + y = NDArray(B) + + z = x .+ y + @test copy(z) == A .+ B + + # TODO + # @inplace x .+= y + # @test copy(x) == A .+ B + end end function test_minus() @@ -386,6 +403,23 @@ function test_minus() let x = mx.NDArray([1, 2, 3]) @test copy(x .- π) ≈ [-2, -1, 0] end + 
+ info("NDArray::broadcast_minus") + let + A = [1 2 3; + 4 5 6] + B = [1, + 2] + x = NDArray(A) + y = NDArray(B) + + z = x .- y + @test copy(z) == A .- B + + # TODO + # @inplace x .-= y + # @test copy(x) == A .- B + end end function test_mul() @@ -445,6 +479,23 @@ function test_mul() @test eltype(x) == Int @test copy(y) == [3, 6, 9] end + + info("NDArray::broadcast_mul") + let + A = [1 2 3; + 4 5 6] + B = [1, + 2] + x = NDArray(A) + y = NDArray(B) + + z = x .* y + @test copy(z) == A .* B + + # TODO + # @inplace x .*= y + # @test copy(x) == A .* B + end end function test_div() @@ -499,6 +550,23 @@ function test_div() @test_throws AssertionError x ./ 0.5 end + + info("NDArray::broadcast_div") + let + A = Float32[1 2 3; + 4 5 6] + B = Float32[1, + 2] + x = NDArray(A) + y = NDArray(B) + + z = x ./ y + @test copy(z) == A ./ B + + # TODO + # @inplace x ./= y + # @test copy(x) == A ./ B + end end @@ -624,6 +692,23 @@ function test_mod() @inplace x .%= y @test copy(x) ≈ C end + + info("NDArray::broadcast_mod") + let + A = [1 2 3; + 4 5 6] + B = [1, + 2] + x = NDArray(A) + y = NDArray(B) + + z = x .% y + @test copy(z) == A .% B + + # TODO + # @inplace x .%= y + # @test copy(x) == A .% B + end end # function test_mod @@ -788,6 +873,23 @@ function test_power() end # TODO: Float64: wait for https://github.com/apache/incubator-mxnet/pull/8012 + + info("NDArray::broadcast_power") + let + A = [1 2 3; + 4 5 6] + B = [1, + 2] + x = NDArray(A) + y = NDArray(B) + + z = x.^y + @test copy(z) == A.^B + + # TODO + # @inplace x .^= y + # @test copy(x) == A.^B + end end # function test_power function test_sqrt() From e79ce7190d0faa2fbef5253f1b1cc6cd3ba6014a Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 10 Jan 2018 21:28:46 +0800 Subject: [PATCH 614/630] ndarray: broadcast comparison operators (#402) --- NEWS.md | 10 ++++++++- src/deprecated.jl | 30 ++++++++++++++++++++++++++ src/ndarray.jl | 46 ++++++++++++++++++++++++++++++++++++++++ test/unittest/ndarray.jl | 44 
++++++++++++++++++++++++++++++++++++-- 4 files changed, 127 insertions(+), 3 deletions(-) diff --git a/NEWS.md b/NEWS.md index ee00a6260396..12fec5fe2152 100644 --- a/NEWS.md +++ b/NEWS.md @@ -206,7 +206,9 @@ ### `NDArray` -* Broadcasting along dimension supported on following operators (#TBD): +* Broadcasting along dimension supported on following operators, + and the original `mx.broadcast_*` APIs are deprecated + (#401) (#402): * `+` * `-` @@ -214,6 +216,12 @@ * `/` * `%` * `^` + * `==` + * `!=` + * `>` + * `>=` + * `<` + * `<=` ```julia julia> x = NDArray([1 2 3; diff --git a/src/deprecated.jl b/src/deprecated.jl index aa12e264f729..a0f722805168 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -96,3 +96,33 @@ function broadcast_power(x::NDArray, y::NDArray) warn("broadcast_power(x, y) is deprecated, use x.^y instead.") x.^y end + +function broadcast_equal(x::NDArray, y::NDArray) + warn("broadcast_equal(x, y) is deprecated, use x .== y instead.") + x .== y +end + +function broadcast_not_equal(x::NDArray, y::NDArray) + warn("broadcast_not_equal(x, y) is deprecated, use x .== y instead.") + x .!= y +end + +function broadcast_greater(x::NDArray, y::NDArray) + warn("broadcast_greater(x, y) is deprecated, use x .== y instead.") + x .> y +end + +function broadcast_greater_equal(x::NDArray, y::NDArray) + warn("broadcast_greater_equal(x, y) is deprecated, use x .== y instead.") + x .>= y +end + +function broadcast_lesser(x::NDArray, y::NDArray) + warn("broadcast_lesser(x, y) is deprecated, use x .== y instead.") + x .< y +end + +function broadcast_lesser_equal(x::NDArray, y::NDArray) + warn("broadcast_lesser_equal(x, y) is deprecated, use x .== y instead.") + x .<= y +end diff --git a/src/ndarray.jl b/src/ndarray.jl index 9aab4ebcaf9a..8fa4abc6482f 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -813,6 +813,28 @@ broadcast_(::typeof(^), x::NDArray{T,N}, y::NDArray{T,N}) where {T,N} = broadcast_(::typeof(^), x::NDArray{T,N}, y::NDArray{T,M}) where {T,N,M} = 
_broadcast_power(x, y) + +############################################################################### +# comparison +############################################################################### +broadcast_(::typeof(==), x::NDArray{T}, y::NDArray{T}) where {T} = + _broadcast_equal(x, y) + +broadcast_(::typeof(!=), x::NDArray{T}, y::NDArray{T}) where {T} = + _broadcast_not_equal(x, y) + +broadcast_(::typeof(>), x::NDArray{T}, y::NDArray{T}) where {T} = + _broadcast_greater(x, y) + +broadcast_(::typeof(>=), x::NDArray{T}, y::NDArray{T}) where {T} = + _broadcast_greater_equal(x, y) + +broadcast_(::typeof(<), x::NDArray{T}, y::NDArray{T}) where {T} = + _broadcast_lesser(x, y) + +broadcast_(::typeof(<=), x::NDArray{T}, y::NDArray{T}) where {T} = + _broadcast_lesser_equal(x, y) + """ fill!(arr::NDArray, x) @@ -1415,6 +1437,24 @@ julia> mx.log_softmax.(x) @_remap _broadcast_power(x::NDArray, y::NDArray) broadcast_power(x, y) @_remap _broadcast_power!(x::NDArray, y::NDArray) broadcast_power(x, y) +@_remap _broadcast_equal(x::NDArray, y::NDArray) broadcast_equal(x, y) +@_remap _broadcast_equal!(x::NDArray, y::NDArray) broadcast_equal(x, y) + +@_remap _broadcast_not_equal(x::NDArray, y::NDArray) broadcast_not_equal(x, y) +@_remap _broadcast_not_equal!(x::NDArray, y::NDArray) broadcast_not_equal(x, y) + +@_remap _broadcast_greater(x::NDArray, y::NDArray) broadcast_greater(x, y) +@_remap _broadcast_greater!(x::NDArray, y::NDArray) broadcast_greater(x, y) + +@_remap _broadcast_greater_equal(x::NDArray, y::NDArray) broadcast_greater_equal(x, y) +@_remap _broadcast_greater_equal!(x::NDArray, y::NDArray) broadcast_greater_equal(x, y) + +@_remap _broadcast_lesser(x::NDArray, y::NDArray) broadcast_lesser(x, y) +@_remap _broadcast_lesser!(x::NDArray, y::NDArray) broadcast_lesser(x, y) + +@_remap _broadcast_lesser_equal(x::NDArray, y::NDArray) broadcast_lesser_equal(x, y) +@_remap _broadcast_lesser_equal!(x::NDArray, y::NDArray) broadcast_lesser_equal(x, y) + 
################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -1581,6 +1621,12 @@ const _op_import_bl = [ # import black list; do not import these funcs "broadcast_div", "broadcast_mod", "broadcast_power", + "broadcast_equal", + "broadcast_not_equal", + "broadcast_greater", + "broadcast_greater_equal", + "broadcast_lesser", + "broadcast_lesser_equal", ] macro _import_ndarray_functions() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index f18b9d20f123..b96e524dea93 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -31,7 +31,7 @@ end # function test_constructor function test_ones_zeros_like() info("NDArray::Base.zeros") - let x = mx.rand(1, 10, (1, 3, 2, 4)) + let x = mx.rand(1, 3, 2, 4, low = 1, high = 10) y = zeros(x) @test sum(copy(y)) == 0 @@ -40,7 +40,7 @@ function test_ones_zeros_like() end info("NDArray::Base.ones") - let x = mx.rand(1, 10, (1, 3, 2, 4)) + let x = mx.rand(1, 3, 2, 4, low = 1, high = 10) y = ones(x) @test sum(copy(y)) == 1 * 3 * 2 * 4 @@ -1285,6 +1285,45 @@ function test_act_funcs() end end # function test_act_funcs +macro check_equal(op) + quote + A = [1 2 3 + 4 5 6] + B = [1, + 6] + x = NDArray(A) + y = NDArray(B) + a = broadcast($op, x, y) + @test copy(a) == broadcast($op, A, B) + + C = [3 2 1 + 6 5 4] + z = NDArray(C) + b = broadcast($op, x, z) + @test copy(b) == broadcast($op, A, C) + end +end + +function test_equal() + info("NDArray::broadcast_equal") + @check_equal == + + info("NDArray::broadcast_not_equal") + @check_equal != + + info("NDArray::broadcast_greater") + @check_equal > + + info("NDArray::broadcast_greater_equal") + @check_equal >= + + info("NDArray::broadcast_lesser") + @check_equal < + + info("NDArray::broadcast_lesser_equal") + @check_equal <= +end # function test_equal + 
################################################################################ # Run tests ################################################################################ @@ -1326,6 +1365,7 @@ end # function test_act_funcs test_trigonometric() test_hyperbolic() test_act_funcs() + test_equal() end end From 2ab0584725468d135dc5ecc40a885ad44ea83268 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 13 Jan 2018 16:25:38 +0800 Subject: [PATCH 615/630] ndarray: copy!(NDArray, AbstractArray) (#405) ```julia julia> x = mx.zeros(3) 3-element mx.NDArray{Float32,1} @ CPU0: 0.0 0.0 0.0 julia> copy!(x, 3:5) 3-element mx.NDArray{Float32,1} @ CPU0: 3.0 4.0 5.0 ``` --- NEWS.md | 16 ++++++++++++++++ src/ndarray.jl | 3 ++- test/unittest/ndarray.jl | 9 +++++++++ 3 files changed, 27 insertions(+), 1 deletion(-) diff --git a/NEWS.md b/NEWS.md index 12fec5fe2152..401ee450380e 100644 --- a/NEWS.md +++ b/NEWS.md @@ -118,6 +118,22 @@ 4.0 ``` +* `copy!(NDArray, AbstractArray)` is implemented now. (#TBD) + + ```julia + julia> x = mx.zeros(3) + 3-element mx.NDArray{Float32,1} @ CPU0: + 0.0 + 0.0 + 0.0 + + julia> copy!(x, 3:5) + 3-element mx.NDArray{Float32,1} @ CPU0: + 3.0 + 4.0 + 5.0 + ``` + * `Base.ones(x::NDArray)` for creating an one-ed `NDArray`. (#TBD) * `Base.zeros(x::NDArray)` for creating a zero-ed `NDArray`. (#TBD) diff --git a/src/ndarray.jl b/src/ndarray.jl index 8fa4abc6482f..9532e2b7f70b 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -430,7 +430,7 @@ end import Base: copy!, copy, convert, deepcopy """ - copy!(dst :: Union{NDArray, Array}, src :: Union{NDArray, Array}) + copy!(dst::Union{NDArray, Array}, src::Union{NDArray, Array}) Copy contents of `src` into `dst`. 
""" @@ -453,6 +453,7 @@ function copy!(dst::Array{T}, src::NDArray{T}) where T<:DType end copy!(dst::Array{<:Real}, src::NDArray) = copy!(dst, copy(src)) +copy!(dst::NDArray, src::AbstractArray) = copy!(dst, collect(src)) function copy!(dst::NDArray{T}, src::Array{<:Real}) where {T} @assert dst.writable diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index b96e524dea93..1b656902480c 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -76,6 +76,15 @@ function test_copy() @test eltype(x) == Float64 @test copy(x) ≈ [1., 2, 3, 4] end + + info("NDArray::copy!::AbstractArray") + let + x = mx.zeros(4) + copy!(x, 1:4) + + @test eltype(x) == Float32 + @test copy(x) == [1, 2, 3, 4] + end end function test_deepcopy() From 1c990bc9dc387dee5f92e802d222b5af7a33f47e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 17 Jan 2018 14:45:22 +0800 Subject: [PATCH 616/630] ndarray: new constructor NDArray(Type, AbstractArray) (#404) ```julia julia> NDArray([1, 2, 3]) 3-element mx.NDArray{Int64,1} @ CPU0: 1 2 3 julia> NDArray(Float32, [1, 2, 3]) 3-element mx.NDArray{Float32,1} @ CPU0: 1.0 2.0 3.0 ``` --- NEWS.md | 17 +++++++++++++++++ src/ndarray.jl | 2 ++ test/unittest/ndarray.jl | 12 ++++++++++++ 3 files changed, 31 insertions(+) diff --git a/NEWS.md b/NEWS.md index 401ee450380e..11e853c2149e 100644 --- a/NEWS.md +++ b/NEWS.md @@ -84,6 +84,23 @@ ### `NDArray` +* A handy constructor: `NDArray(Type, AbstractArray)` is added. (#TBD) + + E.g. + ```julia + julia> NDArray([1, 2, 3]) + 3-element mx.NDArray{Int64,1} @ CPU0: + 1 + 2 + 3 + + julia> NDArray(Float32, [1, 2, 3]) + 3-element mx.NDArray{Float32,1} @ CPU0: + 1.0 + 2.0 + 3.0 + ``` + * A port of Python's `autograd` for `NDArray` (#274) * `size(x, dims...)` is supported now. 
(#TBD) diff --git a/src/ndarray.jl b/src/ndarray.jl index 9532e2b7f70b..8130679b2ae3 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -98,6 +98,8 @@ end NDArray(x::AbstractArray{T}) where {T<:DType} = copy(collect(x), cpu()) NDArray(x::Array{T}) where {T<:DType} = copy(x, cpu()) +NDArray(::Type{T}, x::AbstractArray) where {T<:DType} = + copy(convert(AbstractArray{T}, x), cpu()) NDArray(handle, writable = true) = NDArray{eltype(handle), ndims(handle)}(handle, writable) diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 1b656902480c..26fb7327a21d 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -26,6 +26,18 @@ function test_constructor() check_absarray(1:10) check_absarray(1.0:10) + + info("NDArray::NDArray(Type, AbstractArray)") + let + x = mx.NDArray(Float32, [1, 2, 3]) + @test eltype(x) == Float32 + @test copy(x) == [1, 2, 3] + end + let + x = mx.NDArray(Float32, [1.1, 2, 3]) + @test eltype(x) == Float32 + @test copy(x) ≈ [1.1, 2, 3] + end end # function test_constructor From 0fba766d7c6ba44f3d3f3beeeddfd5c3087b5f23 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Fri, 19 Jan 2018 09:13:52 +0800 Subject: [PATCH 617/630] ndarray: broadcast_min/max (#403) --- NEWS.md | 4 +++- src/broadcast.jl | 3 ++- src/deprecated.jl | 10 ++++++++++ src/ndarray.jl | 23 ++++++++++++++++++++++- test/unittest/ndarray.jl | 26 ++++++++++++++++++++++++++ 5 files changed, 63 insertions(+), 3 deletions(-) diff --git a/NEWS.md b/NEWS.md index 11e853c2149e..f8d1f1073456 100644 --- a/NEWS.md +++ b/NEWS.md @@ -241,7 +241,7 @@ * Broadcasting along dimension supported on following operators, and the original `mx.broadcast_*` APIs are deprecated - (#401) (#402): + (#401) (#402) (#403): * `+` * `-` @@ -255,6 +255,8 @@ * `>=` * `<` * `<=` + * `max` + * `min` ```julia julia> x = NDArray([1 2 3; diff --git a/src/broadcast.jl b/src/broadcast.jl index 5d15adf385cc..9686db5d6412 100644 --- a/src/broadcast.jl +++ b/src/broadcast.jl @@ -2,7 +2,8 @@ using 
TakingBroadcastSeriously: Broadcasted, unwrap for f in :[%, tan, asin, acos, atan, - sinh, cosh, tanh, asinh, acosh, atanh].args + sinh, cosh, tanh, asinh, acosh, atanh, + min, max].args # copy from TakingBroadcastSeriously @eval Base.$f(a::Broadcasted...) = Broadcasted(broadcast_($f, unwrap.(a)...)) @eval Base.$f(a::Broadcasted, b) = Broadcasted(broadcast_($f, unwrap(a), b)) diff --git a/src/deprecated.jl b/src/deprecated.jl index a0f722805168..b722faec6c70 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -126,3 +126,13 @@ function broadcast_lesser_equal(x::NDArray, y::NDArray) warn("broadcast_lesser_equal(x, y) is deprecated, use x .== y instead.") x .<= y end + +function broadcast_maximum(x::NDArray, y::NDArray) + warn("broadcast_maximum(x, y) is deprecated, use max.(x, y) instead.") + max.(x, y) +end + +function broadcast_minimum(x::NDArray, y::NDArray) + warn("broadcast_minimum(x, y) is deprecated, use min.(x, y) instead.") + min.(x, y) +end diff --git a/src/ndarray.jl b/src/ndarray.jl index 8130679b2ae3..3bfd7fccc8d2 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -816,10 +816,10 @@ broadcast_(::typeof(^), x::NDArray{T,N}, y::NDArray{T,N}) where {T,N} = broadcast_(::typeof(^), x::NDArray{T,N}, y::NDArray{T,M}) where {T,N,M} = _broadcast_power(x, y) - ############################################################################### # comparison ############################################################################### + broadcast_(::typeof(==), x::NDArray{T}, y::NDArray{T}) where {T} = _broadcast_equal(x, y) @@ -838,6 +838,19 @@ broadcast_(::typeof(<), x::NDArray{T}, y::NDArray{T}) where {T} = broadcast_(::typeof(<=), x::NDArray{T}, y::NDArray{T}) where {T} = _broadcast_lesser_equal(x, y) + +############################################################################### +# min/max +############################################################################### + +import Base: min, max + +broadcast_(::typeof(max), x::NDArray{T}, y::NDArray{T}) 
where {T} = + _broadcast_maximum(x, y) + +broadcast_(::typeof(min), x::NDArray{T}, y::NDArray{T}) where {T} = + _broadcast_minimum(x, y) + """ fill!(arr::NDArray, x) @@ -1458,6 +1471,12 @@ julia> mx.log_softmax.(x) @_remap _broadcast_lesser_equal(x::NDArray, y::NDArray) broadcast_lesser_equal(x, y) @_remap _broadcast_lesser_equal!(x::NDArray, y::NDArray) broadcast_lesser_equal(x, y) +@_remap _broadcast_maximum(x::NDArray, y::NDArray) broadcast_maximum(x, y) +@_remap _broadcast_maximum!(x::NDArray, y::NDArray) broadcast_maximum(x, y) + +@_remap _broadcast_minimum(x::NDArray, y::NDArray) broadcast_minimum(x, y) +@_remap _broadcast_minimum!(x::NDArray, y::NDArray) broadcast_minimum(x, y) + ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -1630,6 +1649,8 @@ const _op_import_bl = [ # import black list; do not import these funcs "broadcast_greater_equal", "broadcast_lesser", "broadcast_lesser_equal", + "broadcast_maximum", + "broadcast_minimum", ] macro _import_ndarray_functions() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 26fb7327a21d..4d2993defdb0 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -1078,6 +1078,19 @@ function test_maximum() @test copy(maximum(X, [1, 2])) == maximum(A, [1, 2]) @test copy(maximum(X, (1, 2))) == maximum(A, (1, 2)) end + + info("NDArray::broadcast_maximum") + let + A = [1 2 3; + 4 5 6] + B = [1, + 2] + x = NDArray(A) + y = NDArray(B) + + z = max.(x, y) + @test copy(z) == max.(A, B) + end end function test_minimum() @@ -1091,6 +1104,19 @@ function test_minimum() @test copy(minimum(X, [1, 2])) == minimum(A, [1, 2]) @test copy(minimum(X, (1, 2))) == minimum(A, (1, 2)) end + + info("NDArray::broadcast_minimum") + let + A = [1 2 3; + 4 5 6] + B = [1, + 2] + x = NDArray(A) + y = NDArray(B) + + z = min.(x, y) + @test copy(z) == 
min.(A, B) + end end function test_prod() From 39beaaf14d6c7da64224ba0c0167aeccc0aa9d9e Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 22 Jan 2018 13:59:40 +0800 Subject: [PATCH 618/630] remap broadcast_to/axis/axes (#406) - export `broadcast_to`, `broadcast_axis`, `broadcast_axes` --- NEWS.md | 3 ++ src/MXNet.jl | 6 ++- src/ndarray.jl | 80 ++++++++++++++++++++++++++++++++++++++-- test/unittest/ndarray.jl | 26 +++++++++++++ 4 files changed, 111 insertions(+), 4 deletions(-) diff --git a/NEWS.md b/NEWS.md index f8d1f1073456..826ae72f01e7 100644 --- a/NEWS.md +++ b/NEWS.md @@ -13,6 +13,9 @@ * `relu()` * `softmax()` * `log_softmax()` + * `broadcast_to()` + * `broadcast_axis()` + * `broadcast_axes()` * `SymbolicNode` * `Variable` diff --git a/src/MXNet.jl b/src/MXNet.jl index bd27c715b61d..9bae62d30b73 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -42,7 +42,11 @@ export NDArray, sigmoid, relu, softmax, - log_softmax + log_softmax, + # broadcast utils + broadcast_to, + broadcast_axis, + broadcast_axes # executor.jl export Executor, diff --git a/src/ndarray.jl b/src/ndarray.jl index 3bfd7fccc8d2..b5b95e7fbbcd 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -76,7 +76,7 @@ end # NDArray Type ################################################################################ """ - NDArray + NDArray{T,N} Wrapper of the `NDArray` type in `libmxnet`. This is the basic building block of tensor-based computation. @@ -89,11 +89,11 @@ of tensor-based computation. C/C++/Python shape (100,1,28,28), while in Julia, the same piece of memory have shape (28,28,1,100). 
""" -mutable struct NDArray{T,D} +mutable struct NDArray{T,N} handle :: MX_NDArrayHandle writable :: Bool - NDArray{T,D}(handle, writable = true) where {T,D} = new(handle, writable) + NDArray{T,N}(handle, writable = true) where {T,N} = new(handle, writable) end NDArray(x::AbstractArray{T}) where {T<:DType} = copy(collect(x), cpu()) @@ -1477,6 +1477,77 @@ julia> mx.log_softmax.(x) @_remap _broadcast_minimum(x::NDArray, y::NDArray) broadcast_minimum(x, y) @_remap _broadcast_minimum!(x::NDArray, y::NDArray) broadcast_minimum(x, y) +_nddoc[:broadcast_to] = """ + broadcast_to(x::NDArray, dims) + broadcast_to(x::NDArray, dims...) + +Broadcasts the input array to a new shape. + +In the case of broacasting doesn't work out of box, +you can expand the NDArray first. + +```jldoctest +julia> x = mx.ones(2, 3, 4); + +julia> y = mx.ones(1, 1, 4); + +julia> x .+ mx.broadcast_to(y, 2, 3, 4) +2×3×4 mx.NDArray{Float32,3} @ CPU0: +[:, :, 1] = + 2.0 2.0 2.0 + 2.0 2.0 2.0 + +[:, :, 2] = + 2.0 2.0 2.0 + 2.0 2.0 2.0 + +[:, :, 3] = + 2.0 2.0 2.0 + 2.0 2.0 2.0 + +[:, :, 4] = + 2.0 2.0 2.0 + 2.0 2.0 2.0 +``` +""" +@_remap broadcast_to(x::NDArray, dims) broadcast_to(x; shape = dims) +@_remap broadcast_to(x::NDArray, dims...) broadcast_to(x; shape = dims) + +_nddoc[:broadcast_axis] = _nddoc[:broadcast_axes] = """ + broadcast_axis(x::NDArray, dim, size) + broadcast_axes(x::NDArray, dim, size) + +Broadcasts the input array over particular axis(axes). +Parameter `dim` and `size` could be a scalar, a Tuple or an Array. + +`broadcast_axes` is just an alias. 
+ +```jldoctest +julia> x +1×2×1 mx.NDArray{Int64,3} @ CPU0: +[:, :, 1] = + 1 2 + +julia> mx.broadcast_axis(x, 1, 2) +2×2×1 mx.NDArray{Int64,3} @ CPU0: +[:, :, 1] = + 1 2 + 1 2 + +julia> mx.broadcast_axis(x, 3, 2) +1×2×2 mx.NDArray{Int64,3} @ CPU0: +[:, :, 1] = + 1 2 + +[:, :, 2] = + 1 2 +``` +""" +@_remap(broadcast_axis(x::NDArray, dim, size), + broadcast_axis(x; axis = ndims(x) .- dim, size = size)) +@_remap(broadcast_axes(x::NDArray, dim, size), + broadcast_axes(x; axis = ndims(x) .- dim, size = size)) + ################################################################################ # NDArray functions dynamically imported from libmxnet ################################################################################ @@ -1651,6 +1722,9 @@ const _op_import_bl = [ # import black list; do not import these funcs "broadcast_lesser_equal", "broadcast_maximum", "broadcast_minimum", + "broadcast_to", + "broadcast_axis", + "broadcast_axes", ] macro _import_ndarray_functions() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index 4d2993defdb0..ba5830a5810f 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -1371,6 +1371,30 @@ function test_equal() @check_equal <= end # function test_equal +function test_broadcast_to() + info("NDArray::broadcast_to") + A = [1 2 3] + x = NDArray(A) + @test mx.broadcast_to(x, (1, 3)) |> copy == A + @test mx.broadcast_to(x, (5, 3)) |> copy == repeat(A, outer = (5, 1)) + + @test mx.broadcast_to(x, 1, 3) |> copy == A + @test mx.broadcast_to(x, 5, 3) |> copy == repeat(A, outer = (5, 1)) +end # function test_broadcast_to + +function test_broadcast_axis() + info("NDArray::broadcast_axis") + A = reshape([1, 2, 3], 1, 3, 1) + x = NDArray(A) + + @test mx.broadcast_axis(x, 1, 4) |> copy == [A; A; A; A] + @test mx.broadcast_axis(x, 3, 2) |> copy == cat(3, A, A) + + info("NDArray::broadcast_axes") + @test mx.broadcast_axes(x, 1, 4) |> copy == [A; A; A; A] + @test mx.broadcast_axes(x, 3, 2) |> copy == cat(3, A, A) 
+end # function test_broadcast_axis + ################################################################################ # Run tests ################################################################################ @@ -1413,6 +1437,8 @@ end # function test_equal test_hyperbolic() test_act_funcs() test_equal() + test_broadcast_to() + test_broadcast_axis() end end From ec2b6995dc2283e52f40b8ab1f6485230d02c779 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 24 Jan 2018 10:36:39 +0800 Subject: [PATCH 619/630] ndarray: remap hypot (#407) close #400 --- src/broadcast.jl | 3 ++- src/deprecated.jl | 5 +++++ src/ndarray.jl | 9 +++++++++ test/unittest/ndarray.jl | 14 ++++++++++++++ 4 files changed, 30 insertions(+), 1 deletion(-) diff --git a/src/broadcast.jl b/src/broadcast.jl index 9686db5d6412..1b58addec321 100644 --- a/src/broadcast.jl +++ b/src/broadcast.jl @@ -3,7 +3,8 @@ using TakingBroadcastSeriously: Broadcasted, unwrap for f in :[%, tan, asin, acos, atan, sinh, cosh, tanh, asinh, acosh, atanh, - min, max].args + min, max, + hypot].args # copy from TakingBroadcastSeriously @eval Base.$f(a::Broadcasted...) = Broadcasted(broadcast_($f, unwrap.(a)...)) @eval Base.$f(a::Broadcasted, b) = Broadcasted(broadcast_($f, unwrap(a), b)) diff --git a/src/deprecated.jl b/src/deprecated.jl index b722faec6c70..67b1707cdee6 100644 --- a/src/deprecated.jl +++ b/src/deprecated.jl @@ -136,3 +136,8 @@ function broadcast_minimum(x::NDArray, y::NDArray) warn("broadcast_minimum(x, y) is deprecated, use min.(x, y) instead.") min.(x, y) end + +function broadcast_hypot(x::NDArray, y::NDArray) + warn("broadcast_hypot(x, y) is deprecated, use hypot.(x, y) instead.") + hypot.(x, y) +end diff --git a/src/ndarray.jl b/src/ndarray.jl index b5b95e7fbbcd..d2ceb8498ca0 100644 --- a/src/ndarray.jl +++ b/src/ndarray.jl @@ -875,6 +875,11 @@ end fill(x, dims::Integer...) 
= fill(x, dims) +import Base: hypot + +broadcast_(::typeof(hypot), x::NDArray{T}, y::NDArray{T}) where {T} = + _broadcast_hypot(x, y) + """ Manipulating as Julia Arrays ---------------------------- @@ -1477,6 +1482,9 @@ julia> mx.log_softmax.(x) @_remap _broadcast_minimum(x::NDArray, y::NDArray) broadcast_minimum(x, y) @_remap _broadcast_minimum!(x::NDArray, y::NDArray) broadcast_minimum(x, y) +@_remap _broadcast_hypot(x::NDArray, y::NDArray) broadcast_hypot(x, y) +@_remap _broadcast_hypot!(x::NDArray, y::NDArray) broadcast_hypot(x, y) + _nddoc[:broadcast_to] = """ broadcast_to(x::NDArray, dims) broadcast_to(x::NDArray, dims...) @@ -1725,6 +1733,7 @@ const _op_import_bl = [ # import black list; do not import these funcs "broadcast_to", "broadcast_axis", "broadcast_axes", + "broadcast_hypot", ] macro _import_ndarray_functions() diff --git a/test/unittest/ndarray.jl b/test/unittest/ndarray.jl index ba5830a5810f..891dffd0f390 100644 --- a/test/unittest/ndarray.jl +++ b/test/unittest/ndarray.jl @@ -1395,6 +1395,19 @@ function test_broadcast_axis() @test mx.broadcast_axes(x, 3, 2) |> copy == cat(3, A, A) end # function test_broadcast_axis +function test_hypot() + info("NDArray::hypot") + A = [3 3 3] + B = [4, 4] + C = hypot.(A, B) + + x = NDArray(A) + y = NDArray(B) + z = hypot.(x, y) + + @test copy(z) == C +end # function test_hypot + ################################################################################ # Run tests ################################################################################ @@ -1439,6 +1452,7 @@ end # function test_broadcast_axis test_equal() test_broadcast_to() test_broadcast_axis() + test_hypot() end end From 157b0887438c6a1bcd635b51fa0b4eae3972972f Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 28 Jan 2018 18:17:43 +0800 Subject: [PATCH 620/630] doc: update predict section of mnist tutorial (#411) --- docs/src/tutorial/mnist.md | 21 ++++++++------------- examples/mnist/mlp.jl | 21 ++++++++------------- 2 files changed, 16 
insertions(+), 26 deletions(-) diff --git a/docs/src/tutorial/mnist.md b/docs/src/tutorial/mnist.md index a12e10b37821..2d1c68e23e66 100644 --- a/docs/src/tutorial/mnist.md +++ b/docs/src/tutorial/mnist.md @@ -245,21 +245,16 @@ data provider, and compute the prediction accuracy manually: ```julia # collect all labels from eval data -labels = Array[] -for batch in eval_provider - push!(labels, copy(mx.get_label(batch))) -end -labels = cat(1, labels...) +labels = reduce( + vcat, + copy(mx.get(eval_provider, batch, :softmax_label)) for batch ∈ eval_provider) +# labels are 0...9 +labels .= labels .+ 1 # Now we use compute the accuracy -correct = 0 -for i = 1:length(labels) - # labels are 0...9 - if indmax(probs[:,i]) == labels[i]+1 - correct += 1 - end -end -println(mx.format("Accuracy on eval set: {1:.2f}%", 100correct/length(labels))) +pred = map(i -> indmax(probs[1:10, i]), 1:size(probs, 2)) +correct = sum(pred .== labels) +@printf "Accuracy on eval set: %.2f%%\n" 100correct/length(labels) ``` Alternatively, when the dataset is huge, one can provide a callback to diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index 3f713654d5b9..e5aa279c4f77 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -46,18 +46,13 @@ mx.fit(model, optimizer, train_provider, eval_data=eval_provider, n_epoch=20) probs = mx.predict(model, eval_provider) # collect all labels from eval data -labels = Array[] -for batch in eval_provider - push!(labels, copy(mx.get(eval_provider, batch, :softmax_label))) -end -labels = cat(1, labels...) 
+labels = reduce( + vcat, + copy(mx.get(eval_provider, batch, :softmax_label)) for batch ∈ eval_provider) +# labels are 0...9 +labels .= labels .+ 1 # Now we use compute the accuracy -correct = 0 -for i = 1:length(labels) - # labels are 0...9 - if indmax(probs[:,i]) == labels[i]+1 - correct += 1 - end -end -println(mx.format("Accuracy on eval set: {1:.2f}%", 100correct/length(labels))) +pred = map(i -> indmax(probs[1:10, i]), 1:size(probs, 2)) +correct = sum(pred .== labels) +@printf "Accuracy on eval set: %.2f%%\n" 100correct/length(labels) From 9f4f53338ab5f96c8ff71273e95005f038755b23 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Wed, 31 Jan 2018 11:33:23 +0800 Subject: [PATCH 621/630] Optimizer module overhaul (#396) --- NEWS.md | 100 +++++++++++ README.md | 3 +- docs/src/api/optimizer.md | 16 ++ docs/src/tutorial/mnist.md | 6 +- docs/src/user-guide/overview.md | 4 +- examples/char-lstm/train.jl | 2 +- examples/cifar10/cifar10.jl | 2 +- examples/mnist/lenet-stn.jl | 2 +- examples/mnist/lenet.jl | 2 +- examples/mnist/mlp-test.jl | 9 +- examples/mnist/mlp.jl | 2 +- examples/regression-example.jl | 2 +- src/MXNet.jl | 5 +- src/base.jl | 1 + src/kvstore.jl | 2 +- src/model.jl | 24 ++- src/optimizer.jl | 306 +++++++++++++++++--------------- src/optimizers/adadelta.jl | 130 +++++++------- src/optimizers/adagrad.jl | 94 +++++----- src/optimizers/adam.jl | 104 ++++++----- src/optimizers/adamax.jl | 108 +++++------ src/optimizers/nadam.jl | 148 ++++++++------- src/optimizers/rmsprop.jl | 102 +++++------ src/optimizers/sgd.jl | 114 ++++++------ test/unittest/optimizer.jl | 68 +++++++ 25 files changed, 772 insertions(+), 584 deletions(-) create mode 100644 test/unittest/optimizer.jl diff --git a/NEWS.md b/NEWS.md index 826ae72f01e7..d531d9ea0caf 100644 --- a/NEWS.md +++ b/NEWS.md @@ -61,6 +61,9 @@ * `Nadam` * `RMSProp` * `SGD` + * `getupdater()` + * `normgrad!()` + * `update!()` * `AbstractDataProvider` * `AbstractDataBatch` @@ -344,6 +347,103 @@ Before: `clip(x, a_min = 
-4, a_max = 4)` After: `clip(x, -4, 4)` +### Optimizer + +We overhauled the optimizer APIs, introducing breaking changes. +Many names have changed, and we tried to increase the flexibility +by decoupling the optimizers from the high-level APIs, so users can use them without +understanding the implementation details of `fit!`. + +See #396. + +* All the keyword arguments of optimizers have been renamed. + Now we have more elegant keyword arguments than Python's, + thanks to good Unicode support in Julia's REPL and editor plugins. + *These are breaking changes, no deprecation warning.* + + | old | new | comment | + |---------------------------|-----------|--------------------------------| + | `opts.lr` | `η` | type `\eta` in REPL | + | `opts.momentum` | `μ` | type `\mu` in REPL | + | `opts.grad_clip` | `clip` | plain ASCII name | + | `opts.weight_decay` | `λ` | type `\lambda` in REPL | + | `opts.lr_schedular` | `η_sched` | type `\eta_sched` in REPL | + | `opts.momentum_schedular` | `μ_sched` | type `\mu_sched` in REPL | + + For instance, one used to access the learning rate via `SGD().opts.lr`, + but now it's `SGD().η`. + +* New keyword argument `scale` for gradient rescaling. + + Docstring: + ``` + If != 0, multiply the gradient with `∇r` before updating. + Often choose to be `1.0 / batch_size`. + If leave it default, high-level API like `fit!` will set it to + `1.0 / batch_size`, since `fit!` knows the `batch_size`. + ``` + +* Keyword arguments of `NadamScheduler` have been renamed. + *This is a breaking change, no deprecation warning.* + + * Before + + ```julia + NadamScheduler(; mu0 = 0.99, delta = 0.004, gamma = 0.5, alpha = 0.96) + ``` + + * After + + ```julia + NadamScheduler(; μ = 0.99, δ = 0.004, γ = 0.5, α = 0.96) + ``` + +* The attribute `optimizer.state` is removed. + `OptimizationState` is only used by high-level abstraction, like `fit!`. + +* `LearningRate` scheduler API changes: + + * `get_learning_rate` is removed. + Please use `Base.get` to get the learning rate.
+ ```julia + julia> sched = mx.LearningRate.Exp(.1) + MXNet.mx.LearningRate.Exp(0.1, 0.9, 0) + + julia> get(sched) + 0.1 + + julia> update!(sched); + + julia> get(sched) + 0.09000000000000001 + ``` + + * Use `update!` to bump the counter `Scheduler.t` + ```julia + julia> sched.t + 1 + + julia> update!(sched); + + julia> sched.t + 2 + + julia> update!(sched); + + julia> sched.t + 3 + ``` + +* `Momentum` module API changes: + + * `get_momentum_scheduler` is removed. Please use `Base.get` instead. + + ```julia + julia> get(mx.Momentum.Fixed(.9)) + 0.9 + ``` + ---- # v0.3.0 (2017.11.16) diff --git a/README.md b/README.md index c6600cdc9fd5..74208b9ac034 100644 --- a/README.md +++ b/README.md @@ -37,7 +37,8 @@ train_provider, eval_provider = get_mnist_providers(batch_size) model = mx.FeedForward(mlp, context=mx.cpu()) # optimization algorithm -optimizer = mx.SGD(lr=0.1, momentum=0.9) +# where η is learning rate and μ is momentum +optimizer = mx.SGD(η=0.1, μ=0.9) # fit parameters mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) diff --git a/docs/src/api/optimizer.md b/docs/src/api/optimizer.md index 17974a577913..28d01cc9fd89 100644 --- a/docs/src/api/optimizer.md +++ b/docs/src/api/optimizer.md @@ -1,5 +1,21 @@ # Optimizers +Say you have the parameter `W` initialized for your model and +its gradient stored as `∇` (perhaps from the AutoGrad APIs). +Here is a minimal snippet that updates your parameter `W` with `SGD`. + +```@repl +using MXNet + +opt = SGD(η = 10) +decend! = getupdater(opt) + +W = NDArray(Float32[1, 2, 3, 4]); +∇ = NDArray(Float32[.1, .2, .3, .4]); + +decend!(1, ∇, W) +``` + ```@autodocs Modules = [MXNet.mx, MXNet.mx.LearningRate, MXNet.mx.Momentum] Pages = ["optimizer.jl"] diff --git a/docs/src/tutorial/mnist.md b/docs/src/tutorial/mnist.md index 2d1c68e23e66..76430fd1b1d0 100644 --- a/docs/src/tutorial/mnist.md +++ b/docs/src/tutorial/mnist.md @@ -100,10 +100,10 @@ help.
The last thing we need to specify is the optimization algorithm (a.k.a. *optimizer*) to use. We use the basic SGD with a fixed learning rate 0.1 -and momentum 0.9: +, momentum 0.9 and weight decay 0.00001: ```julia -optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) +optimizer = mx.SGD(η=0.1, μ=0.9, λ=0.00001) ``` Now we can do the training. Here the `n_epoch` parameter specifies that @@ -205,7 +205,7 @@ on GPU, and train it. model = mx.FeedForward(lenet, context=mx.gpu()) # optimizer -optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) +optimizer = mx.SGD(η=0.05, μ=0.9, λ=0.00001) # fit parameters mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) diff --git a/docs/src/user-guide/overview.md b/docs/src/user-guide/overview.md index cddeed6bc8c9..a81d7ff30e9e 100644 --- a/docs/src/user-guide/overview.md +++ b/docs/src/user-guide/overview.md @@ -147,10 +147,10 @@ macroexpand(:(@mx.inplace a += b)) As we can see, it translate the `+=` operator to an explicit `add_to!` function call, which invokes into libmxnet to add the contents of `b` into `a` directly. 
For example, the following is the update rule in the -`SGD Optimizer` (both `grad` and `weight` are `NDArray` objects): +`SGD Optimizer` (both gradient `∇` and weight `W` are `NDArray` objects): ```julia -@inplace weight += -lr * (grad_scale * grad + self.weight_decay * weight) +@inplace W .+= -η .* (∇ + λ .* W) ``` Note there is no much magic in `mx.inplace`: it only does a shallow diff --git a/examples/char-lstm/train.jl b/examples/char-lstm/train.jl index 000534f64d7b..8b7a682c9560 100644 --- a/examples/char-lstm/train.jl +++ b/examples/char-lstm/train.jl @@ -34,7 +34,7 @@ end #--train model = mx.FeedForward(lstm, context=context) -optimizer = mx.ADAM(lr=BASE_LR, weight_decay=WEIGHT_DECAY, grad_clip=CLIP_GRADIENT) +optimizer = mx.ADAM(η=BASE_LR, λ=WEIGHT_DECAY, clip=CLIP_GRADIENT) mx.fit(model, optimizer, data_tr, eval_data=data_val, n_epoch=N_EPOCH, initializer=mx.UniformInitializer(0.1), diff --git a/examples/cifar10/cifar10.jl b/examples/cifar10/cifar10.jl index 165ee1934568..5d3d2eeafe41 100644 --- a/examples/cifar10/cifar10.jl +++ b/examples/cifar10/cifar10.jl @@ -77,7 +77,7 @@ gpus = [mx.Context(mx.GPU, i) for i = 0:num_gpus-1] model = mx.FeedForward(softmax, context=gpus) # optimizer -optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.0001) +optimizer = mx.SGD(η=0.05, μ=0.9, λ=0.0001) # fit parameters mx.fit(model, optimizer, train_provider, n_epoch=num_epoch, eval_data=test_provider, diff --git a/examples/mnist/lenet-stn.jl b/examples/mnist/lenet-stn.jl index 23ca9de3fdb3..ae94bf9b16f7 100644 --- a/examples/mnist/lenet-stn.jl +++ b/examples/mnist/lenet-stn.jl @@ -57,7 +57,7 @@ train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) model = mx.FeedForward(lenet, context=mx.cpu()) # optimizer -optimizer = mx.ADAM(lr=0.01, weight_decay=0.00001) +optimizer = mx.ADAM(η=0.01, λ=0.00001) # fit parameters initializer=mx.XavierInitializer(distribution = mx.xv_uniform, regularization = mx.xv_avg, magnitude = 1) diff --git 
a/examples/mnist/lenet.jl b/examples/mnist/lenet.jl index af3e8c41dc71..64bcdea9cba9 100644 --- a/examples/mnist/lenet.jl +++ b/examples/mnist/lenet.jl @@ -39,7 +39,7 @@ train_provider, eval_provider = get_mnist_providers(batch_size; flat=false) model = mx.FeedForward(lenet, context=mx.gpu()) # optimizer -optimizer = mx.SGD(lr=0.05, momentum=0.9, weight_decay=0.00001) +optimizer = mx.SGD(η=0.05, μ=0.9, λ=0.00001) # fit parameters mx.fit(model, optimizer, train_provider, n_epoch=20, eval_data=eval_provider) diff --git a/examples/mnist/mlp-test.jl b/examples/mnist/mlp-test.jl index 56bd00b6a122..dac2c9cd84eb 100644 --- a/examples/mnist/mlp-test.jl +++ b/examples/mnist/mlp-test.jl @@ -72,7 +72,14 @@ end function test_mnist_mlp() info("MNIST::SGD") - @test mnist_fit_and_predict(mx.SGD(lr=0.1, momentum=0.9), mx.UniformInitializer(0.01), 2) > 90 + @test mnist_fit_and_predict(mx.SGD(η=.2), mx.UniformInitializer(.01), 2) > 90 + + info("MNIST::SGD::η scheduler") + @test mnist_fit_and_predict(mx.SGD(η_sched=mx.LearningRate.Inv(.25)), + mx.UniformInitializer(.01), 2) > 90 + + info("MNIST::SGD::momentum μ") + @test mnist_fit_and_predict(mx.SGD(η=.1, μ=.9), mx.UniformInitializer(.01), 2) > 90 info("MNIST::ADAM") @test mnist_fit_and_predict(mx.ADAM(), mx.NormalInitializer(), 2) > 90 diff --git a/examples/mnist/mlp.jl b/examples/mnist/mlp.jl index e5aa279c4f77..8a73d2aa7637 100644 --- a/examples/mnist/mlp.jl +++ b/examples/mnist/mlp.jl @@ -36,7 +36,7 @@ train_provider, eval_provider = get_mnist_providers(batch_size) model = mx.FeedForward(mlp, context=mx.cpu()) # optimizer -optimizer = mx.SGD(lr=0.1, momentum=0.9, weight_decay=0.00001) +optimizer = mx.SGD(η=0.1, μ=0.9, λ=0.00001) # fit parameters mx.fit(model, optimizer, train_provider, eval_data=eval_provider, n_epoch=20) diff --git a/examples/regression-example.jl b/examples/regression-example.jl index 38541c2b7d0c..7d05baf3c632 100644 --- a/examples/regression-example.jl +++ b/examples/regression-example.jl @@ -55,7 +55,7 @@ 
net = @mx.chain mx.Variable(:data) => model = mx.FeedForward(net, context=mx.cpu()) # set up the optimizer: select one, explore parameters, if desired -#optimizer = mx.SGD(lr=0.01, momentum=0.9, weight_decay=0.00001) +#optimizer = mx.SGD(η=0.01, μ=0.9, λ=0.00001) optimizer = mx.ADAM() # train, reporting loss for training and evaluation sets diff --git a/src/MXNet.jl b/src/MXNet.jl index 9bae62d30b73..b550104a4e5b 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -95,7 +95,10 @@ export AbstractOptimizer, AdaMax, Nadam, RMSProp, - SGD + SGD, + getupdater, + normgrad!, + update! # io.jl export AbstractDataProvider, diff --git a/src/base.jl b/src/base.jl index 271e35607880..a3dcbbf7fe35 100644 --- a/src/base.jl +++ b/src/base.jl @@ -159,6 +159,7 @@ end # NTuple{N, Int} passed to libmxnet. # # TODO: find a better solution in case this cause issues in the future. +# I made `@_remap` in `ndarray.jl`. (Iblis Lin) ################################################################################ dump_mx_param(val::Any) = string(val) dump_mx_param(val::Float64) = @sprintf("%.16e", val) diff --git a/src/kvstore.jl b/src/kvstore.jl index fa4768cceaf7..c4d3ad9724a7 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -127,6 +127,6 @@ function set_optimizer(self :: KVStore, optimizer :: AbstractOptimizer) if ismatch(r"dist", string(get_type(self))) && is_worker # TODO else - set_updater(self, get_updater(optimizer)) + set_updater(self, getupdater(optimizer)) end end diff --git a/src/model.jl b/src/model.jl index 06b7a2cf8a13..2f6dfef1c6d1 100644 --- a/src/model.jl +++ b/src/model.jl @@ -286,7 +286,8 @@ end kvstore :: Union{Symbol, KVStore} = :local, force_init :: Bool = false, callbacks :: Vector{AbstractCallback} = AbstractCallback[], - verbosity :: Int = 3 + verbosity :: Int = 3, + η_decay :: Symbol = :epoch, ) function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, @@ -309,12 +310,11 @@ end Alias to [`fit`](@ref). 
""" -function train(self :: FeedForward, optimizer :: AbstractOptimizer, data :: AbstractDataProvider; kwargs...) - fit(self, optimizer, data; kwargs...) -end +train(m::FeedForward, opt::AbstractOptimizer, data::AbstractDataProvider; kw...) = + fit(m, opt, data; kw...) """ - fit(model :: FeedForward, optimizer, data; kwargs...) + fit(model::FeedForward, optimizer, data; kwargs...) Train the `model` on `data` with the `optimizer`. @@ -343,6 +343,7 @@ Train the `model` on `data` with the `optimizer`. - `1`: Print starting and final messages - `2`: Print one time messages and a message at the start of each epoch - `3`: Print a summary of the training and validation accuracy for each epoch +* `η_decay::Symbol`: `:epoch` or `:batch`, decay learning rate on epoch or batch. """ function fit(self::FeedForward, optimizer::AbstractOptimizer, data::AbstractDataProvider; kwargs...) @@ -418,10 +419,11 @@ function fit(self::FeedForward, optimizer::AbstractOptimizer, data::AbstractData aux_arrays = [NDArray[exec.aux_arrays[i] for exec in train_execs] for i = 1:length(aux_names)] op_state = OptimizationState(batch_size) - optimizer.state = op_state + # set up the gradient rescaling if user not set + iszero(optimizer.scale) && (optimizer.scale = 1 / batch_size) if !update_on_kvstore - updater = get_updater(optimizer) + updater = getupdater(optimizer) end if !isa(kvstore, Void) @@ -481,7 +483,6 @@ function fit(self::FeedForward, optimizer::AbstractOptimizer, data::AbstractData op_state.curr_iter += 1 op_state.curr_batch += 1 - optimizer.state = op_state # update parameters for idx = 1:length(param_names) @@ -514,6 +515,9 @@ function fit(self::FeedForward, optimizer::AbstractOptimizer, data::AbstractData end end + # trigger learning rate decay + opts.η_decay == :batch && update!(optimizer.η_sched) + # invoke callbacks after finishing each iteration _invoke_callbacks(self, opts.callbacks, op_state, AbstractBatchCallback) @@ -577,6 +581,10 @@ function fit(self::FeedForward, 
optimizer::AbstractOptimizer, data::AbstractData copy!(self.aux_params[name], aux_avg) end end + + # trigger learning rate decay + opts.η_decay == :epoch && update!(optimizer.η_sched) + _invoke_callbacks(self, opts.callbacks, op_state, AbstractEpochCallback; metric=metric) end # end of all epochs diff --git a/src/optimizer.jl b/src/optimizer.jl index 7a647332231b..06f93a5942d2 100644 --- a/src/optimizer.jl +++ b/src/optimizer.jl @@ -1,3 +1,7 @@ +############################################################################### +# Types +############################################################################### + """ AbstractOptimizer @@ -19,12 +23,10 @@ Base type for all momentum scheduler. """ abstract type AbstractMomentumScheduler end - - """ OptimizationState -# Attributes: +### Attributes * `batch_size`: The size of the mini-batch used in stochastic training. * `curr_epoch`: The current epoch count. Epoch 0 means no training yet, during the first @@ -45,99 +47,113 @@ mutable struct OptimizationState curr_batch :: Int curr_iter :: Int end + OptimizationState(batch_size::Int) = OptimizationState(batch_size, 0, 0, 0) +############################################################################### +# LearningRate module +############################################################################### -""" - get_learning_rate(scheduler, state) +module LearningRate -# Arguments -* `scheduler::AbstractLearningRateScheduler`: a learning rate scheduler. -* `state::OptimizationState`: the current state about epoch, mini-batch and iteration count. +import Base: get +import ..mx: AbstractLearningRateScheduler, OptimizationState, update! + +export initlrsched + +initlrsched(η::Real) = LearningRate.Fixed(η) + +update!(a::AbstractLearningRateScheduler) = (isdefined(a, :t) && (a.t += 1)) -Returns the current learning rate. 
""" -function get_learning_rate end + get(sched::AbstractLearningRateScheduler) -################################################################################ -# The learning rate module -module LearningRate -import ..mx: AbstractLearningRateScheduler, OptimizationState, get_learning_rate +Returns the current learning rate. +""" +get(::AbstractLearningRateScheduler) = nothing """ - LearningRate.Fixed + LearningRate.Fixed(η) Fixed learning rate scheduler always return the same learning rate. """ -mutable struct Fixed <: AbstractLearningRateScheduler - learning_rate :: Float64 +struct Fixed <: AbstractLearningRateScheduler + η::Float64 end -get_learning_rate(self :: Fixed, state :: OptimizationState) = self.learning_rate -""" - LearningRate.Exp +get(f::Fixed) = f.η + +doc""" + LearningRate.Exp(η₀; γ = 0.9) -``\eta_t = \eta_0\gamma^t``. Here ``t`` is the epoch count, or the iteration -count if `decay_on_iteration` is set to true. +```math +\eta_t = \eta_0\gamma^t +``` + +Where `t` is the epoch count, or the iteration count. """ mutable struct Exp <: AbstractLearningRateScheduler - learning_rate :: Float64 - gamma :: Float64 - on_iteration :: Bool + η₀::Float64 + γ ::Float64 + t ::Int end -function Exp(base_lr::Real; gamma::Real=0.9, decay_on_iteration::Bool=false) - @assert(0 < gamma < 1) - Exp(Float64(base_lr), Float64(gamma), decay_on_iteration) + +function Exp(η₀; γ = 0.9, t = 0) + @assert 0 < γ < 1 + Exp(η₀, γ, t) end -get_learning_rate(self :: Exp, state :: OptimizationState) = - self.learning_rate * self.gamma ^ (self.on_iteration ? state.curr_iter : state.curr_epoch) -""" - LearningRate.Inv -``\eta_t = \eta_0 * (1 + \gamma * t)^(-power)``. -Here ``t`` is the epoch count, or the iteration count if `decay_on_iteration` -is set to true. +get(a::Exp) = a.η₀ * a.γ^a.t + +doc""" + LearningRate.Inv(η₀; γ = 0.9, p = 0.5) + +```math +\eta_t = \eta_0 (1 + \gamma t)^{-p} +``` + +Where `t` is the epoch count, or the iteration count. 
""" mutable struct Inv <: AbstractLearningRateScheduler - learning_rate :: Float64 - gamma :: Float64 - power :: Float64 - on_iteration :: Bool + η₀::Float64 + γ ::Float64 + p ::Float64 + t ::Int end -function Inv(base_lr :: Real; gamma::Real=0.9, power::Real=0.5, decay_on_iteration::Bool=false) - @assert(0 < gamma < 1) - @assert(0 <= power) - Inv(Float64(base_lr), Float64(gamma), Float64(power), decay_on_iteration) -end -get_learning_rate(self :: Inv, state :: OptimizationState) = - self.learning_rate * ( 1 + self.gamma * (self.on_iteration ? state.curr_iter : state.curr_epoch)) ^ (-self.power) -end# module LearningRate -################################################################################ -function get_lr_scheduler(scheduler :: Any, lr :: Real) - if isa(scheduler, AbstractLearningRateScheduler) - return scheduler - else - return LearningRate.Fixed(lr) - end + +function Inv(η₀; γ = 0.9, p = 0.5, t = 0) + @assert 0 < γ < 1 + @assert 0 <= p + Inv(η₀, γ, p, t) end +get(i::Inv) = i.η₀ * (1 + i.γ*i.t)^(-i.p) + +end # module LearningRate + +using .LearningRate + +############################################################################### +# Momentum module +############################################################################### + +module Momentum + +import Base: get +import ..mx: AbstractMomentumScheduler, OptimizationState + +export initmomsched """ - get_momentum(scheduler, state) + get(sched) -* `scheduler::AbstractMomentumScheduler`: the momentum scheduler. -* `state::OptimizationState`: the state about current epoch, mini-batch and iteration count. +* `sched::AbstractMomentumScheduler`: the momentum scheduler. Returns the current momentum. """ -function get_momentum -end +get - -################################################################################ -# The Momentum module -module Momentum -import ..mx: AbstractMomentumScheduler, OptimizationState, get_momentum +initmomsched(μ::Real) = iszero(μ) ? 
Momentum.Null() : Momentum.Fixed(μ) """ Momentum.Null @@ -147,7 +163,8 @@ explicitly indicate momentum should not be used. """ struct Null <: AbstractMomentumScheduler end -get_momentum(self :: Null, state :: OptimizationState) = 0.0 + +get(::Null) = 0.0 """ Momentum.Fixed @@ -155,119 +172,116 @@ get_momentum(self :: Null, state :: OptimizationState) = 0.0 Fixed momentum scheduler always returns the same value. """ mutable struct Fixed <: AbstractMomentumScheduler - momentum :: Float64 + μ::Float64 end -get_momentum(self :: Fixed, state :: OptimizationState) = self.momentum -""" - Momentum.NadamScheduler +get(f::Fixed) = f.μ + +doc""" + NadamScheduler(; μ = 0.99, δ = 0.004, γ = 0.5, α = 0.96) Nesterov-accelerated adaptive momentum scheduler. -Description in "Incorporating Nesterov Momentum into Adam." -[http://cs229.stanford.edu/proj2015/054_report.pdf] -(http://cs229.stanford.edu/proj2015/054_report.pdf) - -``\mu_t = \mu_0 * (1 - \gamma * \alpha^{t * \delta})``. -Here -* ``t`` is the iteration count -* ``\delta``: default `0.004` is scheduler decay, -* ``\gamma``: default `0.5` -* ``\alpha``: default `0.96` -* ``\mu_0``: default `0.99` +Description in [Incorporating Nesterov Momentum into Adam] +(http://cs229.stanford.edu/proj2015/054_report.pdf). + +```math +\mu_t = \mu_0 * (1 - \gamma * \alpha^{t * \delta}) +``` + +Where +* `t`: iteration count +* `μ`: default `0.99`, μ₀ +* `δ`: default `0.004` is scheduler decay. 
+* `γ`: default `0.5` +* `α`: default `0.96` """ -mutable struct NadamScheduler <: AbstractMomentumScheduler - mu0 :: Float64 - delta :: Float64 - gamma :: Float64 - alpha :: Float64 -end -function NadamScheduler(;mu0::Real=0.99, delta::Real=0.004, - gamma::Real=0.5, alpha::Real=0.96) - @assert(0.0 <= delta) - @assert(0.0 <= alpha <= 1.0) - @assert(0.0 <= mu0 <= 1.0) - @assert(0.0 <= gamma <= 1.0) - NadamScheduler(Float64(mu0), Float64(delta), Float64(gamma), Float64(alpha)) +struct NadamScheduler <: AbstractMomentumScheduler + μ::Float64 + δ::Float64 + γ::Float64 + α::Float64 end -get_momentum(self :: NadamScheduler, state :: OptimizationState) = - self.mu0 * (1.0 - self.gamma*self.alpha^(state.curr_iter * self.delta)), - self.mu0 * (1.0 - self.gamma*self.alpha^((state.curr_iter + 1) * self.delta)) - -end # module Momentum -################################################################################ -function get_momentum_scheduler(scheduler :: Any, momentum :: Real) - if isa(scheduler, AbstractMomentumScheduler) - return scheduler - elseif momentum == 0 - return Momentum.Null() - else - return Momentum.Fixed(momentum) - end + +function NadamScheduler(; μ = 0.99, δ = 0.004, γ = 0.5, α = 0.96) + @assert 0.0 <= μ < 1.0 + @assert 0.0 <= δ + @assert 0.0 <= γ <= 1.0 + @assert 0.0 <= α <= 1.0 + NadamScheduler(μ, δ, γ, α) end -function get_momentum_scheduler(scheduler :: Any, - another_scheduler :: AbstractMomentumScheduler) +""" + get(n::NadamScheduler, t) - if isa(scheduler, AbstractMomentumScheduler) - return scheduler - else - return another_scheduler - end -end +Where `t` is the iteration count. 
+""" +get(n::NadamScheduler, t) = + n.μ * (1.0 - n.γ * n.α^( t * n.δ)), + n.μ * (1.0 - n.γ * n.α^((t + 1) * n.δ)) + +end # module Momentum + +using .Momentum + +############################################################################### +# Public APIs +############################################################################### """ - get_updater(optimizer) + getupdater(optimizer) -A utility function to create an updater function, that uses its closure to -store all the states needed for each weights. +A utility function to create an updater function of `KVStore`, +that uses its closure to store all the states needed for each weights. -* `optimizer::AbstractOptimizer`: the underlying optimizer. +The returned function has the following signature: + +```julia +decend!(index::Int, ∇::NDArray, x::NDArray) +``` + +If the optimizer is stateful and needs to access/store states during updating, +`index` will be the key to access/store states. """ -function get_updater(optimizer::AbstractOptimizer) +function getupdater(optimizer::AbstractOptimizer) states = Dict{Int,Any}() - function updater(index::Int, grad::NDArray, weight::NDArray) + function updater(index::Int, ∇::NDArray, x::NDArray) if !haskey(states, index) - states[index] = create_state(optimizer, index, weight) + states[index] = create_state(optimizer, index, x) end - update(optimizer, index, weight, grad, states[index]) + update!(optimizer, index, x, ∇, states[index]) end - return updater + updater end """ - AbstractOptimizerOptions - -Base class for all optimizer options. -""" -abstract type AbstractOptimizerOptions end - -""" - normalized_gradient(opts, state, W, ∇) + normgrad!(optimizer, W, ∇) Get the properly normalized gradient (re-scaled and clipped if necessary). -* `opts::AbstractOptimizerOptions`: options for the optimizer, - should contain the field `grad_clip` and `weight_decay`. -* `state::OptimizationState`: the current optimization state. 
+* `optimizer`: the optimizer, + should contain the field `scale`, `clip` and `λ`. * `W::NDArray`: the trainable weights. * `∇::NDArray`: the original gradient of the weights. """ -function normalized_gradient(opts::AbstractOptimizerOptions, state::OptimizationState, - W::NDArray, ∇::NDArray) - scale = 1.0 / state.batch_size - ∇ = ∇ * scale - - if opts.grad_clip > 0 - ∇ = clip(∇, -opts.grad_clip, opts.grad_clip) - end - if opts.weight_decay > 0 - @inplace ∇ += opts.weight_decay * W - end +function normgrad!(opt::AbstractOptimizer, W::NDArray, ∇::NDArray) + # rescaling + s = opt.scale + !iszero(s) && @inplace ∇ .*= s + # gradient clipping + c = opt.clip + c > 0 && clip!(∇, -c, c) + # weight decay + λ = opt.λ + λ > 0 && @inplace ∇ += λ .* W ∇ end +############################################################################### +# Builtin Optimizers +############################################################################### + include("optimizers/sgd.jl") include("optimizers/adam.jl") include("optimizers/adagrad.jl") diff --git a/src/optimizers/adadelta.jl b/src/optimizers/adadelta.jl index 3915d036496a..9fee3517a3cb 100644 --- a/src/optimizers/adadelta.jl +++ b/src/optimizers/adadelta.jl @@ -1,91 +1,87 @@ -@defstruct AdaDeltaOptions <: AbstractOptimizerOptions ( - (lr :: Real = 1.0, lr > 0), - (rho :: Real = 0.95, rho > 0 && rho < 1), - (epsilon :: Real = 1e-6, epsilon > 0), - (grad_clip :: Real = 0, grad_clip >= 0), - (weight_decay :: Real = 0.00001, weight_decay >= 0), - lr_scheduler :: Any = nothing -) - -""" - AdaDelta +doc""" + AdaDelta(; kwargs...) Scale learning rates by the ratio of accumulated gradients to accumulated updates, see [1] and notes for further description. - AdaDelta(; kwargs...) 
- -# Attributes -* `lr::Real`: default `1.0`, the learning rate controlling the - size of update steps -* `rho::Real`: default `0.9`, squared gradient moving average decay factor -* `epsilon::Real`: default `1e-6`, small value added for - numerical stability -* `grad_clip::Real`: default `0`, if positive, will clip the gradient - into the range `[-grad_clip, grad_clip]`. -* `weight_decay::Real`: default `0.00001`, weight decay is equivalent +### Attributes +* `η`: default `1.0`, learning rate. +* `ρ`: default `0.95`, squared gradient moving average decay factor. +* `ϵ`: default `1e-6`, small value added for numerical stability. +* `clip`: default `0`, gradient clipping. + If positive, will clip the gradient into the range `[-clip, clip]`. +* `scale`: default `0`, gradient rescaling. + If != 0, multiply the gradient with `scale` before updating. + Often choose to be `1.0 / batch_size`. + If leave it default, high-level API like `fit!` will set it to + `1.0 / batch_size`, since `fit!` knows the `batch_size`. +* `λ`: default `0.00001`, weight decay is equivalent to adding a global l2 regularizer for all the parameters. -# Notes -`rho` should be between 0 and 1. A value of `rho` close to 1 will decay the +### Notes +`ρ` should be between 0 and 1. A value of `ρ` close to 1 will decay the moving average slowly and a value close to 0 will decay the moving average fast. -`rho` = 0.95 and `epsilon` = 1e-6 are suggested in the paper and reported to +`ρ = 0.95` and `ϵ = 1e-6` are suggested in the paper and reported to work for multiple datasets (MNIST, speech). In the paper, no learning rate is -considered (so `lr` = 1.0). Probably best to keep it at this value. +considered (so `η = 1.0`). Probably best to keep it at this value. -`epsilon` is important for the very first update (so the numerator does -not become 0). +`ϵ` is important for the very first update (so the numerator does not become 0). 
-Using the step size `lr` and a decay factor `rho` the learning rate is +Using the step size `η` and a decay factor `ρ` the learning rate is calculated as: -``r_t &= \rho r_{t-1} + (1-\rho)*g^2\\ -\eta_t &= \eta \frac{\sqrt{s_{t-1} + \epsilon}} {\sqrt{r_t + \epsilon}}\\ -s_t &= \rho s_{t-1} + (1-\rho)*(\eta_t*g)^2`` -# References -* [1]: Zeiler, M. D. (2012): - ADADELTA: An Adaptive Learning Rate Method. arXiv Preprint arXiv:1212.5701. +```math +\begin{align*} + r_t &= ρ r_{t-1} + (1 - ρ) g^2 \\ + η_t &= η \frac{\sqrt{s_{t-1} + ϵ}} {\sqrt{r_t + ϵ}} \\ + s_t &= ρ s_{t-1} + (1 - ρ) (η_t \times g)^2 +\end{align*} +``` + +### References +1. Zeiler, M. D. (2012): + ADADELTA: An Adaptive Learning Rate Method. arXiv Preprint arXiv:1212.5701. """ - -mutable struct AdaDelta <: AbstractOptimizer - opts :: AdaDeltaOptions - state :: OptimizationState - - function AdaDelta(; kwargs...) - opts = AdaDeltaOptions(;kwargs...) - opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) - - new(opts) - end -end +AdaDelta + +@defstruct AdaDelta <: AbstractOptimizer ( + (η :: Real = 1.0, η > 0), + (ρ :: Real = 0.95, 0 < ρ < 1 ), + (ϵ :: Real = 1e-6, ϵ > 0), + (clip :: Real = 0, clip >= 0), + scale :: Real = 0, + (λ :: Real = 1e-5, λ >= 0), + η_sched :: Any = initlrsched(η) +) mutable struct AdaDeltaState - acc :: NDArray - delta_acc :: NDArray + x :: NDArray + Δx :: NDArray end -function create_state(self :: AdaDelta, index :: Int, weight :: NDArray) - return AdaDeltaState(zeros(size(weight), context(weight)), - zeros(size(weight), context(weight))) -end +create_state(::AdaDelta, ::Int, W::NDArray) = + AdaDeltaState(zeros(size(W), context(W)), zeros(size(W), context(W))) + +function update!(ada::AdaDelta, ::Int, W::NDArray, ∇::NDArray, s::AdaDeltaState) + η = get(ada.η_sched) + x = s.x + Δx = s.Δx + ρ = ada.ρ + ϵ = ada.ϵ -function update(self :: AdaDelta, index :: Int, weight :: NDArray, - grad :: NDArray, state :: AdaDeltaState) - lr = get_learning_rate(self.opts.lr_scheduler, 
self.state) - grad = normalized_gradient(self.opts, self.state, weight, grad) + normgrad!(ada, W, ∇) - # Update state.acc as in RMSProp - @inplace state.acc .*= self.opts.rho - @inplace state.acc .+= (1 - self.opts.rho) * grad .* grad + # Update s.acc as in RMSProp + @inplace x .*= ρ + @inplace x .+= (1 - ρ) .* ∇.^2 - # Compute update using the "old" state.delta_acc - update = grad .* sqrt(state.delta_acc + self.opts.epsilon) ./ - (sqrt(state.acc + self.opts.epsilon)) - @inplace weight .+= -lr * update + # Compute update using the "old" Δx + Δxₜ = ∇ .* sqrt(Δx .+ ϵ) ./ sqrt(x .+ ϵ) # FIXME: sqrt dot-call + @inplace W .+= -η .* Δxₜ - # update state.delta_acc using update - @inplace state.delta_acc .*= self.opts.rho - @inplace state.delta_acc .+= (1 - self.opts.rho) * update .* update + # update Δx using update + @inplace Δx .*= ρ + @inplace Δx .+= (1 - ρ) .* Δxₜ.^2 end diff --git a/src/optimizers/adagrad.jl b/src/optimizers/adagrad.jl index a5eee0bbd102..c72bac1e3b7e 100644 --- a/src/optimizers/adagrad.jl +++ b/src/optimizers/adagrad.jl @@ -1,66 +1,60 @@ -@defstruct AdaGradOptions <: AbstractOptimizerOptions ( - (lr :: Real = 0.1, lr > 0), - (epsilon :: Real = 1e-6, epsilon > 0), - (grad_clip :: Real = 0, grad_clip >= 0), - (weight_decay :: Real = 0.00001, weight_decay >= 0), - lr_scheduler :: Any = nothing -) - -""" - AdaGrad +doc""" + AdaGrad(; kwargs...) Scale learning rates by dividing with the square root of accumulated squared gradients. See [1] for further description. - AdaGrad(; kwargs...) - -# Attributes -* `lr::Real`: default `0.1`, the learning rate controlling the - size of update steps -* `epsilon::Real`: default `1e-6`, small value added for - numerical stability -* `grad_clip::Real`: default `0`, if positive, will clip the gradient - into the range `[-grad_clip, grad_clip]`. -* `weight_decay::Real`: default `0.00001`, weight decay is equivalent +### Arguments +* `η`: default `0.1`, learning rate. 
+* `ϵ`: default `1e-6`, small value added for numerical stability. +* `clip`: default `0`, gradient clipping. + If positive, will clip the gradient into the range `[-clip, clip]`. +* `scale`: default `0`, gradient rescaling. + If != 0, multiply the gradient with `scale` before updating. + Often choose to be `1.0 / batch_size`. + If leave it default, high-level API like `fit!` will set it to + `1.0 / batch_size`, since `fit!` knows the `batch_size`. +* `λ`: default `0.00001`, weight decay is equivalent to adding a global l2 regularizer for all the parameters. -# Notes -Using step size lr AdaGrad calculates the learning rate for feature i at +### Notes +Using step size `η` AdaGrad calculates the learning rate for feature `i` at time step t as: -``η_{t,i} = \frac{lr}{\sqrt{\sum^t_{t^\prime} g^2_{t^\prime,i} + ϵ}} g_{t,i}`` + +```math +η_{t,i} = \frac{η}{\sqrt{\sum^t_{t^\prime} g^2_{t^\prime,i} + ϵ}} g_{t,i} +``` + as such the learning rate is monotonically decreasing. Epsilon is not included in the typical formula, see [2]. -# References -* [1]: Duchi, J., Hazan, E., & Singer, Y. (2011): - Adaptive subgradient methods for online learning and - stochastic optimization. JMLR, 12:2121-2159. -* [2]: Chris Dyer: Notes on AdaGrad. - [http://www.ark.cs.cmu.edu/cdyer/adagrad.pdf] - (http://www.ark.cs.cmu.edu/cdyer/adagrad.pdf) +### References +1. Duchi, J., Hazan, E., & Singer, Y. (2011): + Adaptive subgradient methods for online learning and + stochastic optimization. JMLR, 12:2121-2159. +2. Chris Dyer: Notes on AdaGrad. 
+ [http://www.ark.cs.cmu.edu/cdyer/adagrad.pdf] + (http://www.ark.cs.cmu.edu/cdyer/adagrad.pdf) """ +AdaGrad + +@defstruct AdaGrad <: AbstractOptimizer ( + (η :: Real = 0.1, η > 0), + (ϵ :: Real = 1e-6, ϵ > 0), + (clip :: Real = 0, clip >= 0), + scale :: Real = 0, + (λ :: Real = 1e-5, λ >= 0), + η_sched :: Any = initlrsched(η) +) -mutable struct AdaGrad <: AbstractOptimizer - opts :: AdaGradOptions - state :: OptimizationState - - function AdaGrad(; kwargs...) - opts = AdaGradOptions(;kwargs...) - opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) - - new(opts) - end -end +create_state(::AdaGrad, ::Int, W::NDArray) = zeros(size(W), context(W)) -function create_state(self :: AdaGrad, index :: Int, weight :: NDArray) - return zeros(size(weight), context(weight)) -end +function update!(ada::AdaGrad, ::Int, W::NDArray, ∇::NDArray, x::NDArray) + η = get(ada.η_sched) + ϵ = ada.ϵ -function update(self :: AdaGrad, index :: Int, weight :: NDArray, - grad :: NDArray, state :: NDArray) - lr = get_learning_rate(self.opts.lr_scheduler, self.state) - grad = normalized_gradient(self.opts, self.state, weight, grad) + normgrad!(ada, W, ∇) - @inplace state .+= grad .* grad - @inplace weight .+= -lr * grad ./ (sqrt(state + self.opts.epsilon)) + @inplace x .+= ∇.^2 # update state + @inplace W .+= -η .* ∇ ./ sqrt(x .+ ϵ) # FIXME: sqrt dot-call end diff --git a/src/optimizers/adam.jl b/src/optimizers/adam.jl index aa1bc90f9f78..0d5c1a23850d 100644 --- a/src/optimizers/adam.jl +++ b/src/optimizers/adam.jl @@ -1,13 +1,3 @@ -@defstruct ADAMOptions <: AbstractOptimizerOptions ( - (lr :: Real = 0.001, lr > 0), - (grad_clip :: Real = 0, grad_clip >= 0), - (weight_decay :: Real = 0.00001, weight_decay >= 0), - (beta1 :: Real = 0.9, beta1 > 0), - (beta2 :: Real = 0.999, beta2 > 0), - (epsilon :: Real = 1e-8, epsilon > 0), - lr_scheduler :: Any = nothing -) - """ ADAM @@ -16,58 +6,66 @@ Stochastic Optimization*. arXiv:1412.6980 [cs.LG]. ADAM(; kwargs...) 
-* `lr::Real`: default `0.001`, learning rate. -* `lr_scheduler::AbstractLearningRateScheduler`: default `nothing`, a - dynamic learning rate scheduler. If set, will overwrite the `lr` - parameter. -* `beta1::Real`: default `0.9`. -* `beta2::Real`: default `0.999`. -* `epsilon::Real`: default `1e-8`. -* `grad_clip::Real`: default `0`, if positive, will clip the gradient - into the range `[-grad_clip, grad_clip]`. -* `weight_decay::Real`: default `0.00001`, weight decay is equivalent - to adding a global l2 regularizer for all the parameters. +### Arguments +* `η`: default `0.001`, learning rate. +* `β1`: default `0.9`. +* `β2`: default `0.999`. +* `ϵ`: default `1e-8`. +* `clip`: default `0`, gradient clipping. + If positive, will clip the gradient into the range `[-clip, clip]`. +* `scale`: default `0`, gradient rescaling. + If != 0, multiply the gradient with `scale` before updating. + Often choose to be `1.0 / batch_size`. + If leave it default, high-level API like `fit!` will set it to + `1.0 / batch_size`, since `fit!` knows the `batch_size`. +* `λ`: default `0.00001`, weight decay is equivalent + to adding a global l2 regularizer for all the parameters. +* `η_sched::AbstractLearningRateScheduler`: default `LearningRate.Fixed(η)`, a + dynamic learning rate scheduler. If set, will overwrite the `η` parameter. """ -mutable struct ADAM <: AbstractOptimizer - opts :: ADAMOptions - state :: OptimizationState +ADAM - function ADAM(; kwargs...) - opts = ADAMOptions(;kwargs...) 
- opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) - - new(opts) - end -end +@defstruct ADAM <: AbstractOptimizer ( + (η :: Real = 0.001, η > 0), + (β1 :: Real = 0.9, 0 <= β1 < 1), + (β2 :: Real = 0.999, 0 <= β2 < 1), + (ϵ :: Real = 1e-8, ϵ > 0), + (clip :: Real = 0, clip >= 0), + scale :: Real = 0, + (λ :: Real = 1e-5, λ >= 0), + η_sched :: Any = initlrsched(η) +) mutable struct ADAMState - current_lr :: Float64 # current learning rate - mt :: NDArray - vt :: NDArray - beta1Power :: Float64 - beta2Power :: Float64 + η :: Float64 # current learning rate + mₜ :: NDArray + vₜ :: NDArray + β1ᵗ :: Float64 + β2ᵗ :: Float64 end -function create_state(self :: ADAM, index :: Int, weight :: NDArray) - return ADAMState( get_learning_rate(self.opts.lr_scheduler, self.state), - zeros(size(weight), context(weight)), - zeros(size(weight), context(weight)), - self.opts.beta1, - self.opts.beta2 ) -end +create_state(adam::ADAM, ::Int, W::NDArray) = + ADAMState(get(adam.η_sched), + zeros(size(W), context(W)), + zeros(size(W), context(W)), + adam.β1, adam.β2) + +function update!(adam::ADAM, ::Int, W::NDArray, ∇:: NDArray, s::ADAMState) + η = s.η + β1 = adam.β1 + β2 = adam.β2 + ϵ = adam.ϵ -function update(self :: ADAM, index :: Int, weight :: NDArray, grad :: NDArray, state :: ADAMState) - lr = state.current_lr - grad = normalized_gradient(self.opts, self.state, weight, grad) + normgrad!(adam, W, ∇) - state.mt = self.opts.beta1 * state.mt + (1 - self.opts.beta1) .* grad - state.vt = self.opts.beta2 * state.vt + (1 - self.opts.beta2) .* grad .* grad + s.mₜ = β1 * s.mₜ + (1 - β1) .* ∇ + s.vₜ = β2 * s.vₜ + (1 - β2) .* ∇.^2 - at = sqrt(1.0 - state.beta2Power)/(1.0 - state.beta1Power) + aₜ= sqrt(1.0 - s.β2ᵗ)/(1.0 - s.β1ᵗ) - state.beta1Power *= self.opts.beta1 - state.beta2Power *= self.opts.beta2 + # update βᵗ to βᵗ⁺¹ + s.β1ᵗ *= β1 + s.β2ᵗ *= β2 - @inplace weight .+= -lr * at * state.mt ./ - (sqrt(state.vt) + self.opts.epsilon) + @inplace W .+= -η * aₜ * s.mₜ ./ (sqrt(s.vₜ) 
.+ ϵ) end diff --git a/src/optimizers/adamax.jl b/src/optimizers/adamax.jl index adcdb78bf255..87ef0aa68831 100644 --- a/src/optimizers/adamax.jl +++ b/src/optimizers/adamax.jl @@ -1,77 +1,67 @@ -@defstruct AdaMaxOptions <: AbstractOptimizerOptions ( - (lr :: Real = 0.002, lr > 0), - (beta1 :: Real = 0.9, beta1 > 0 && beta1 < 1), - (beta2 :: Real = 0.999, beta2 > 0 && beta2 < 1), - (epsilon :: Real = 1e-8, epsilon > 0), - (grad_clip :: Real = 0, grad_clip >= 0), - (weight_decay :: Real = 0.00001, weight_decay >= 0), - lr_scheduler :: Any = nothing -) - """ - AdaMax + AdaMax(; kwargs...) This is a variant of of the Adam algorithm based on the infinity norm. See [1] for further description. - AdaMax(; kwargs...) - -# Attributes -* `lr::Real`: default `0.002`, the learning rate controlling the - size of update steps -* `beta1::Real`: default `0.9`, exponential decay rate - for the first moment estimates -* `beta2::Real`: default `0.999`, exponential decay rate for the - weighted infinity norm estimates -* `epsilon::Real`: default `1e-8`, small value added for - numerical stability -* `grad_clip::Real`: default `0`, if positive, will clip the gradient - into the range `[-grad_clip, grad_clip]`. -* `weight_decay::Real`: default `0.00001`, weight decay is equivalent +### Arguments +* `η`: default `0.002`, learning rate. +* `β1`: default `0.9`, exponential decay rate for the first moment estimates. +* `β2`: default `0.999`, exponential decay rate for the weighted + infinity norm estimates. +* `ϵ`: default `1e-8`, small value added for numerical stability. +* `clip`: default `0`, gradient clipping. + If positive, will clip the gradient into the range `[-clip, clip]`. +* `scale`: default `0`, gradient rescaling. + If != 0, multiply the gradient with `scale` before updating. + Often choose to be `1.0 / batch_size`. + If leave it default, high-level API like `fit!` will set it to + `1.0 / batch_size`, since `fit!` knows the `batch_size`. 
+* `λ`: default `0.00001`, weight decay is equivalent to adding a global l2 regularizer for all the parameters. -# References -* [1]: Kingma, Diederik, and Jimmy Ba (2014): - Adam: A Method for Stochastic Optimization. - [http://arxiv.org/abs/1412.6980v8] - (http://arxiv.org/abs/1412.6980v8). +### References +1. Kingma, Diederik, and Jimmy Ba (2014): + Adam: A Method for Stochastic Optimization. Section 7. + [http://arxiv.org/abs/1412.6980] + (http://arxiv.org/abs/1412.6980). """ +AdaMax -mutable struct AdaMax <: AbstractOptimizer - opts :: AdaMaxOptions - state :: OptimizationState - - function AdaMax(; kwargs...) - opts = AdaMaxOptions(; kwargs...) - opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) - - new(opts) - end -end +@defstruct AdaMax <: AbstractOptimizer ( + (η :: Real = 0.002, η > 0), + (β1 :: Real = 0.9, 0 <= β1 < 1), + (β2 :: Real = 0.999, 0 <= β2 < 1), + (ϵ :: Real = 1e-8, ϵ > 0), + (clip :: Real = 0, clip >= 0), + scale :: Real = 0, + (λ :: Real = 1e-5, λ >= 0), + η_sched :: Any = initlrsched(η) +) mutable struct AdaMaxState - mt :: NDArray - ut :: NDArray - beta1Power :: Float64 + mₜ :: NDArray + uₜ :: NDArray + β1ᵗ :: Float64 end -function create_state(self :: AdaMax, index :: Int, weight :: NDArray) - return AdaMaxState( zeros(size(weight), context(weight)), - zeros(size(weight), context(weight)), - self.opts.beta1 ) -end +create_state(ada::AdaMax, ::Int, W::NDArray) = + AdaMaxState(zeros(size(W), context(W)), + zeros(size(W), context(W)), + ada.β1) + +function update!(ada::AdaMax, ::Int, W::NDArray, ∇::NDArray, s::AdaMaxState) + η = get(ada.η_sched) + β1 = ada.β1 + β2 = ada.β2 + ϵ = ada.ϵ -function update(self :: AdaMax, index :: Int, weight :: NDArray, - grad :: NDArray, state :: AdaMaxState) - lr = get_learning_rate(self.opts.lr_scheduler, self.state) - grad = normalized_gradient(self.opts, self.state, weight, grad) + normgrad!(ada, W, ∇) - @inplace state.mt .*= self.opts.beta1 - @inplace state.mt .+= (1 - self.opts.beta1) * 
grad - state.ut = _maximum(self.opts.beta2 * state.ut, abs(grad)) + s.mₜ = β1 * s.mₜ .+ (1 - β1) .* ∇ + s.uₜ = _maximum(β2 * s.uₜ, abs(∇)) # FIXME abs dot-call - @inplace weight .+= - lr / (1 - state.beta1Power) * - state.mt ./ (state.ut + self.opts.epsilon) + @inplace W .+= -η / (1 - s.β1ᵗ) * s.mₜ ./ (s.uₜ + ϵ) - state.beta1Power *= self.opts.beta1 + s.β1ᵗ *= ada.β1 end diff --git a/src/optimizers/nadam.jl b/src/optimizers/nadam.jl index c3ac18dcc11a..524465ecb984 100644 --- a/src/optimizers/nadam.jl +++ b/src/optimizers/nadam.jl @@ -1,100 +1,94 @@ -@defstruct NadamOptions <: AbstractOptimizerOptions ( - (lr :: Real = 0.001, lr > 0), - (beta1 :: Real = 0.99, beta1 > 0 && beta1 < 1), - (beta2 :: Real = 0.999, beta2 > 0 && beta2 < 1), - (epsilon :: Real = 1e-8, epsilon > 0), - (grad_clip :: Real = 0, grad_clip >= 0), - (weight_decay :: Real = 0.00001, weight_decay >= 0), - lr_scheduler :: Any = nothing, - momentum_scheduler :: Any = nothing -) - -""" - Nadam +doc""" + Nadam(; kwargs...) Nesterov Adam optimizer: Adam RMSprop with Nesterov momentum, see [1] and notes for further description. - Nadam(; kwargs...) -# Attributes -* `lr::Real`: default `0.001`, learning rate. -* `beta1::Real`: default `0.99`. -* `beta2::Real`: default `0.999`. -* `epsilon::Real`: default `1e-8`, small value added for - numerical stability -* `grad_clip::Real`: default `0`, if positive, will clip the gradient - into the range `[-grad_clip, grad_clip]`. -* `weight_decay::Real`: default `0.00001`, weight decay is equivalent +### Arguments +* `η`: default `0.001`, learning rate. +* `β1`: default `0.99`. +* `β2`: default `0.999`. +* `ϵ`: default `1e-8`, small value added for numerical stability. +* `clip`: default `0`, gradient clipping. + If positive, will clip the gradient into the range `[-clip, clip]`. +* `scale`: default `0`, gradient rescaling. + If != 0, multiply the gradient with `scale` before updating. + Often choose to be `1.0 / batch_size`. 
+ If leave it default, high-level API like `fit!` will set it to + `1.0 / batch_size`, since `fit!` knows the `batch_size`. +* `λ`: default `0.00001`, weight decay is equivalent to adding a global l2 regularizer for all the parameters. -* `lr_scheduler::AbstractLearningRateScheduler`: default `nothing`, a - dynamic learning rate scheduler. If set, will overwrite the `lr` +* `η_sched::AbstractLearningRateScheduler`: default `LearningRate.Fixed(η)`, a + dynamic learning rate scheduler. If set, will overwrite the `η` parameter. -* `momentum_scheduler::AbstractMomentumScheduler` default - `NadamScheduler` of the form - ``\mu_t = beta1 * (1 - 0.5 * 0.96^{t * 0.004})`` +* `μ_sched::NadamScheduler`: default `NadamScheduler(μ = β1)`, of the form: + + ```math + \mu_t = β_1 (1 - 0.5 \times 0.96^{t \times 0.004}) + ``` -# Notes +### Notes Default parameters follow those provided in the paper. It is recommended to leave the parameters of this optimizer at their default values. -# References -* [1]: Incorporating Nesterov Momentum into Adam. - [http://cs229.stanford.edu/proj2015/054_report.pdf] - (http://cs229.stanford.edu/proj2015/054_report.pdf) -* [2]: On the importance of initialization and momentum in deep learning - [http://www.cs.toronto.edu/~fritz/absps/momentum.pdf] - (http://www.cs.toronto.edu/~fritz/absps/momentum.pdf) +### References +1. [Incorporating Nesterov Momentum into Adam] + (http://cs229.stanford.edu/proj2015/054_report.pdf). + +2. [On the importance of initialization and momentum in deep learning] + (http://www.cs.toronto.edu/~fritz/absps/momentum.pdf). """ -mutable struct Nadam <: AbstractOptimizer - opts :: NadamOptions - state :: OptimizationState - - function Nadam(; kwargs...) - opts = NadamOptions(; kwargs...) 
- opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) - opts.momentum_scheduler = get_momentum_scheduler(opts.momentum_scheduler, - Momentum.NadamScheduler(mu0=opts.beta1)) - - new(opts) - end -end +Nadam + +@defstruct Nadam <: AbstractOptimizer ( + (η :: Real = 0.001, η > 0), + (β1 :: Real = 0.99, 0 <= β1 < 1), + (β2 :: Real = 0.999, 0 <= β2 < 1), + (ϵ :: Real = 1e-8, ϵ > 0), + (clip :: Real = 0, clip >= 0), + scale :: Real = 0, + (λ :: Real = 1e-5, λ >= 0), + η_sched :: Any = initlrsched(η), + μ_sched :: Momentum.NadamScheduler = Momentum.NadamScheduler(μ = β1) +) mutable struct NadamState - mt :: NDArray - nt :: NDArray - momentum :: Float64 - beta2Power :: Float64 + m :: NDArray + n :: NDArray + Πμ :: Float64 + β2ᵗ :: Float64 + t :: Int # use in NadamScheduler. + # we store `t` in state because state is created for each `index` end -function create_state(self :: Nadam, index :: Int, weight :: NDArray) - return NadamState( zeros(size(weight), context(weight)), - zeros(size(weight), context(weight)), - 1.0, - self.opts.beta2 ) -end +create_state(n::Nadam, ::Int, W::NDArray) = + NadamState(zeros(size(W), context(W)), zeros(size(W), context(W)), + 1.0, n.β2, 1) + +function update!(na::Nadam, ::Int, W::NDArray, ∇::NDArray, s::NadamState) + η = get(na.η_sched) + μₜ, μₜ₁= get(na.μ_sched, s.t) + β1, β2 = na.β1, na.β2 + ϵ = na.ϵ -function update(self :: Nadam, index :: Int, weight :: NDArray, - grad :: NDArray, state :: NadamState) - lr = get_learning_rate(self.opts.lr_scheduler, self.state) - grad = normalized_gradient(self.opts, self.state, weight, grad) + normgrad!(na, W, ∇) + s.t += 1 - mu_t, mu_t1 = - get_momentum(self.opts.momentum_scheduler, self.state) - state.momentum *= mu_t - momentum_next = state.momentum * mu_t1 + s.Πμ *= μₜ + Πμ′ = s.Πμ * μₜ₁ - grad_prime = grad / (1.0 - state.momentum) - @inplace state.mt .*= self.opts.beta1 - @inplace state.mt .+= (1.0 - self.opts.beta1) * grad - mt = state.mt / (1.0 - momentum_next) + ∇′ = ∇ / (1.0 - s.Πμ) 
+ @inplace s.m .*= β1 + @inplace s.m .+= (1.0 - β1) * ∇ + m̂ = s.m / (1.0 - Πμ′) - @inplace state.nt .*= self.opts.beta2 - @inplace state.nt .+= (1.0 - self.opts.beta2) .* grad .* grad - nt = state.nt / (1.0 - state.beta2Power) - state.beta2Power *= self.opts.beta2 + @inplace s.n .*= β2 + @inplace s.n .+= (1.0 - β2) .* ∇.^2 + n̂ = s.n / (1.0 - s.β2ᵗ) + s.β2ᵗ *= β2 - mt_prime = (1.0 - mu_t) * grad_prime + mu_t1 * mt - @inplace weight .+= -lr * mt_prime ./ (sqrt(nt) + self.opts.epsilon) + m̄ = (1.0 - μₜ) * ∇′+ μₜ₁ * m̂ + @inplace W .+= -η * m̄ ./ (sqrt(n̂) + ϵ) end diff --git a/src/optimizers/rmsprop.jl b/src/optimizers/rmsprop.jl index 8afed0adc81d..3c51835300c4 100644 --- a/src/optimizers/rmsprop.jl +++ b/src/optimizers/rmsprop.jl @@ -1,71 +1,67 @@ -@defstruct RMSPropOptions <: AbstractOptimizerOptions ( - (lr :: Real = 0.001, lr > 0), - (rho :: Real = 0.9, rho > 0 && rho < 1), - (epsilon :: Real = 1e-6, epsilon > 0), - (grad_clip :: Real = 0, grad_clip >= 0), - (weight_decay :: Real = 0.00001, weight_decay >= 0), - lr_scheduler :: Any = nothing -) - -""" - RMSProp +doc""" + RMSProp(; kwargs...) Scale learning rates by dividing with the moving average of the root mean squared (RMS) gradients. See [1] for further description. - RMSProp(; kwargs...) +### Arguments -# Attributes -* `lr::Real`: default `0.1`, the learning rate controlling the - size of update steps -* `rho::Real`: default `0.9`, gradient moving average decay factor -* `epsilon::Real`: default `1e-6`, small value added for - numerical stability -* `grad_clip::Real`: default `0`, if positive, will clip the gradient - into the range `[-grad_clip, grad_clip]`. -* `weight_decay::Real`: default `0.00001`, weight decay is equivalent +* `η`: default `0.1`, learning rate. +* `ρ`: default `0.9`, gradient moving average decay factor. +* `ϵ`: default `1e-8`, small value added for numerical stability. +* `clip`: default `0`, gradient clipping. + If positive, will clip the gradient into the range `[-clip, clip]`. 
+* `scale`: default `0`, gradient rescaling. + If != 0, multiply the gradient with `scale` before updating. + Often choose to be `1.0 / batch_size`. + If leave it default, high-level API like `fit!` will set it to + `1.0 / batch_size`, since `fit!` knows the `batch_size`. +* `λ`: default `0.00001`, weight decay is equivalent to adding a global l2 regularizer for all the parameters. -# Notes -`rho` should be between 0 and 1. A value of `rho` close to 1 will decay the +### Notes +`ρ` should be between 0 and 1. A value of `ρ` close to 1 will decay the moving average slowly and a value close to 0 will decay the moving average fast. -Using the step size ``lr`` and a decay factor ``\rho`` the -learning rate ``\eta_t`` is calculated as: -``r_t &= ρ r_{t-1} + (1 - ρ)*g^2 \\ - η_t &= \frac{lr}{\sqrt{r_t + ϵ}}`` +Using the step size `η` and a decay factor `ρ`, the +learning rate `ηₜ` is calculated as: -# References -* [1]: Tieleman, T. and Hinton, G. (2012): - Neural Networks for Machine Learning, Lecture 6.5 - rmsprop. - Coursera. [http://www.youtube.com/watch?v=O3sxAc4hxZU] - (http://www.youtube.com/watch?v=O3sxAc4hxZU) (formula @5:20) -""" +```math +\begin{align*} + r_t &= ρ r_{t-1} + (1 - ρ)g^2 \\ + η_t &= \frac{η}{\sqrt{r_t + ϵ}} +\end{align*} +``` -mutable struct RMSProp <: AbstractOptimizer - opts :: RMSPropOptions - state :: OptimizationState - - function RMSProp(; kwargs...) - opts = RMSPropOptions(;kwargs...) - opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) +### References +1. Tieleman, T. and Hinton, G. (2012): + Neural Networks for Machine Learning, Lecture 6.5 - rmsprop. + Coursera.
[http://www.youtube.com/watch?v=O3sxAc4hxZU] + (http://www.youtube.com/watch?v=O3sxAc4hxZU) (formula @5:20) +""" +RMSProp - new(opts) - end -end +@defstruct RMSProp <: AbstractOptimizer ( + (η :: Real = 0.001, η > 0), + (ρ :: Real = 0.9, 0 < ρ < 1), + (ϵ :: Real = 1e-8, ϵ > 0), + (clip :: Real = 0, clip >= 0), + scale :: Real = 0, + (λ :: Real = 1e-5, λ >= 0), + η_sched :: Any = initlrsched(η) +) -function create_state(self :: RMSProp, index :: Int, weight :: NDArray) - return zeros(size(weight), context(weight)) -end +create_state(::RMSProp, ::Int, W::NDArray) = zeros(size(W), context(W)) -function update(self :: RMSProp, index :: Int, weight :: NDArray, - grad :: NDArray, state :: NDArray) - lr = get_learning_rate(self.opts.lr_scheduler, self.state) - grad = normalized_gradient(self.opts, self.state, weight, grad) +function update!(rms::RMSProp, ::Int, W::NDArray, ∇::NDArray, s::NDArray) + η = get(rms.η_sched) + ρ = rms.ρ + ϵ = rms.ϵ - @inplace state .*= self.opts.rho - @inplace state .+= (1 - self.opts.rho) * grad .* grad + normgrad!(rms, W, ∇) - @inplace weight .+= -lr * grad ./ (sqrt(state + self.opts.epsilon)) + @inplace s .*= ρ + @inplace s .+= (1 - ρ) .* (∇.^2) + @inplace W .+= -η .* ∇ ./ sqrt(s .+ ϵ) # FIXME: sqrt should be dot-call end diff --git a/src/optimizers/sgd.jl b/src/optimizers/sgd.jl index 6e8ab34f1409..9da9f1a0b72b 100644 --- a/src/optimizers/sgd.jl +++ b/src/optimizers/sgd.jl @@ -1,69 +1,71 @@ -@defstruct SGDOptions <: AbstractOptimizerOptions ( - (lr :: Real = 0.01, lr > 0), - (momentum :: Real = 0.0, momentum >= 0), - (grad_clip :: Real = 0, grad_clip >= 0), - (weight_decay :: Real = 0.0001, weight_decay >= 0), - lr_scheduler :: Any = nothing, - momentum_scheduler :: Any = nothing -) - -""" - SGD +doc""" + SGD(; kwargs...) Stochastic gradient descent optimizer. - SGD(; kwargs...) +Vanilla SGD: -# Arguments: -* `lr::Real`: default `0.01`, learning rate. 
-* `lr_scheduler::AbstractLearningRateScheduler`: default `nothing`, a - dynamic learning rate scheduler. If set, will overwrite the `lr` - parameter. -* `momentum::Real`: default `0.0`, the momentum. -* `momentum_scheduler::AbstractMomentumScheduler`: default `nothing`, - a dynamic momentum scheduler. If set, will overwrite the `momentum` - parameter. -* `grad_clip::Real`: default `0`, if positive, will clip the gradient - into the bounded range `[-grad_clip, grad_clip]`. -* `weight_decay::Real`: default `0.0001`, weight decay is equivalent to - adding a global l2 regularizer to the parameters. -""" -mutable struct SGD <: AbstractOptimizer - opts :: SGDOptions - state :: OptimizationState +```math +\theta \leftarrow \theta - \eta \nabla +``` - function SGD(; kwargs...) - opts = SGDOptions(;kwargs...) - opts.lr_scheduler = get_lr_scheduler(opts.lr_scheduler, opts.lr) - opts.momentum_scheduler = get_momentum_scheduler(opts.momentum_scheduler, opts.momentum) +SGD with momentum:: - new(opts) - end -end +```math +\begin{align*} + \nu & \leftarrow \mu \nu_{t-1} - \eta \nabla \\ + \theta & \leftarrow \theta + \nu_t +\end{align*} +``` -function create_state(self :: SGD, index :: Int, weight :: NDArray) - if isa(self.opts.momentum_scheduler, Momentum.Null) - return nothing - else - return zeros(size(weight), context(weight)) - end -end +### Arguments + +* `η`: default `0.01`, learning rate. +* `μ`: default `0`, the momentum, usually set to `0.9` in this implementation. +* `λ`: default `0.0001`, weight decay is equivalent to + adding a global l2 regularizer to the parameters. +* `clip`: default `0`, gradient clipping. + If positive, will clip the gradient into the bounded range `[-clip, clip]`. +* `scale`: default `0`, gradient rescaling. + If != 0, multiply the gradient with `scale` before updating. + Often choose to be `1.0 / batch_size`. + If leave it default, high-level API like `fit!` will set it to + `1.0 / batch_size`, since `fit!` knows the `batch_size`. 
+* `μ_sched::AbstractMomentumScheduler`: default `Momentum.Null()`, + a dynamic momentum scheduler. If set, will overwrite the `momentum` + parameter. +* `η_sched::AbstractLearningRateScheduler`: default `LearningRate.Fixed(η)`, a + dynamic learning rate scheduler. If set, will overwrite the `η` parameter. +""" +SGD -function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: Void) - lr = get_learning_rate(self.opts.lr_scheduler, self.state) - grad = normalized_gradient(self.opts, self.state, weight, grad) - - @inplace weight += -lr * grad +@defstruct SGD <: AbstractOptimizer ( + (η :: Real = 0.01, η > 0), + (μ :: Real = 0.0, μ >= 0), + (clip :: Real = 0, clip >= 0), + scale :: Real = 0, + (λ :: Real = 0.0001, λ >= 0), + η_sched :: Any = initlrsched(η), + μ_sched :: Any = initmomsched(μ) +) + +create_state(sgd::SGD, ::Int, W::NDArray) = + isa(sgd.μ_sched, Momentum.Null) ? nothing : zeros(size(W), context(W)) + +function update!(sgd::SGD, ::Int, W::NDArray, ∇::NDArray, ::Void) + η = get(sgd.η_sched) + normgrad!(sgd, W, ∇) + @inplace W += -η * ∇ end # update with momentum -function update(self :: SGD, index :: Int, weight :: NDArray, grad :: NDArray, state :: NDArray) - lr = get_learning_rate(self.opts.lr_scheduler, self.state) - grad = normalized_gradient(self.opts, self.state, weight, grad) +function update!(sgd::SGD, ::Int, W::NDArray, ∇::NDArray, ν::NDArray) + η = get(sgd.η_sched) + μ = get(sgd.μ_sched) + + normgrad!(sgd, W, ∇) - mom = state :: NDArray - coef = get_momentum(self.opts.momentum_scheduler, self.state) - @inplace mom .*= coef - @inplace mom .+= -lr * grad - @inplace weight .+= mom + @inplace ν .*= μ + @inplace ν .+= -η .* ∇ + @inplace W .+= ν end diff --git a/test/unittest/optimizer.jl b/test/unittest/optimizer.jl new file mode 100644 index 000000000000..664d53d6421a --- /dev/null +++ b/test/unittest/optimizer.jl @@ -0,0 +1,68 @@ +module TestOptimizer + +using Base.Test + +using MXNet +using MXNet.mx.LearningRate +using 
MXNet.mx.Momentum + + +function test_fixed_η() + info("Optimizer::LearningRate::Fixed") + x = LearningRate.Fixed(.42) + @test get(x) == .42 + update!(x) + @test get(x) == .42 +end # function test_fixed_η + + +function check_η_decay(x) + info("Optimizer::LearningRate::$x") + + η = get(x) + @test η == 1 + + for i ∈ 1:5 + update!(x) + η′ = get(x) + @test η′ < η + η = η′ + end +end # function check_η_decay + + +test_exp_η() = LearningRate.Exp(1) |> check_η_decay + + +test_inv_η() = LearningRate.Inv(1) |> check_η_decay + + +function test_μ_null() + info("Optimizer::Momentum::Null") + x = Momentum.Null() + @test iszero(get(x)) +end + + +function test_μ_fixed() + info("Optimizer::Momentum::Fixed") + x = Momentum.Fixed(42) + @test get(x) == 42 +end + + +@testset "Optimizer Test" begin + @testset "LearningRate Test" begin + test_fixed_η() + test_exp_η() + test_inv_η() + end + + @testset "Momentum Test" begin + test_μ_null() + test_μ_fixed() + end +end + + +end # module TestOptimizer From 2c09c26b1b781fc3d612eed26edc732e54f321c5 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 4 Feb 2018 16:37:11 +0800 Subject: [PATCH 622/630] Update README: `predict` section (#412) See also #411 --- README.md | 24 ++++++++++-------------- 1 file changed, 10 insertions(+), 14 deletions(-) diff --git a/README.md b/README.md index 74208b9ac034..26a20cf3a0db 100644 --- a/README.md +++ b/README.md @@ -50,22 +50,18 @@ You can also predict using the `model` in the following way: probs = mx.predict(model, eval_provider) # collect all labels from eval data -labels = Array[] -for batch in eval_provider - push!(labels, copy(mx.get(eval_provider, batch, :softmax_label))) -end -labels = cat(1, labels...) 
+labels = reduce( + vcat, + copy(mx.get(eval_provider, batch, :softmax_label)) for batch ∈ eval_provider) +# labels are 0...9 +labels .= labels .+ 1 # Now we use compute the accuracy -correct = 0 -for i = 1:length(labels) - # labels are 0...9 - if indmax(probs[:,i]) == labels[i]+1 - correct += 1 - end -end +pred = map(i -> indmax(probs[1:10, i]), 1:size(probs, 2)) +correct = sum(pred .== labels) accuracy = 100correct/length(labels) -println(mx.format("Accuracy on eval set: {1:.2f}%", accuracy)) +@printf "Accuracy on eval set: %.2f%%\n" accuracy ``` -For more details, please refer to the [documentation](https://dmlc.github.io/MXNet.jl/latest) and [examples](examples). +For more details, please refer to the +[documentation](https://dmlc.github.io/MXNet.jl/latest) and [examples](examples). From 6ac37f9ae2f8755ed349a8f9e071f55ed42516b5 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 5 Feb 2018 11:35:54 +0800 Subject: [PATCH 623/630] kvstore: refine and copy docstring from Python (#388) * kvstore: refine and copy docstring from Python add a Base.show for KVStore docstring for set_updater set_updater -> setupdater! and test cases set_optimizer -> setoptimizer! sgd * docstring of setoptimizer! --- NEWS.md | 6 + src/MXNet.jl | 7 +- src/kvstore.jl | 322 ++++++++++++++++++++++++++++++++------- src/model.jl | 22 ++- test/unittest/kvstore.jl | 28 +++- 5 files changed, 312 insertions(+), 73 deletions(-) diff --git a/NEWS.md b/NEWS.md index d531d9ea0caf..71ee86ff7da4 100644 --- a/NEWS.md +++ b/NEWS.md @@ -47,6 +47,12 @@ * `SeqMetric` * `KVStore` + * `init!()` + * `push!()` + * `pull!()` + * `barrier()` + * `set_updater()` + * `set_optimizer()` * `AbstractInitializer` * `UniformInitializer` diff --git a/src/MXNet.jl b/src/MXNet.jl index b550104a4e5b..a22e4040fece 100644 --- a/src/MXNet.jl +++ b/src/MXNet.jl @@ -79,7 +79,12 @@ export AbstractEvalMetric, SeqMetric # kvstore.jl -export KVStore +export KVStore, + init!, + pull!, + barrier, + setoptimizer!, + setupdater! 
# initializer.jl export AbstractInitializer, diff --git a/src/kvstore.jl b/src/kvstore.jl index c4d3ad9724a7..755d6f3d1b20 100644 --- a/src/kvstore.jl +++ b/src/kvstore.jl @@ -1,3 +1,31 @@ +import Base.push! + +""" + KVStore(kv_type = :local) + +For single machine training, there are two commonly used types: + +- `local`: Copies all gradients to CPU memory and updates weights there. + +- `device`: Aggregates gradients and updates weights on GPU(s). + With this setting, the `KVStore` also attempts to use GPU peer-to-peer + communication, potentially accelerating the communication. + +For distributed training, `KVStore` also supports a number of types: + +- `dist_sync`: Behaves similarly to `local` but with one major difference. + With `dist_sync`, batch-size now means the batch size used on each machine. + So if there are `n` machines and we use batch size ``b``, + then `dist_sync` behaves like `local` with batch size `n * b`. + +- `dist_device_sync`: Identical to `dist_sync` with the difference similar + to `device` vs `local`. + +- `dist_async`: Performs asynchronous updates. + The weights are updated whenever gradients are received from any machine. + No two updates happen on the same weight at the same time. + However, the order is not guaranteed. 
+""" mutable struct KVStore handle :: MX_KVStoreHandle updater_c :: Ptr{Void} @@ -7,20 +35,21 @@ mutable struct KVStore end function KVStore(kv_type::Symbol = :local) - #@assert(kv_type ∈ [:local]) # TODO: update with allowed types - + @assert kv_type ∈ (:local, :device, :dist_sync, :dist_device_sync, :dist_async) ref_hdr = Ref{MX_handle}(0) - kv_type = string(kv_type) - @mxcall(:MXKVStoreCreate, (char_p, Ref{MX_handle}), kv_type, ref_hdr) - return KVStore(MX_KVStoreHandle(ref_hdr[])) + @mxcall(:MXKVStoreCreate, (char_p, Ref{MX_handle}), dump_mx_param(kv_type), ref_hdr) + KVStore(MX_KVStoreHandle(ref_hdr[])) end -function Base.unsafe_convert(::Type{MX_handle}, obj::KVStore) + +Base.unsafe_convert(::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(MX_handle, obj.handle) -end Base.convert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) Base.cconvert(t::Type{MX_handle}, obj::KVStore) = Base.unsafe_convert(t, obj) -function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{<:Vector{<:NDArray}}) +Base.show(io::IO, kv::KVStore) = + print(io, "mx.KVStore @ $(get_type(kv))") + +function _flatten_kvlist(keys::Vector{Int}, vals::Vector{<:Vector{<:NDArray}}) @assert length(keys) == length(vals) keys_flt = Int[] vals_flt = NDArray[] @@ -31,102 +60,277 @@ function _flatten_kvlist(keys :: Vector{Int}, vals :: Vector{<:Vector{<:NDArray} return (keys_flt, vals_flt) end -init!(self::KVStore, key::Int, val::NDArray) = init!(self, [key], [val]) +""" + init!(kv::KVStore, key::Int, val::NDArray) + init!(kv::KVStore, keys, vals) + +Initializes a single or a sequence of key-value pairs into the store. -init!(self::KVStore, key::Int, vals::Vector{<:NDArray}) = - init!(self, Base.ones(Int, length(vals)) * key, vals) +For each key, one must `init!` it before calling `push!` or `pull!`. +When multiple workers invoke `init!` for the same key, only +the value supplied by worker with rank `0` is used. This function returns +after data has been initialized successfully. 
-init!(self::KVStore, keys::Vector{Int}, vals::Vector{<:Vector{<:NDArray}}) = - init!(self, _flatten_kvlist(keys, vals)...) +```jldoctest +julia> kv = KVStore(:local) +mx.KVStore @ local -function init!(self::KVStore, keys::Vector{Int}, vals::Vector{<:NDArray}) +julia> init!(kv, 42, mx.rand(2, 3)) +``` +""" +init!(kv::KVStore, key::Int, val::NDArray) = init!(kv, [key], [val]) +init!(kv::KVStore, key::Int, vals::Vector{<:NDArray}) = + init!(kv, Base.ones(Int, length(vals)) * key, vals) +init!(kv::KVStore, keys::Vector{Int}, vals::Vector{<:Vector{<:NDArray}}) = + init!(kv, _flatten_kvlist(keys, vals)...) + +function init!(kv::KVStore, keys::Vector{Int}, vals::VecOfNDArray) @assert length(keys) == length(vals) keys = Cint[keys...] vals = MX_handle[vals...] @mxcall(:MXKVStoreInit, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}), - self, length(keys), keys, vals) + kv, length(keys), keys, vals) end -import Base.push! -function push!(self :: KVStore, key :: Int, val :: NDArray; priority :: Int = 0) - push!(self, [key], [val]; priority = priority) -end -function push!(self :: KVStore, key :: Int, vals :: Vector{<:NDArray}; priority :: Int = 0) - push!(self, Base.ones(Int, length(vals))*key, vals; priority = priority) -end -function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{<:Vector{<:NDArray}}; - priority::Int=0) - push!(self, _flatten_kvlist(keys, vals)...; priority = priority) -end -function push!(self :: KVStore, keys :: Vector{Int}, vals :: Vector{<:NDArray}; priority::Int=0) +""" + push!(kv::KVStore, key, val; priority = 0) + push!(kv::KVStore, key, vals; priority = 0) + push!(kv::KVStore, keys, vals; priority = 0) + +Pushes a single or a sequence of key-value pairs into the store. + +This function returns immediately after adding an operator to the engine. +The actual operation is executed asynchronously. If there are consecutive +pushes to the same key, there is no guarantee on the serialization of pushes. 
+The execution of a push does not guarantee that all previous pushes are +finished. There is no synchronization between workers by default. +One can use ``barrier()`` to sync all workers. + +`push!` and `pull!` single `NDArray`: +```jldoctest +julia> kv = KVStore(:local) +mx.KVStore @ local + +julia> x = mx.empty(2, 3); + +julia> init!(kv, 3, x) + +julia> push!(kv, 3, mx.ones(2, 3) * 8) + +julia> pull!(kv, 3, x) + +julia> x +2×3 mx.NDArray{Float32,2} @ CPU0: + 8.0 8.0 8.0 + 8.0 8.0 8.0 +``` + +Aggregate values and `push!`: +```jldoctest +julia> vals = [mx.ones((2, 3), gpu(0)) * 3, mx.ones((2, 3), gpu(1)) * 4]; + +julia> push!(kv, 3, vals) + +julia> pull!(kv, 3, x) + +julia> x +2×3 mx.NDArray{Float32,2} @ CPU0: + 7.0 7.0 7.0 + 7.0 7.0 7.0 +``` + +`push!` a list of key to single device: + +```jldoctest +julia> keys = [4, 5]; + +julia> init!(kv, keys, [empty(2, 3), empty(2, 3)]) + +julia> push!(kv, keys, [x, x]) + +julia> y, z = empty(2, 3), empty(2, 3); + +julia> pull!(kv, keys, [y, z]) +``` +""" +push!(kv::KVStore, key::Int, val::NDArray; priority::Int = 0) = + push!(kv, [key], [val]; priority = priority) +push!(kv::KVStore, key::Int, vals::Vector{<:NDArray}; priority::Int = 0) = + push!(kv, Base.ones(Int, length(vals)) * key, vals; priority = priority) +push!(kv:: KVStore, keys::Vector{Int}, vals::Vector{<:Vector{<:NDArray}}; + priority::Int = 0) = + push!(kv, _flatten_kvlist(keys, vals)...; priority = priority) + +function push!(kv::KVStore, keys::Vector{Int}, vals::Vector{<:NDArray}; priority::Int = 0) @assert length(keys) == length(vals) keys = Cint[keys...] vals = MX_handle[vals...] 
@mxcall(:MXKVStorePush, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), - self, length(keys), keys, vals, priority) + kv, length(keys), keys, vals, priority) end -function pull!(self :: KVStore, key :: Int, out :: NDArray; priority :: Int = 0) - pull!(self, [key], [out]) -end -function pull!(self :: KVStore, key :: Int, outs :: Vector{<:NDArray}; priority :: Int = 0) - pull!(self, Base.ones(Int, length(outs))*key, outs; priority = priority) -end -function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{<:Vector{<:NDArray}}; priority::Int=0) - pull!(self, _flatten_kvlist(keys, outs)...; priority = priority) -end -function pull!(self :: KVStore, keys :: Vector{Int}, outs :: Vector{<:NDArray}; priority::Int=0) +""" Pulls a single value or a sequence of values from the store. + +This function returns immediately after adding an operator to the engine. +Subsequent attempts to read from the `out` variable will be blocked until the +pull operation completes. + +`pull` is executed asynchronously after all previous `pull` calls and only +the last `push` call for the same input key(s) are finished. + +The returned values are guaranteed to be the latest values in the store. + +See [`push!`](@ref) for more examples. +""" +pull!(kv::KVStore, key::Int, out::NDArray; priority::Int = 0) = + pull!(kv, [key], [out], priority = priority) +pull!(kv::KVStore, key::Int, outs::Vector{<:NDArray}; priority::Int = 0) = + pull!(kv, Base.ones(Int, length(outs))*key, outs; priority = priority) +pull!(kv::KVStore, keys::Vector{Int}, outs::Vector{<:Vector{<:NDArray}}; + priority::Int = 0) = + pull!(kv, _flatten_kvlist(keys, outs)...; priority = priority) + +function pull!(kv::KVStore, keys::Vector{Int}, outs::Vector{<:NDArray}; priority::Int = 0) @assert length(keys) == length(outs) keys = Cint[keys...] outs = MX_handle[outs...]
@mxcall(:MXKVStorePull, (MX_handle, MX_uint, Ptr{Cint}, Ptr{MX_handle}, Cint), - self, length(keys), keys, outs, priority) + kv, length(keys), keys, outs, priority) end -function get_type(self :: KVStore) +function get_type(kv::KVStore) type_ref = Ref{char_p}(0) - @mxcall(:MXKVStoreGetType, (MX_handle, Ref{char_p}), self, type_ref) + @mxcall(:MXKVStoreGetType, (MX_handle, Ref{char_p}), kv, type_ref) return Symbol(unsafe_string(type_ref[])) end -function get_num_workers(self :: KVStore) +function get_num_workers(kv::KVStore) ref_size = Ref{Cint}(0) - @mxcall(:MXKVStoreGetGroupSize, (MX_handle, Ref{Cint}), self, ref_size) + @mxcall(:MXKVStoreGetGroupSize, (MX_handle, Ref{Cint}), kv, ref_size) return Int(ref_size[]) end -function get_rank(self :: KVStore) +function get_rank(kv::KVStore) ref_rank = Ref{Cint}(0) - @mxcall(:MXKVStoreGetRank, (MX_handle, Ref{Cint}), self, ref_rank) + @mxcall(:MXKVStoreGetRank, (MX_handle, Ref{Cint}), kv, ref_rank) return Int(ref_rank[]) end +""" + barrier(kv::KVStore) + +Invokes global barrier among all worker nodes. + +For example, assume there are `n` machines. We would like machine `0` to first +`init` the values and then have all the workers `pull` the initialized value. +Before pulling, we can invoke `barrier(kv)` to guarantee that the +initialization is finished. +""" +barrier(kv::KVStore) = @mxcall(:MXKVStoreBarrier, (MX_handle,), kv) + # TODO: Currently Julia does not support closure in c-callbacks, so we are making use of the # extra handle parameter of the API to pass the updater object around. Fix this when someday # full closure cfunction is supported in Julia.
-function _kvstore_update_wrapper(index::Cint, nd_recv::MX_handle, nd_local::MX_handle, updater::Ptr{Void}) - updater_func = unsafe_pointer_to_objref(updater) :: Function - updater_func(Int(index), NDArray(MX_NDArrayHandle(nd_recv)), NDArray(MX_NDArrayHandle(nd_local))) - return nothing +function _kvstore_update_wrapper(key::Cint, nd_recv::MX_handle, nd_local::MX_handle, + updater::Ptr{Void}) + updater_func = unsafe_pointer_to_objref(updater) + updater_func(Int(key), NDArray(MX_NDArrayHandle(nd_recv)), + NDArray(MX_NDArrayHandle(nd_local))) + nothing end -function set_updater(self :: KVStore, updater :: Function) - self.updater = updater # keep a reference to the julia object so that updater_c is kept valid - self.updater_c = cfunction(_kvstore_update_wrapper, Void, (Cint, MX_handle, MX_handle, Ptr{Void})) +""" + setupdater!(kv, updater) + +Sets a `push!` updater into the store. + +This function only changes the local store. +When running on multiple machines one must use `setoptimizer!`.
+ +```jldoctest +julia> update(key, val, orig) = mx.@inplace orig += val .* .2 +update (generic function with 1 method) + +julia> kv = KVStore(:local) +mx.KVStore @ local + +julia> mx.setupdater!(kv, update) + +julia> init!(kv, 42, mx.ones(2, 3)) + +julia> push!(kv, 42, mx.ones(2, 3)) + +julia> x = empty(2, 3); + +julia> pull!(kv, 42, x) + +julia> x +2×3 mx.NDArray{Float32,2} @ CPU0: + 1.2 1.2 1.2 + 1.2 1.2 1.2 +``` +""" +function setupdater!(kv::KVStore, updater) + kv.updater = updater # keep a reference to the julia object so that updater_c is kept valid + kv.updater_c = cfunction(_kvstore_update_wrapper, Void, + (Cint, MX_handle, MX_handle, Ptr{Void})) @mxcall(:MXKVStoreSetUpdater, (MX_handle, Ptr{Void}, Any), - self, self.updater_c, updater) + kv, kv.updater_c, updater) end -function set_optimizer(self :: KVStore, optimizer :: AbstractOptimizer) - ref_is_worker = Ref{Cint}(0) - @mxcall(:MXKVStoreIsWorkerNode, (Ref{Cint},), ref_is_worker) - is_worker = ref_is_worker[] +""" + setoptimizer!(kv::KVStore, opt) + +Registers an optimizer with the kvstore. + +When using a single machine, this function updates the local optimizer. +If using multiple machines and this operation is invoked from a worker node, +it will serialize the optimizer with pickle and send it to all servers. +The function returns after all servers have been updated.
+ +```jldoctest +julia> kv = KVStore() +mx.KVStore @ local + +julia> W = mx.zeros(2, 3) # 2×3 weight matrix +2×3 mx.NDArray{Float32,2} @ CPU0: + 0.0 0.0 0.0 + 0.0 0.0 0.0 - if ismatch(r"dist", string(get_type(self))) && is_worker +julia> init!(kv, 42, W) + +julia> setoptimizer!(kv, SGD(η = .2)) # SGD with .2 as learning rate + +julia> ∇W = mx.ones(2, 3) # assume it's the gradient +2×3 mx.NDArray{Float32,2} @ CPU0: + 1.0 1.0 1.0 + 1.0 1.0 1.0 + +julia> push!(kv, 42, ∇W) + +julia> pull!(kv, 42, W) # fetch weight and write back to `W` + +julia> W +2×3 mx.NDArray{Float32,2} @ CPU0: + -0.2 -0.2 -0.2 + -0.2 -0.2 -0.2 +``` +""" +function setoptimizer!(kv::KVStore, opt::AbstractOptimizer) + if ismatch(r"dist", string(get_type(kv))) && _isworker() # TODO + error("not implemented") else - set_updater(self, getupdater(optimizer)) + setupdater!(kv, getupdater(opt)) end end + +function _isworker()::Bool + ref = Ref{Cint}(0) + @mxcall(:MXKVStoreIsWorkerNode, (Ref{Cint},), ref) + ref[] != 0 +end + +# TODO: sparse support?
diff --git a/src/model.jl b/src/model.jl index 2f6dfef1c6d1..a9febc922ec6 100644 --- a/src/model.jl +++ b/src/model.jl @@ -281,27 +281,25 @@ end @defstruct TrainingOptions ( initializer :: AbstractInitializer = UniformInitializer(0.01), n_epoch :: Int = 10, - eval_data :: Union{Void, AbstractDataProvider} = nothing, + eval_data :: Union{Void,AbstractDataProvider} = nothing, eval_metric :: AbstractEvalMetric = Accuracy(), - kvstore :: Union{Symbol, KVStore} = :local, + kvstore :: Union{Symbol,KVStore} = :local, force_init :: Bool = false, callbacks :: Vector{AbstractCallback} = AbstractCallback[], verbosity :: Int = 3, η_decay :: Symbol = :epoch, ) -function _invoke_callbacks(self::FeedForward, callbacks::Vector{AbstractCallback}, +function _invoke_callbacks(m::FeedForward, callbacks::Vector{AbstractCallback}, state::OptimizationState, type_filter::Type; - metric::Vector{Tuple{Symbol,T}} = Vector{Tuple{Symbol,Real}}()) where T<:Real + metric = Vector{Tuple{Symbol,Real}}()) map(callbacks) do cb - if isa(cb, type_filter) - if type_filter == AbstractEpochCallback - # epoch callback have extra access to the model object - cb(self, state, metric) - else - cb(state) - end - end + !isa(cb, type_filter) && return + + # epoch callback have extra access to the model object + type_filter == AbstractEpochCallback && return cb(m, state, metric) + + cb(state) end end diff --git a/test/unittest/kvstore.jl b/test/unittest/kvstore.jl index cf15f1a65f05..89af95203c90 100644 --- a/test/unittest/kvstore.jl +++ b/test/unittest/kvstore.jl @@ -13,7 +13,7 @@ function init_kv() vals = [mx.zeros(SHAPE) for k in KEYS] mx.init!(kv, KEYS, vals) - return kv + kv end function test_kv_basic() @@ -62,10 +62,36 @@ function test_aggregator() end end +function check_setupdater!(f) + kv = KVStore(:local) + setupdater!(kv, f) + + A = Float32[1, 2, 3, 4] + B = Float32[.5, .6, .7, .8] + x = NDArray(A) + Δ = NDArray(B) + init!(kv, 42, x) + push!(kv, 42, Δ) + pull!(kv, 42, x) + + @test copy(x) ≈ A + 2B +end 
# function check_setupdater! + +function test_setupdater!() + info("KVStore::setupdater!") + + f(key, Δ, x) = @mx.inplace x += 2Δ + g(key, Δ, x) = (x[:] += 2Δ) + + check_setupdater!(f) + check_setupdater!(g) +end # test_setupdater! + @testset "KVStore Test" begin test_kv_basic() test_single_kv_pair() test_aggregator() + test_setupdater!() end end From 4038704f1f8bd733bc2aab5205068dddbbf122a2 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 15 Feb 2018 15:17:34 +0800 Subject: [PATCH 624/630] build: Propagate more build flags from ENV (#414) - `ADD_CFLAGS` - `ADD_LDFLAGS` See https://github.com/dmlc/MXNet.jl/issues/413#issuecomment-365664071 --- deps/build.jl | 12 ++++++++++++ docs/src/user-guide/install.md | 21 ++++++++++++++------- 2 files changed, 26 insertions(+), 7 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index ff4441227cac..0312f6ed870c 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -68,6 +68,10 @@ else info("Did not find a CUDA installation, using CPU-only version of MXNet.") end +# propagate more build flags from ENV +const ADD_CFLAGS = get(ENV, "ADD_CFLAGS", nothing) +const ADD_LDFLAGS = get(ENV, "ADD_LDFLAGS", nothing) + function get_cpucore() if haskey(ENV, "TRAVIS") # on travis-ci 2 @@ -219,6 +223,14 @@ if !libmxnet_detected `sed -i -s 's/ADD_CFLAGS =\(.*\)/ADD_CFLAGS =\1 -DMXNET_USE_LAPACK/' config.mk` end + # propagate more build flags from ENV + if ADD_CFLAGS != nothing + `sed -i -s "s@ADD_CFLAGS =\(.*\)@ADD_CFLAGS =\1 $ADD_CFLAGS@" config.mk` + end + if ADD_LDFLAGS != nothing + `sed -i -s "s@ADD_LDFLAGS =\(.*\)@ADD_LDFLAGS =\1 $ADD_LDFLAGS@" config.mk` + end + if USE_JULIA_BLAS `make -j$(get_cpucore()) USE_BLAS=$blas_name $MSHADOW_LDFLAGS` else diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md index 30ed65d48511..4583f9f925d3 100644 --- a/docs/src/user-guide/install.md +++ b/docs/src/user-guide/install.md @@ -21,13 +21,20 @@ MXNet.jl is built on top of [libmxnet](https://github.com/dmlc/mxnet). 
Upon installation, Julia will try to automatically download and build libmxnet. -There are three environment variables that change this behaviour. If you -already have a pre-installed version of mxnet you can use `MXNET_HOME` -to point the build-process in the right direction. If the automatic -cuda detection fails you can also set `CUDA_HOME` to override the process. -To control which version of libmxnet will be compiled, you can use the -`MXNET_COMMIT` variable to point to either a version tag (e.g. `v0.10.0`), a -branch name (e.g. `master`) or a specific commit hash (e.g. `a0b1c2d3`). +There are several environment variables that change this behaviour. + +- `MXNET_HOME`: If you already have a pre-installed version of mxnet + you can use `MXNET_HOME` to point the build-process in the right direction. +- `CUDA_HOME`: If the automatic cuda detection fails you can also set `CUDA_HOME` + to override the process. +- `MXNET_COMMIT`: To control which version of libmxnet will be compiled, + you can use the`MXNET_COMMIT` variable to point to either a version tag + (e.g. `v0.10.0`), a branch name (e.g. `master`) or a specific commit hash + (e.g. `a0b1c2d3`). +- `ADD_CFLAGS`: Additional C flags. For instance, + if you need to point non-standard include directory, please set it as + `ENV["ADD_CFLAGS"] = "-I'/path/to/include/dir'"`. +- `ADD_LDFLAGS`: Additional linker flags. The libmxnet source is downloaded to `Pkg.dir("MXNet", "deps", "src", "mxnet")`. The automatic build is using default configurations, with OpenCV disabled. 
From 3c8e9d3abdfead7e113ca81ea87f8ae5e43ca304 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sun, 4 Mar 2018 15:42:17 +0800 Subject: [PATCH 625/630] build: propagate CC/CXX into config.mk (#419) * build: propagate CC/CXX into config.mk See: https://github.com/dmlc/MXNet.jl/issues/418#issuecomment-369638203 * update doc --- deps/build.jl | 8 ++++++++ docs/src/user-guide/install.md | 2 ++ 2 files changed, 10 insertions(+) diff --git a/deps/build.jl b/deps/build.jl index 0312f6ed870c..38c8e19c2fa2 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -69,6 +69,8 @@ else end # propagate more build flags from ENV +const CC = get(ENV, "CC", nothing) +const CXX = get(ENV, "CXX", nothing) const ADD_CFLAGS = get(ENV, "ADD_CFLAGS", nothing) const ADD_LDFLAGS = get(ENV, "ADD_LDFLAGS", nothing) @@ -224,6 +226,12 @@ if !libmxnet_detected end # propagate more build flags from ENV + if CC != nothing + `sed -i -s "s@^export CC =\(.*\)@export CC = $CC@" config.mk` + end + if CXX != nothing + `sed -i -s "s@^export CXX =\(.*\)@export CXX = $CXX@" config.mk` + end if ADD_CFLAGS != nothing `sed -i -s "s@ADD_CFLAGS =\(.*\)@ADD_CFLAGS =\1 $ADD_CFLAGS@" config.mk` end diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md index 4583f9f925d3..dd1262b47c61 100644 --- a/docs/src/user-guide/install.md +++ b/docs/src/user-guide/install.md @@ -31,6 +31,8 @@ There are several environment variables that change this behaviour. you can use the`MXNET_COMMIT` variable to point to either a version tag (e.g. `v0.10.0`), a branch name (e.g. `master`) or a specific commit hash (e.g. `a0b1c2d3`). +- `CC`: The path of C compiler. +- `CXX`: The path of C++ compiler. - `ADD_CFLAGS`: Additional C flags. For instance, if you need to point non-standard include directory, please set it as `ENV["ADD_CFLAGS"] = "-I'/path/to/include/dir'"`. 
From 3df1214e6b3e71d10d4f7156bcfb56e633b38f16 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Thu, 8 Mar 2018 20:23:06 +0800 Subject: [PATCH 626/630] build: propagate USE_JEMALLOC (#422) * build: propagate USE_JEMALLOC see https://github.com/dmlc/MXNet.jl/issues/418#issuecomment-371209108 --- deps/build.jl | 4 ++++ docs/src/user-guide/install.md | 9 +++++++++ 2 files changed, 13 insertions(+) diff --git a/deps/build.jl b/deps/build.jl index 38c8e19c2fa2..a16afe6aaac0 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -73,6 +73,7 @@ const CC = get(ENV, "CC", nothing) const CXX = get(ENV, "CXX", nothing) const ADD_CFLAGS = get(ENV, "ADD_CFLAGS", nothing) const ADD_LDFLAGS = get(ENV, "ADD_LDFLAGS", nothing) +const USE_JEMALLOC = get(ENV, "USE_JEMALLOC", nothing) # "0" or "1" function get_cpucore() if haskey(ENV, "TRAVIS") # on travis-ci @@ -238,6 +239,9 @@ if !libmxnet_detected if ADD_LDFLAGS != nothing `sed -i -s "s@ADD_LDFLAGS =\(.*\)@ADD_LDFLAGS =\1 $ADD_LDFLAGS@" config.mk` end + if USE_JEMALLOC != nothing + `sed -i -s "s@USE_JEMALLOC =\(.*\)@USE_JEMALLOC = $USE_JEMALLOC@" config.mk` + end if USE_JULIA_BLAS `make -j$(get_cpucore()) USE_BLAS=$blas_name $MSHADOW_LDFLAGS` diff --git a/docs/src/user-guide/install.md b/docs/src/user-guide/install.md index dd1262b47c61..f1d5eeefacfe 100644 --- a/docs/src/user-guide/install.md +++ b/docs/src/user-guide/install.md @@ -37,6 +37,15 @@ There are several environment variables that change this behaviour. if you need to point non-standard include directory, please set it as `ENV["ADD_CFLAGS"] = "-I'/path/to/include/dir'"`. - `ADD_LDFLAGS`: Additional linker flags. +- `USE_JEMALLOC`: Default is enabled if jemalloc available. + If you ran into segfault cause by jemalloc, + Please try to disable it. + + ```julia + # first remove whole libmxnet source: Pkg.dir("MXNet", "deps", "src") + ENV["USE_JEMALLOC"] = "0" + Pkg.build("MXNet") + ``` The libmxnet source is downloaded to `Pkg.dir("MXNet", "deps", "src", "mxnet")`. 
The automatic build is using default configurations, with OpenCV disabled. From 0ccf8b482ae1b7772314829d6dd13319d122f295 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Tue, 3 Apr 2018 13:24:02 +0800 Subject: [PATCH 627/630] build: add `libmxnet.so` into lib search list. (#424) In case of macOS, if user build libmxnet from source set MXNET_HOME, the output is still named as `libmxnet.so`. Ref: dmlc/MXNet.jl#423 --- deps/build.jl | 4 +++- src/base.jl | 2 +- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/deps/build.jl b/deps/build.jl index a16afe6aaac0..da4beee76f5f 100644 --- a/deps/build.jl +++ b/deps/build.jl @@ -11,7 +11,9 @@ if haskey(ENV, "MXNET_HOME") MXNET_HOME = ENV["MXNET_HOME"] info("MXNET_HOME environment detected: $MXNET_HOME") info("Trying to load existing libmxnet...") - lib = Libdl.find_library("libmxnet.$(Libdl.dlext)", + # In case of macOS, if user build libmxnet from source and set the MXNET_HOME, + # the output is still named as `libmxnet.so`. + lib = Libdl.find_library(["libmxnet.$(Libdl.dlext)", "libmxnet.so"], [joinpath(MXNET_HOME, "lib"), MXNET_HOME]) if !isempty(lib) info("Existing libmxnet detected at $lib, skip building...") diff --git a/src/base.jl b/src/base.jl index a3dcbbf7fe35..212f24d6fe37 100644 --- a/src/base.jl +++ b/src/base.jl @@ -30,7 +30,7 @@ const grad_req_map = Dict{Symbol,GRAD_REQ}( ################################################################################ # Initialization and library API entrance ################################################################################ -const MXNET_LIB = Libdl.find_library("libmxnet.$(Libdl.dlext)", +const MXNET_LIB = Libdl.find_library(["libmxnet.$(Libdl.dlext)", "libmxnet.so"], # see build.jl [joinpath(get(ENV, "MXNET_HOME", ""), "lib"), get(ENV, "MXNET_HOME", ""), Pkg.dir("MXNet", "deps", "usr", "lib")]) From b74a51603be51619a0b275b8ff8420b4182e1a58 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 20 Aug 2018 18:14:09 +0800 Subject: [PATCH 628/630] Update 
README.md more about julia version --- README.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/README.md b/README.md index 26a20cf3a0db..0512b9a1aece 100644 --- a/README.md +++ b/README.md @@ -15,6 +15,8 @@ MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julia * Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. * Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. +The current support julia version is 0.6. Julia 0.7/1.0 is + Here is an example of how training a simple 3-layer MLP on MNIST looks like: ```julia From 224ae962db8ae252ce1ac317c6d4a2cfe67a7d77 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Mon, 20 Aug 2018 18:14:47 +0800 Subject: [PATCH 629/630] Typo in README --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 0512b9a1aece..59f74bdce5f0 100644 --- a/README.md +++ b/README.md @@ -15,7 +15,7 @@ MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julia * Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. * Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. -The current support julia version is 0.6. Julia 0.7/1.0 is +The current support julia version is 0.6. Julia 0.7/1.0 is not supported yet. 
Here is an example of how training a simple 3-layer MLP on MNIST looks like: From 9f8425b2774630f5442da257b306f4fa9afa8124 Mon Sep 17 00:00:00 2001 From: Iblis Lin Date: Sat, 29 Sep 2018 02:48:43 +0800 Subject: [PATCH 630/630] import Julia binding - enable Jenkins CI build for Julia - add license headers to Julia source code - update links for Julia README --- Jenkinsfile | 44 +++++++++++---- ci/docker/Dockerfile.build.ubuntu_cpu | 3 ++ ci/docker/install/ubuntu_julia.sh | 37 +++++++++++++ ci/docker/runtime_functions.sh | 54 +++++++++++++++++++ julia/README.md | 15 ++---- julia/appveyor.yml | 17 ++++++ julia/deps/build.jl | 21 +++++++- julia/deps/cblas.h | 19 +++++++ julia/deps/cpcblas.sh | 18 +++++++ julia/docs/Makefile | 17 ++++++ julia/docs/make.jl | 17 ++++++ julia/docs/mkdocs.yml | 17 ++++++ julia/examples/char-lstm/config.jl | 17 ++++++ julia/examples/char-lstm/lstm.jl | 17 ++++++ julia/examples/char-lstm/sampler.jl | 17 ++++++ julia/examples/char-lstm/seq-data.jl | 17 ++++++ julia/examples/char-lstm/train.jl | 17 ++++++ julia/examples/char-lstm/visualize.jl | 17 ++++++ julia/examples/cifar10/cifar10.jl | 17 ++++++ .../ijulia-pretrained-predict/imagehelper.py | 17 ++++++ julia/examples/mnist/lenet-stn.jl | 17 ++++++ julia/examples/mnist/lenet.jl | 17 ++++++ julia/examples/mnist/mlp-test.jl | 17 ++++++ julia/examples/mnist/mlp.jl | 17 ++++++ julia/examples/mnist/mnist-data.jl | 17 ++++++ julia/examples/nondefault-example.jl | 17 ++++++ julia/examples/regression-example.jl | 17 ++++++ julia/models/Inception/get.sh | 18 +++++++ julia/plugins/io/svmlight.jl | 17 ++++++ julia/src/MXNet.jl | 17 ++++++ julia/src/autograd.jl | 17 ++++++ julia/src/base.jl | 17 ++++++ julia/src/broadcast.jl | 17 ++++++ julia/src/callback.jl | 17 ++++++ julia/src/context.jl | 17 ++++++ julia/src/deprecated.jl | 17 ++++++ julia/src/executor.jl | 17 ++++++ julia/src/initializer.jl | 17 ++++++ julia/src/io.jl | 17 ++++++ julia/src/kvstore.jl | 17 ++++++ julia/src/metric.jl | 17 ++++++ 
julia/src/model.jl | 17 ++++++ julia/src/name.jl | 17 ++++++ julia/src/ndarray.jl | 17 ++++++ julia/src/nn-factory.jl | 17 ++++++ julia/src/optimizer.jl | 17 ++++++ julia/src/optimizers/adadelta.jl | 17 ++++++ julia/src/optimizers/adagrad.jl | 17 ++++++ julia/src/optimizers/adam.jl | 17 ++++++ julia/src/optimizers/adamax.jl | 17 ++++++ julia/src/optimizers/nadam.jl | 17 ++++++ julia/src/optimizers/rmsprop.jl | 17 ++++++ julia/src/optimizers/sgd.jl | 17 ++++++ julia/src/random.jl | 17 ++++++ julia/src/symbolic-node.jl | 17 ++++++ julia/src/util.jl | 17 ++++++ julia/src/visualize.jl | 17 ++++++ julia/test/common.jl | 17 ++++++ julia/test/runtests.jl | 17 ++++++ julia/test/travis/run_coverage.sh | 19 ++++++- julia/test/travis/run_test.sh | 18 +++++++ julia/test/travis/setup_env.sh | 18 +++++++ julia/test/unittest/autograd.jl | 17 ++++++ julia/test/unittest/bind.jl | 17 ++++++ julia/test/unittest/initializer.jl | 17 ++++++ julia/test/unittest/io.jl | 17 ++++++ julia/test/unittest/kvstore.jl | 17 ++++++ julia/test/unittest/metric.jl | 17 ++++++ julia/test/unittest/model.jl | 17 ++++++ julia/test/unittest/name.jl | 17 ++++++ julia/test/unittest/ndarray.jl | 17 ++++++ julia/test/unittest/operator.jl | 17 ++++++ julia/test/unittest/optimizer.jl | 17 ++++++ julia/test/unittest/random.jl | 17 ++++++ julia/test/unittest/symbolic-node.jl | 21 ++++++-- julia/test/unittest/util.jl | 17 ++++++ julia/test/unittest/visualize.jl | 17 ++++++ .../apache_rat_license_check/rat-excludes | 1 + tools/license_header.py | 6 ++- 79 files changed, 1371 insertions(+), 29 deletions(-) create mode 100755 ci/docker/install/ubuntu_julia.sh diff --git a/Jenkinsfile b/Jenkinsfile index 81a25deca27b..af059c58e830 100644 --- a/Jenkinsfile +++ b/Jenkinsfile @@ -89,6 +89,30 @@ def python3_gpu_ut_nocudnn(docker_container_name) { } } +def deploy_docs() { + parallel 'Docs': { + node(NODE_LINUX_CPU) { + ws('workspace/docs') { + timeout(time: max_time, unit: 'MINUTES') { + utils.init_git() + 
utils.docker_run('ubuntu_cpu', 'deploy_docs', false) + sh "ci/other/ci_deploy_doc.sh ${env.BRANCH_NAME} ${env.BUILD_NUMBER}" + } + } + } + }, + 'Julia docs': { + node(NODE_LINUX_CPU) { + ws('workspace/julia-docs') { + timeout(time: max_time, unit: 'MINUTES') { + utils.unpack_and_init('cpu', mx_lib) + utils.docker_run('ubuntu_cpu', 'deploy_jl_docs', false) + } + } + } + } +} + node('mxnetlinux-cpu') { // Loading the utilities requires a node context unfortunately checkout scm @@ -746,6 +770,16 @@ core_logic: { } } }, + 'Julia 0.6: CPU': { + node(NODE_LINUX_CPU) { + ws('workspace/ut-julia06-cpu') { + timeout(time: max_time, unit: 'MINUTES') { + utils.unpack_and_init('cpu', mx_lib) + utils.docker_run('ubuntu_cpu', 'unittest_ubuntu_cpu_julia06', false) + } + } + } + }, 'Python 2: CPU Win':{ node(NODE_WINDOWS_CPU) { @@ -911,15 +945,7 @@ core_logic: { } stage('Deploy') { - node(NODE_LINUX_CPU) { - ws('workspace/docs') { - timeout(time: max_time, unit: 'MINUTES') { - utils.init_git() - utils.docker_run('ubuntu_cpu', 'deploy_docs', false) - sh "ci/other/ci_deploy_doc.sh ${env.BRANCH_NAME} ${env.BUILD_NUMBER}" - } - } - } + deploy_docs() } } , diff --git a/ci/docker/Dockerfile.build.ubuntu_cpu b/ci/docker/Dockerfile.build.ubuntu_cpu index f45c8da4af87..7c7e2240ee61 100755 --- a/ci/docker/Dockerfile.build.ubuntu_cpu +++ b/ci/docker/Dockerfile.build.ubuntu_cpu @@ -45,6 +45,9 @@ RUN /work/ubuntu_r.sh COPY install/ubuntu_perl.sh /work/ RUN /work/ubuntu_perl.sh +COPY install/ubuntu_julia.sh /work/ +RUN /work/ubuntu_julia.sh + COPY install/ubuntu_clang.sh /work/ RUN /work/ubuntu_clang.sh diff --git a/ci/docker/install/ubuntu_julia.sh b/ci/docker/install/ubuntu_julia.sh new file mode 100755 index 000000000000..62013e36d8fd --- /dev/null +++ b/ci/docker/install/ubuntu_julia.sh @@ -0,0 +1,37 @@ +#!/bin/bash + +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +# build and install are separated so changes to build don't invalidate +# the whole docker cache for the image + +set -ex + +export JLBINARY='julia.tar.gz' +export JULIADIR='/work/julia' +export JULIA="${JULIADIR}/bin/julia" + +mkdir -p $JULIADIR +# The julia version in Ubuntu repo is too old +# We download the tarball from the official link: +# https://julialang.org/downloads/ +wget -O $JLBINARY https://julialang-s3.julialang.org/bin/linux/x64/0.6/julia-0.6.2-linux-x86_64.tar.gz +tar xzvf $JLBINARY -C $JULIADIR --strip 1 +rm $JLBINARY + +$JULIA -e 'versioninfo()' diff --git a/ci/docker/runtime_functions.sh b/ci/docker/runtime_functions.sh index d1fc2239a442..96b1646eff97 100755 --- a/ci/docker/runtime_functions.sh +++ b/ci/docker/runtime_functions.sh @@ -816,6 +816,35 @@ unittest_ubuntu_gpu_R() { make rpkgtest R_LIBS=/tmp/r-site-library R_GPU_ENABLE=1 } +unittest_ubuntu_cpu_julia06() { + set -ex + export PATH="/work/julia/bin:$PATH" + export MXNET_HOME='/work/mxnet' + export JULIA_PKGDIR='/work/julia-pkg' + export DEPDIR=`julia -e 'print(Pkg.dir())'` + + julia -e 'versioninfo()' + julia -e 'Pkg.init()' + + # install package + ln -sf ${MXNET_HOME}/julia ${DEPDIR}/MXNet + + # install dependencies + julia -e 'Pkg.resolve()' + + # FIXME + export 
LD_PRELOAD='/usr/lib/x86_64-linux-gnu/libjemalloc.so' + + # use the prebuilt binary from $MXNET_HOME/lib + julia -e 'Pkg.build("MXNet")' + + # run the script `julia/test/runtests.jl` + julia -e 'Pkg.test("MXNet")' + + # See https://github.com/dmlc/MXNet.jl/pull/303#issuecomment-341171774 + julia -e 'using MXNet; mx._sig_checker()' +} + unittest_centos7_cpu() { set -ex cd /work/mxnet @@ -1090,6 +1119,31 @@ deploy_docs() { popd } +deploy_jl_docs() { + set -ex + export PATH="/work/julia/bin:$PATH" + export MXNET_HOME='/work/mxnet' + export JULIA_PKGDIR='/work/julia-pkg' + export DEPDIR=`julia -e 'print(Pkg.dir())'` + + julia -e 'versioninfo()' + julia -e 'Pkg.init()' + ln -sf ${MXNET_HOME}/julia ${DEPDIR}/MXNet + julia -e 'Pkg.resolve()' + + # FIXME + export LD_PRELOAD='/usr/lib/x86_64-linux-gnu/libjemalloc.so' + + # use the prebuilt binary from $MXNET_HOME/lib + julia -e 'Pkg.build("MXNet")' + # build docs + julia -e 'Pkg.add("Documenter")' + julia -e 'cd(Pkg.dir("MXNet")); include(joinpath("docs", "make.jl"))' + + # TODO: make Jenkins worker push to MXNet.jl ph-pages branch if master build + # ... 
+} + # broken_link_checker broken_link_checker() { diff --git a/julia/README.md b/julia/README.md index 59f74bdce5f0..a4299575f95e 100644 --- a/julia/README.md +++ b/julia/README.md @@ -1,23 +1,14 @@ # MXNet -[![Build Status](https://travis-ci.org/dmlc/MXNet.jl.svg?branch=master)](https://travis-ci.org/dmlc/MXNet.jl) -[![Windows Build](https://ci.appveyor.com/api/projects/status/re90njols2th2ide?svg=true)](https://ci.appveyor.com/project/pluskid/mxnet-jl) -[![codecov.io](https://codecov.io/github/dmlc/MXNet.jl/coverage.svg?branch=master)](https://codecov.io/github/dmlc/MXNet.jl?branch=master) -[![](https://img.shields.io/badge/docs-latest-blue.svg)](https://dmlc.github.io/MXNet.jl/latest) -[![](https://img.shields.io/badge/docs-stable-blue.svg)](https://dmlc.github.io/MXNet.jl/stable) [![MXNet](http://pkg.julialang.org/badges/MXNet_0.6.svg)](http://pkg.julialang.org/?pkg=MXNet) -[![License](http://dmlc.github.io/img/apache2.svg)](LICENSE.md) -[![Join the chat at https://gitter.im/dmlc/mxnet](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/dmlc/mxnet) -MXNet.jl is the [dmlc/mxnet](https://github.com/dmlc/mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of its features include: +MXNet.jl is the [dmlc/mxnet](https://github.com/apache/incubator-mxnet) [Julia](http://julialang.org/) package. MXNet.jl brings flexible and efficient GPU computing and state-of-art deep learning to Julia. Some highlight of its features include: * Efficient tensor/matrix computation across multiple devices, including multiple CPUs, GPUs and distributed server nodes. -* Flexible symbolic manipulation to composite and construct state-of-the-art deep learning models. +* Flexible symbolic manipulation to composite and construction of state-of-the-art deep learning models. -The current support julia version is 0.6. Julia 0.7/1.0 is not supported yet. 
- -Here is an example of how training a simple 3-layer MLP on MNIST looks like: +Here is an example of how training a simple 3-layer MLP on MNIST: ```julia using MXNet diff --git a/julia/appveyor.yml b/julia/appveyor.yml index 449465246eff..50e275cfa8a8 100644 --- a/julia/appveyor.yml +++ b/julia/appveyor.yml @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + environment: matrix: - JULIA_URL: "https://julialang-s3.julialang.org/bin/winnt/x64/0.6/julia-0.6-latest-win64.exe" diff --git a/julia/deps/build.jl b/julia/deps/build.jl index da4beee76f5f..bdc33be8c79b 100644 --- a/julia/deps/build.jl +++ b/julia/deps/build.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + import JSON ################################################################################ @@ -5,7 +22,7 @@ import JSON ################################################################################ libmxnet_detected = false libmxnet_curr_ver = get(ENV, "MXNET_COMMIT", "master") -curr_win = "20171019" # v0.12.0 +curr_win = "20180211" # v1.1.0 if haskey(ENV, "MXNET_HOME") MXNET_HOME = ENV["MXNET_HOME"] @@ -171,7 +188,7 @@ if !libmxnet_detected @build_steps begin BinDeps.DirectoryRule(_mxdir, @build_steps begin ChangeDirectory(_srcdir) - `git clone https://github.com/dmlc/mxnet` + `git clone https://github.com/apache/incubator-mxnet` end) @build_steps begin ChangeDirectory(_mxdir) diff --git a/julia/deps/cblas.h b/julia/deps/cblas.h index 98a02f4fa968..d9449dc8e21d 100644 --- a/julia/deps/cblas.h +++ b/julia/deps/cblas.h @@ -1,3 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. 
See the License for the + * specific language governing permissions and limitations + * under the License. + */ + #ifndef CBLAS_H #define CBLAS_H diff --git a/julia/deps/cpcblas.sh b/julia/deps/cpcblas.sh index 1a592186b49c..99342897a58c 100755 --- a/julia/deps/cpcblas.sh +++ b/julia/deps/cpcblas.sh @@ -1,5 +1,23 @@ #!/bin/sh +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + + # be invoked from build.jl set -e diff --git a/julia/docs/Makefile b/julia/docs/Makefile index d1cadf2e487b..57c623889a83 100644 --- a/julia/docs/Makefile +++ b/julia/docs/Makefile @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + all: julia --color=yes ./make.jl mkdocs build diff --git a/julia/docs/make.jl b/julia/docs/make.jl index 0a2b01d25cc8..6e3705a95fdc 100644 --- a/julia/docs/make.jl +++ b/julia/docs/make.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + using Documenter, MXNet makedocs( diff --git a/julia/docs/mkdocs.yml b/julia/docs/mkdocs.yml index e636a194196d..24281730885f 100644 --- a/julia/docs/mkdocs.yml +++ b/julia/docs/mkdocs.yml @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. 
The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + site_name: MXNet.jl repo_url: https://github.com/dmlc/MXNet.jl diff --git a/julia/examples/char-lstm/config.jl b/julia/examples/char-lstm/config.jl index b5961549675f..c6ed0ff63b3c 100644 --- a/julia/examples/char-lstm/config.jl +++ b/julia/examples/char-lstm/config.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ const DROPOUT = 0 const BATCH_SIZE = 32 const SEQ_LENGTH = 32 diff --git a/julia/examples/char-lstm/lstm.jl b/julia/examples/char-lstm/lstm.jl index de6748df9420..fc4bcc4b6a91 100644 --- a/julia/examples/char-lstm/lstm.jl +++ b/julia/examples/char-lstm/lstm.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + # An explicitly unrolled LSTM with fixed sequence length. using MXNet diff --git a/julia/examples/char-lstm/sampler.jl b/julia/examples/char-lstm/sampler.jl index df4647f4f893..1a4aada22957 100644 --- a/julia/examples/char-lstm/sampler.jl +++ b/julia/examples/char-lstm/sampler.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + include(joinpath(@__DIR__, "config.jl")) include(joinpath(@__DIR__, "lstm.jl")) include(joinpath(@__DIR__, "seq-data.jl")) diff --git a/julia/examples/char-lstm/seq-data.jl b/julia/examples/char-lstm/seq-data.jl index 1456ae94a1a3..3489e5bc3c39 100644 --- a/julia/examples/char-lstm/seq-data.jl +++ b/julia/examples/char-lstm/seq-data.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + # Simple data provider that load text using Iterators using MXNet diff --git a/julia/examples/char-lstm/train.jl b/julia/examples/char-lstm/train.jl index 8b7a682c9560..57bfeb6b6e11 100644 --- a/julia/examples/char-lstm/train.jl +++ b/julia/examples/char-lstm/train.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + include(joinpath(@__DIR__, "config.jl")) include(joinpath(@__DIR__, "lstm.jl")) include(joinpath(@__DIR__, "seq-data.jl")) diff --git a/julia/examples/char-lstm/visualize.jl b/julia/examples/char-lstm/visualize.jl index acf757515005..e2a2c87c9c10 100644 --- a/julia/examples/char-lstm/visualize.jl +++ b/julia/examples/char-lstm/visualize.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ include(joinpath(dirname(@__FILE__), "config.jl")) include(joinpath(dirname(@__FILE__), "lstm.jl")) diff --git a/julia/examples/cifar10/cifar10.jl b/julia/examples/cifar10/cifar10.jl index 5d3d2eeafe41..a00664ce3a50 100644 --- a/julia/examples/cifar10/cifar10.jl +++ b/julia/examples/cifar10/cifar10.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + using MXNet #-------------------------------------------------------------------------------- diff --git a/julia/examples/imagenet/ijulia-pretrained-predict/imagehelper.py b/julia/examples/imagenet/ijulia-pretrained-predict/imagehelper.py index 7584b45d9313..dddef7415f45 100644 --- a/julia/examples/imagenet/ijulia-pretrained-predict/imagehelper.py +++ b/julia/examples/imagenet/ijulia-pretrained-predict/imagehelper.py @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + import numpy as np from skimage import io, transform diff --git a/julia/examples/mnist/lenet-stn.jl b/julia/examples/mnist/lenet-stn.jl index ae94bf9b16f7..95cd0955d402 100644 --- a/julia/examples/mnist/lenet-stn.jl +++ b/julia/examples/mnist/lenet-stn.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + using MXNet #-------------------------------------------------------------------------------- diff --git a/julia/examples/mnist/lenet.jl b/julia/examples/mnist/lenet.jl index 64bcdea9cba9..5ee15d69dd1b 100644 --- a/julia/examples/mnist/lenet.jl +++ b/julia/examples/mnist/lenet.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + using MXNet #-------------------------------------------------------------------------------- diff --git a/julia/examples/mnist/mlp-test.jl b/julia/examples/mnist/mlp-test.jl index dac2c9cd84eb..1af84ed3ba8a 100644 --- a/julia/examples/mnist/mlp-test.jl +++ b/julia/examples/mnist/mlp-test.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + # This file is primarily to be included from runtest.jl. We tried to cover various # features of MXNet.jl in this example in order to detect regression errors. 
diff --git a/julia/examples/mnist/mlp.jl b/julia/examples/mnist/mlp.jl index 8a73d2aa7637..20facc9b71b3 100644 --- a/julia/examples/mnist/mlp.jl +++ b/julia/examples/mnist/mlp.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + using MXNet #-------------------------------------------------------------------------------- diff --git a/julia/examples/mnist/mnist-data.jl b/julia/examples/mnist/mnist-data.jl index 7349152617f9..12160cf6f18e 100644 --- a/julia/examples/mnist/mnist-data.jl +++ b/julia/examples/mnist/mnist-data.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + function get_mnist_providers(batch_size::Int; data_name=:data, label_name=:softmax_label, flat=true) # download MNIST into Pkg.dir("MXNet")/data/mnist if not exist filenames = mx.get_mnist_ubyte() diff --git a/julia/examples/nondefault-example.jl b/julia/examples/nondefault-example.jl index b93887850ca3..75eff085a459 100644 --- a/julia/examples/nondefault-example.jl +++ b/julia/examples/nondefault-example.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + #= Contents: This file contains code for: - Setting the initial values of the biases and weights equal to the final values of a previous run. 
diff --git a/julia/examples/regression-example.jl b/julia/examples/regression-example.jl index 7d05baf3c632..bbbb415fe664 100644 --- a/julia/examples/regression-example.jl +++ b/julia/examples/regression-example.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + #= This script shows how a simple MLP net may be used for regression. It shows how data in memory may be diff --git a/julia/models/Inception/get.sh b/julia/models/Inception/get.sh index dfd3701bd0b4..16452a361d98 100755 --- a/julia/models/Inception/get.sh +++ b/julia/models/Inception/get.sh @@ -1,4 +1,22 @@ #!/bin/bash +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + + wget -c http://data.dmlc.ml/mxnet/data/Inception.zip unzip Inception.zip diff --git a/julia/plugins/io/svmlight.jl b/julia/plugins/io/svmlight.jl index 46b79743b87f..f9d9b2ec83db 100644 --- a/julia/plugins/io/svmlight.jl +++ b/julia/plugins/io/svmlight.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + #=doc SVMLight / LibSVM is a popular data format for sparse features. Some preprocessed datasets in this format could be found at http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/ diff --git a/julia/src/MXNet.jl b/julia/src/MXNet.jl index a22e4040fece..03c3cb89b530 100644 --- a/julia/src/MXNet.jl +++ b/julia/src/MXNet.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + __precompile__() module MXNet diff --git a/julia/src/autograd.jl b/julia/src/autograd.jl index 4584decb0a52..72fb82ba1bbb 100644 --- a/julia/src/autograd.jl +++ b/julia/src/autograd.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ # Autograd for NDArray # this is a port of Python's autograd module # https://github.com/apache/incubator-mxnet/blob/master/python/mxnet/autograd.py diff --git a/julia/src/base.jl b/julia/src/base.jl index 212f24d6fe37..ce1c183eafb5 100644 --- a/julia/src/base.jl +++ b/julia/src/base.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + "Exception thrown when an error occurred calling MXNet API." struct MXError <: Exception msg :: AbstractString diff --git a/julia/src/broadcast.jl b/julia/src/broadcast.jl index 1b58addec321..fee960a46271 100644 --- a/julia/src/broadcast.jl +++ b/julia/src/broadcast.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + using TakingBroadcastSeriously: Broadcasted, unwrap for f in :[%, diff --git a/julia/src/callback.jl b/julia/src/callback.jl index 16e44fdc632d..06e431de06d0 100644 --- a/julia/src/callback.jl +++ b/julia/src/callback.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + """ AbstractCallback diff --git a/julia/src/context.jl b/julia/src/context.jl index 2b83eebe97a7..c97522b3b846 100644 --- a/julia/src/context.jl +++ b/julia/src/context.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. 
The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + @enum CONTEXT_TYPE CPU=1 GPU=2 CPU_PINNED=3 """ diff --git a/julia/src/deprecated.jl b/julia/src/deprecated.jl index 67b1707cdee6..12c5345aa198 100644 --- a/julia/src/deprecated.jl +++ b/julia/src/deprecated.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ # NDArray reshape (#272) @deprecate reshape(arr::NDArray; shape=()) reshape(arr, shape) @deprecate Reshape(arr::NDArray; shape=()) reshape(arr, shape) diff --git a/julia/src/executor.jl b/julia/src/executor.jl index c99517b6d76b..4bf4339d65d1 100644 --- a/julia/src/executor.jl +++ b/julia/src/executor.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + import Base: bind """ diff --git a/julia/src/initializer.jl b/julia/src/initializer.jl index 188c5deb6255..95dbeb31febd 100644 --- a/julia/src/initializer.jl +++ b/julia/src/initializer.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + """ AbstractInitializer diff --git a/julia/src/io.jl b/julia/src/io.jl index c8dbee9b8e1a..e5f43950754c 100644 --- a/julia/src/io.jl +++ b/julia/src/io.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + """ AbstractDataProvider diff --git a/julia/src/kvstore.jl b/julia/src/kvstore.jl index 755d6f3d1b20..ac0367144384 100644 --- a/julia/src/kvstore.jl +++ b/julia/src/kvstore.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + import Base.push! """ diff --git a/julia/src/metric.jl b/julia/src/metric.jl index 489df2ddd8b2..772eb3b3e680 100644 --- a/julia/src/metric.jl +++ b/julia/src/metric.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + """ AbstractEvalMetric diff --git a/julia/src/model.jl b/julia/src/model.jl index a9febc922ec6..109cb35e38a6 100644 --- a/julia/src/model.jl +++ b/julia/src/model.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + """ AbstractModel diff --git a/julia/src/name.jl b/julia/src/name.jl index d281770eb357..8180886c869c 100644 --- a/julia/src/name.jl +++ b/julia/src/name.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + abstract type AbstractNameManager end const NameType = Union{Base.Symbol, AbstractString} const NameCounter = Dict{Base.Symbol, Int} diff --git a/julia/src/ndarray.jl b/julia/src/ndarray.jl index d2ceb8498ca0..9e47150a1a00 100644 --- a/julia/src/ndarray.jl +++ b/julia/src/ndarray.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. 
The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + # All the types supported by mshadow. See `mshadow/base.h` const DType = Union{Float32, Float64, Float16, UInt8, Int32, Int8, Int64} @enum TypeFlag kFloat32 kFloat64 kFloat16 kUint8 kInt32 kInt8 kInt64 diff --git a/julia/src/nn-factory.jl b/julia/src/nn-factory.jl index ab88d21adf29..b5134f9d2bd5 100644 --- a/julia/src/nn-factory.jl +++ b/julia/src/nn-factory.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ """ MLP(input, spec; hidden_activation = :relu, prefix) diff --git a/julia/src/optimizer.jl b/julia/src/optimizer.jl index 06f93a5942d2..6436878df678 100644 --- a/julia/src/optimizer.jl +++ b/julia/src/optimizer.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + ############################################################################### # Types ############################################################################### diff --git a/julia/src/optimizers/adadelta.jl b/julia/src/optimizers/adadelta.jl index 9fee3517a3cb..2b0cd0060261 100644 --- a/julia/src/optimizers/adadelta.jl +++ b/julia/src/optimizers/adadelta.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + doc""" AdaDelta(; kwargs...) diff --git a/julia/src/optimizers/adagrad.jl b/julia/src/optimizers/adagrad.jl index c72bac1e3b7e..4236cb8cda20 100644 --- a/julia/src/optimizers/adagrad.jl +++ b/julia/src/optimizers/adagrad.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + doc""" AdaGrad(; kwargs...) diff --git a/julia/src/optimizers/adam.jl b/julia/src/optimizers/adam.jl index 0d5c1a23850d..c6aa99ba71fb 100644 --- a/julia/src/optimizers/adam.jl +++ b/julia/src/optimizers/adam.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. 
The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + """ ADAM diff --git a/julia/src/optimizers/adamax.jl b/julia/src/optimizers/adamax.jl index 87ef0aa68831..de6a1ab759b3 100644 --- a/julia/src/optimizers/adamax.jl +++ b/julia/src/optimizers/adamax.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + """ AdaMax(; kwargs...) diff --git a/julia/src/optimizers/nadam.jl b/julia/src/optimizers/nadam.jl index 524465ecb984..fdcd1ea7e7ab 100644 --- a/julia/src/optimizers/nadam.jl +++ b/julia/src/optimizers/nadam.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + doc""" Nadam(; kwargs...) diff --git a/julia/src/optimizers/rmsprop.jl b/julia/src/optimizers/rmsprop.jl index 3c51835300c4..8351142681b1 100644 --- a/julia/src/optimizers/rmsprop.jl +++ b/julia/src/optimizers/rmsprop.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + doc""" RMSProp(; kwargs...) 
diff --git a/julia/src/optimizers/sgd.jl b/julia/src/optimizers/sgd.jl index 9da9f1a0b72b..dfd3d954baa3 100644 --- a/julia/src/optimizers/sgd.jl +++ b/julia/src/optimizers/sgd.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + doc""" SGD(; kwargs...) diff --git a/julia/src/random.jl b/julia/src/random.jl index 1f612e310fe8..b9b32a42ecff 100644 --- a/julia/src/random.jl +++ b/julia/src/random.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ """ rand!(x::NDArray; low = 0, high = 1) diff --git a/julia/src/symbolic-node.jl b/julia/src/symbolic-node.jl index bb3c97773488..508f9d449028 100644 --- a/julia/src/symbolic-node.jl +++ b/julia/src/symbolic-node.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + """ SymbolicNode diff --git a/julia/src/util.jl b/julia/src/util.jl index c4f5e63244dd..c07c9ec910fb 100644 --- a/julia/src/util.jl +++ b/julia/src/util.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ ################################################################################ # Dataset related utilities ################################################################################ diff --git a/julia/src/visualize.jl b/julia/src/visualize.jl index 91bbd0c48481..b41db7e9e5a7 100644 --- a/julia/src/visualize.jl +++ b/julia/src/visualize.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + import JSON """ diff --git a/julia/test/common.jl b/julia/test/common.jl index 5854fc6659d0..5ac5f905143a 100644 --- a/julia/test/common.jl +++ b/julia/test/common.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + ################################################################################ # Common models used in testing ################################################################################ diff --git a/julia/test/runtests.jl b/julia/test/runtests.jl index eb05ff2f5ca4..8b46bfda6726 100644 --- a/julia/test/runtests.jl +++ b/julia/test/runtests.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ using MXNet using Base.Test diff --git a/julia/test/travis/run_coverage.sh b/julia/test/travis/run_coverage.sh index 73816fac7b98..ee22b258b549 100644 --- a/julia/test/travis/run_coverage.sh +++ b/julia/test/travis/run_coverage.sh @@ -1 +1,18 @@ -julia -e 'cd(Pkg.dir("MXNet")); Pkg.add("Coverage"); using Coverage; Codecov.submit(process_folder())' \ No newline at end of file +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +julia -e 'cd(Pkg.dir("MXNet")); Pkg.add("Coverage"); using Coverage; Codecov.submit(process_folder())' diff --git a/julia/test/travis/run_test.sh b/julia/test/travis/run_test.sh index bf726eb49157..414b1450b554 100755 --- a/julia/test/travis/run_test.sh +++ b/julia/test/travis/run_test.sh @@ -1,4 +1,22 @@ #!/bin/bash + +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + set -e if [[ -a .git/shallow ]]; then git fetch --unshallow; fi diff --git a/julia/test/travis/setup_env.sh b/julia/test/travis/setup_env.sh index 4bae93243949..9d2f7341998d 100755 --- a/julia/test/travis/setup_env.sh +++ b/julia/test/travis/setup_env.sh @@ -1,5 +1,23 @@ #!/bin/bash +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + + echo "##########################" echo $TRAVIS_OS_NAME diff --git a/julia/test/unittest/autograd.jl b/julia/test/unittest/autograd.jl index 12c1022bd208..96f275b626af 100644 --- a/julia/test/unittest/autograd.jl +++ b/julia/test/unittest/autograd.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. 
The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestAutoGrad using Base.Test diff --git a/julia/test/unittest/bind.jl b/julia/test/unittest/bind.jl index 3bac43f2345c..538b556bf474 100644 --- a/julia/test/unittest/bind.jl +++ b/julia/test/unittest/bind.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestBind using MXNet using Base.Test diff --git a/julia/test/unittest/initializer.jl b/julia/test/unittest/initializer.jl index 750959f2eb20..fa528c9f8e13 100644 --- a/julia/test/unittest/initializer.jl +++ b/julia/test/unittest/initializer.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + @testset "Initializers" begin @testset "Bilinear initializer" begin # Setup a filter with scale = 2 diff --git a/julia/test/unittest/io.jl b/julia/test/unittest/io.jl index f8e558613c99..81f2ff79a83b 100644 --- a/julia/test/unittest/io.jl +++ b/julia/test/unittest/io.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ module TestIO using MXNet diff --git a/julia/test/unittest/kvstore.jl b/julia/test/unittest/kvstore.jl index 89af95203c90..96e1643d8d83 100644 --- a/julia/test/unittest/kvstore.jl +++ b/julia/test/unittest/kvstore.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestKVStore using MXNet using Base.Test diff --git a/julia/test/unittest/metric.jl b/julia/test/unittest/metric.jl index ca51f83671d9..32c4538b608c 100644 --- a/julia/test/unittest/metric.jl +++ b/julia/test/unittest/metric.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. 
See the License for the +# specific language governing permissions and limitations +# under the License. + module TestMetric using MXNet diff --git a/julia/test/unittest/model.jl b/julia/test/unittest/model.jl index 86a3a6f131ec..dbe97093dc68 100644 --- a/julia/test/unittest/model.jl +++ b/julia/test/unittest/model.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestModel using Base.Test diff --git a/julia/test/unittest/name.jl b/julia/test/unittest/name.jl index 9287bf087074..eea73efb43c9 100644 --- a/julia/test/unittest/name.jl +++ b/julia/test/unittest/name.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestNameManager using MXNet using Base.Test diff --git a/julia/test/unittest/ndarray.jl b/julia/test/unittest/ndarray.jl index 891dffd0f390..3bacbb009dfc 100644 --- a/julia/test/unittest/ndarray.jl +++ b/julia/test/unittest/ndarray.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestNDArray using MXNet diff --git a/julia/test/unittest/operator.jl b/julia/test/unittest/operator.jl index 85fc7c6238e9..ed8312d91cc9 100644 --- a/julia/test/unittest/operator.jl +++ b/julia/test/unittest/operator.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. 
The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestOperator using MXNet diff --git a/julia/test/unittest/optimizer.jl b/julia/test/unittest/optimizer.jl index 664d53d6421a..b068f12fffd7 100644 --- a/julia/test/unittest/optimizer.jl +++ b/julia/test/unittest/optimizer.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestOptimizer using Base.Test diff --git a/julia/test/unittest/random.jl b/julia/test/unittest/random.jl index 34b9d3625c0d..973a4bc32faa 100644 --- a/julia/test/unittest/random.jl +++ b/julia/test/unittest/random.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestRandom using MXNet using Base.Test diff --git a/julia/test/unittest/symbolic-node.jl b/julia/test/unittest/symbolic-node.jl index e3e003d296af..507af17332f8 100644 --- a/julia/test/unittest/symbolic-node.jl +++ b/julia/test/unittest/symbolic-node.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestSymbolicNode using MXNet @@ -137,10 +154,8 @@ function test_attrs() data2 = mx.Variable(:data2, attrs = Dict(:test => "hallo!")) @test get(mx.get_attr(data2, :test)) == "hallo!" 
- conv = mx.Convolution(data2, kernel = (1,1), num_filter = 1, attrs = Dict(:a => "a", :π => "π")) + conv = mx.Convolution(data2, kernel = (1,1), num_filter = 1) @test isnull(mx.get_attr(conv, :b)) - @test get(mx.get_attr(conv, :a)) == "a" - @test get(mx.get_attr(conv, :π)) == "π" @test isa(mx.get_name(conv), Symbol) @test_throws MethodError mx.Variable(:data3, attrs = Dict(:test => "1.0", :test2 => 1.0)) diff --git a/julia/test/unittest/util.jl b/julia/test/unittest/util.jl index 0e6107ca0acc..ddd613ca48ea 100644 --- a/julia/test/unittest/util.jl +++ b/julia/test/unittest/util.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestUtil using Base.Test diff --git a/julia/test/unittest/visualize.jl b/julia/test/unittest/visualize.jl index f4ccbf0e5a81..58d111b0fe14 100644 --- a/julia/test/unittest/visualize.jl +++ b/julia/test/unittest/visualize.jl @@ -1,3 +1,20 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. 
The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + module TestVisualize using MXNet using Base.Test diff --git a/tests/nightly/apache_rat_license_check/rat-excludes b/tests/nightly/apache_rat_license_check/rat-excludes index 301a342f4664..0c305f498b34 100755 --- a/tests/nightly/apache_rat_license_check/rat-excludes +++ b/tests/nightly/apache_rat_license_check/rat-excludes @@ -57,3 +57,4 @@ apache-rat-tasks/* moderngpu/* deformable_im2col.cuh deformable_im2col.h +REQUIRE diff --git a/tools/license_header.py b/tools/license_header.py index 7aef33b71213..f6726891f521 100755 --- a/tools/license_header.py +++ b/tools/license_header.py @@ -76,13 +76,15 @@ 'example/rcnn/rcnn/cython/nms_kernel.cu', 'prepare_mkl.sh', 'example/image-classification/predict-cpp/image-classification-predict.cc', - 'src/operator/contrib/ctc_include/'] + 'src/operator/contrib/ctc_include/', + 'julia/REQUIRE'] # language extensions and the according commment mark _LANGS = {'.cc':'*', '.h':'*', '.cu':'*', '.cuh':'*', '.py':'#', '.pm':'#', '.scala':'*', '.cc':'*', '.sh':'#', '.cmake':'#', '.java':'*', '.sh':'#', '.cpp':'*', '.hpp':'*', '.c':'*', - '.bat':'rem', '.pl':'#', '.m':'%', '.R':'#', '.mk':'#', '.cfg':'#', '.t':'#', '.ps1': '#'} + '.bat':'rem', '.pl':'#', '.m':'%', '.R':'#', '.mk':'#', '.cfg':'#', + '.t':'#', '.ps1':'#', '.jl':'#'} # Previous license header, which will be removed _OLD_LICENSE = re.compile('.*Copyright.*by Contributors')