view org/vision.org @ 171:15bde60217aa

updated docstring for vision-fn
author Robert McIntyre <rlm@mit.edu>
date Sat, 04 Feb 2012 05:02:25 -0700
parents 1a00b4918529
children 04a39e6bb695
line wrap: on
line source
1 #+title: Simulated Sense of Sight
2 #+author: Robert McIntyre
3 #+email: rlm@mit.edu
4 #+description: Simulated sight for AI research using JMonkeyEngine3 and clojure
5 #+keywords: computer vision, jMonkeyEngine3, clojure
6 #+SETUPFILE: ../../aurellem/org/setup.org
7 #+INCLUDE: ../../aurellem/org/level-0.org
8 #+babel: :mkdirp yes :noweb yes :exports both
10 * COMMENT Vision
12 I want to make creatures with eyes. Each eye can be independently moved
13 and should see its own version of the world depending on where it is.
15 Here's how vision will work.
17 Make the continuation in scene-processor take FrameBuffer,
18 byte-buffer, BufferedImage already sized to the correct
19 dimensions. The continuation will decide whether to "mix" them
20 into the BufferedImage, lazily ignore them, or mix them halfway
21 and call c/graphics card routines.
23 (vision creature) will take an optional :skip argument which will
24 inform the continuations in scene processor to skip the given
25 number of cycles; 0 means that no cycles will be skipped.
27 (vision creature) will return [init-functions sensor-functions].
28 The init-functions are each single-arg functions that take the
29 world and register the cameras and must each be called before the
30 corresponding sensor-functions. Each init-function returns the
31 viewport for that eye which can be manipulated, saved, etc. Each
32 sensor-function is a thunk and will return data in the same
33 format as the tactile-sensor functions; the structure is
34 [topology, sensor-data]. Internally, these sensor-functions
35 maintain a reference to sensor-data which is periodically updated
36 by the continuation function established by its init-function.
37 They can be queried every cycle, but their information may not
38 necessarily be different every cycle.
40 Each eye in the creature in blender will work the same way as
41 joints -- a zero dimensional object with no geometry whose local
42 coordinate system determines the orientation of the resulting
43 eye. All eyes will have a parent named "eyes" just as all joints
44 have a parent named "joints". The resulting camera will be a
45 ChaseCamera or a CameraNode bound to the geo that is closest to
46 the eye marker. The eye marker will contain the metadata for the
47 eye, and will be moved by its bound geometry. The dimensions of
48 the eye's camera are equal to the dimensions of the eye's "UV"
49 map.
51 #+name: eyes
52 #+begin_src clojure
53 (ns cortex.vision
54 "Simulate the sense of vision in jMonkeyEngine3. Enables multiple
55 eyes from different positions to observe the same world, and pass
56 the observed data to any arbitray function."
57 {:author "Robert McIntyre"}
58 (:use (cortex world sense util))
59 (:use clojure.contrib.def)
60 (:import com.jme3.post.SceneProcessor)
61 (:import (com.jme3.util BufferUtils Screenshots))
62 (:import java.nio.ByteBuffer)
63 (:import java.awt.image.BufferedImage)
64 (:import com.jme3.renderer.ViewPort)
65 (:import com.jme3.math.ColorRGBA)
66 (:import com.jme3.renderer.Renderer)
67 (:import com.jme3.scene.Node))
69 (cortex.import/mega-import-jme3)
(defn vision-pipeline
  "Build a SceneProcessor proxy around `continuation`.

  When the processor is initialized it records the RenderManager's
  Renderer and allocates a ByteBuffer of (* width height 4) bytes and a
  TYPE_4BYTE_ABGR BufferedImage, both sized from the ViewPort's camera.
  After every frame it clears the ByteBuffer and calls

    (continuation renderer frame-buffer byte-buffer buffered-image)

  reshape, preFrame, postQueue and cleanup do nothing."
  [continuation]
  (let [gpu-renderer (atom nil)
        pixel-bytes  (atom nil)
        frame-image  (atom nil)]
    (proxy [SceneProcessor] []
      (initialize [render-manager view-port]
        (let [eye-cam (.getCamera view-port)
              w       (.getWidth eye-cam)
              h       (.getHeight eye-cam)]
          (reset! gpu-renderer (.getRenderer render-manager))
          ;; four bytes are reserved for every pixel of the camera
          (reset! pixel-bytes (BufferUtils/createByteBuffer (* w h 4)))
          (reset! frame-image
                  (BufferedImage. w h BufferedImage/TYPE_4BYTE_ABGR))))

      ;; the ByteBuffer only exists once initialize has run
      (isInitialized [] (boolean @pixel-bytes))

      (reshape [_ _ _])
      (preFrame [_])
      (postQueue [_])

      (postFrame [^FrameBuffer fb]
        (.clear @pixel-bytes)
        (continuation @gpu-renderer fb @pixel-bytes @frame-image))

      (cleanup []))))
(defn frameBuffer->byteBuffer!
  "Have Renderer r read the contents of FrameBuffer fb into ByteBuffer
  bb (graphics card -> CPU), then return bb."
  [^Renderer r ^FrameBuffer fb ^ByteBuffer bb]
  (do
    (.readFrameBuffer r fb bb)
    bb))
(defn byteBuffer->bufferedImage!
  "Run Screenshots/convertScreenShot on ByteBuffer bb (C-style BGRA
  data) so that BufferedImage bi receives the AWT-style ABGR image,
  then return bi."
  [^ByteBuffer bb ^BufferedImage bi]
  (do
    (Screenshots/convertScreenShot bb bi)
    bi))
(defn BufferedImage!
  "Continuation for (vision-pipeline): copies the frame buffer into bb,
  converts bb into bi, and returns bi."
  [^Renderer r ^FrameBuffer fb ^ByteBuffer bb ^BufferedImage bi]
  (-> (frameBuffer->byteBuffer! r fb bb)
      (byteBuffer->bufferedImage! bi)))
(defn add-camera!
  "Add a camera to the world, calling continuation on every frame
  produced.

  Creates a main view named \"eye-view\" for `camera` on the world's
  RenderManager, clears color/depth/stencil each frame, sets a black
  background, installs a (vision-pipeline continuation) processor and
  attaches the world's root node as the scene.

  Returns the newly created ViewPort."
  [^Application world camera continuation]
  (doto (.createMainView (.getRenderManager world) "eye-view" camera)
    (.setClearFlags true true true)
    (.setBackgroundColor ColorRGBA/Black)
    (.addProcessor (vision-pipeline continuation))
    (.attachScene (.getRootNode world))))
(defn retina-sensor-profile
  "Read the \"eye\" metadata string attached to `eye`, read and evaluate
  it as Clojure data (expected to be a map), and return that map with
  load-image applied to every value. vision-fn looks each key of the
  result up in `presets` to obtain the color mask for that image.

  Returns nil when the eye has no \"eye\" metadata."
  [^Spatial eye]
  (when-let [profile-source (meta-data eye "eye")]
    ;; NOTE(review): the metadata string goes through eval, so whatever
    ;; code is stored in the model file will be executed here.
    (let [profile (eval (read-string profile-source))]
      (map-vals load-image profile))))
(defn eye-dimensions
  "Returns [width, height] for the eye: the largest width and the
  largest height found among the images of its retina-sensor-profile."
  [^Spatial eye]
  (let [retina-images (vals (retina-sensor-profile eye))
        widths        (map #(.getWidth %) retina-images)
        heights       (map #(.getHeight %) retina-images)]
    [(apply max widths)
     (apply max heights)]))
;; Built by (sense-nodes "eyes"); the docstring and arglists are attached
;; as var metadata, which is what the three-argument defvar expands to.
(def
  ^{:arglists '([creature])
    :doc "Return the children of the creature's \"eyes\" node."}
  eyes
  (sense-nodes "eyes"))
(defn add-eye!
  "Create a Camera sized by (eye-dimensions eye), placed at the world
  translation and rotation of `eye`, with a 45 degree perspective
  frustum (near 1, far 1000) whose aspect ratio is the camera's
  width / height. The camera is bound with bind-sense to the node of
  `creature` returned by (closest-node creature eye).

  Returns the Camera."
  [^Node creature ^Spatial eye]
  (let [anchor (closest-node creature eye)
        [w h]  (eye-dimensions eye)
        cam    (Camera. w h)]
    (doto cam
      (.setLocation (.getWorldTranslation eye))
      (.setRotation (.getWorldRotation eye))
      (.setFrustumPerspective
       45 (/ (.getWidth cam) (.getHeight cam))
       1 1000))
    (bind-sense anchor cam)
    cam))
;; Bit masks keyed by channel name. vision-fn looks a retina-profile key
;; up here and bit-ands the mask with the integer returned by .getRGB.
(def presets
  {:red   0xFF0000
   :green 0x00FF00
   :blue  0x0000FF
   :all   0xFFFFFF})
(defn vision-fn
  "Returns a vector of sensor functions for `eye`, one per entry of the
  eye's retina-sensor-profile. Each sensor function takes the running
  `world` and returns [topology sensor-data]:

    topology    - (vec (collapse whites)), where whites is
                  (white-coordinates image) for that entry's image
    sensor-data - for every [x y] in whites, the pixel of the most
                  recently captured image masked with (presets key)

  The first call to any of the returned functions registers the eye's
  camera with the world (via runonce); until a frame has been captured
  the data is read from a blank image of the camera's size.

  Options:
    :skip n - capture only every (n+1)th rendered frame; the default 0
              captures every frame."
  [^Node creature ^Spatial eye & {skip :skip :or {skip 0}}]
  (let [retinal-map (retina-sensor-profile eye)
        camera (add-eye! creature eye)
        ;; placeholder image that is sampled before the first capture
        vision-image
        (atom
         (BufferedImage. (.getWidth camera)
                         (.getHeight camera)
                         BufferedImage/TYPE_BYTE_BINARY))
        register-eye!
        (runonce
         (fn [world]
           (add-camera!
            world camera
            (let [counter (atom 0)]
              (fn [r fb bb bi]
                ;; counter starts at 1, so with skip = 0 every frame is
                ;; captured
                (when (zero? (rem (swap! counter inc) (inc skip)))
                  (reset! vision-image
                          (BufferedImage! r fb bb bi))))))))]
    (vec
     (map
      (fn [[key image]]
        (let [whites (white-coordinates image)
              topology (vec (collapse whites))
              mask (presets key)]
          (fn [world]
            (register-eye! world)
            ;; Dereference once per reading so every pixel of this
            ;; sample comes from the same image reference.
            (let [frame @vision-image]
              [topology
               (vec
                (for [[x y] whites]
                  (bit-and mask (.getRGB frame x y))))]))))
      retinal-map))))
226 ;; TODO maybe should add a viewport-manipulation function to
227 ;; automatically change viewport settings, attach shadow filters, etc.
(defn vision!
  "Returns a sequence of sensor functions, gathered from (vision-fn
  creature eye) for every eye in (eyes creature). Each function returns
  visual sensory data when called inside a running simulation.

  Options:
    :skip n - forwarded to vision-fn for every eye; default 0."
  [^Node creature & {skip :skip :or {skip 0}}]
  (reduce
   concat
   (for [eye (eyes creature)]
     ;; forward :skip -- previously it was accepted here but never
     ;; reached vision-fn, so it had no effect
     (vision-fn creature eye :skip skip))))
238 #+end_src
241 Note the use of continuation passing style for connecting the eye to a
242 function to process the output. You can create any number of eyes, and
243 each of them will see the world from their own =Camera=. Once every
244 frame, the rendered image is copied to a =BufferedImage=, and that
245 data is sent off to the continuation function. Moving the =Camera=
246 which was used to create the eye will change what the eye sees.
248 * Example
250 #+name: test-vision
251 #+begin_src clojure
252 (ns cortex.test.vision
253 (:use (cortex world util vision))
254 (:import java.awt.image.BufferedImage)
255 (:import javax.swing.JPanel)
256 (:import javax.swing.SwingUtilities)
257 (:import java.awt.Dimension)
258 (:import javax.swing.JFrame)
259 (:import com.jme3.math.ColorRGBA)
260 (:import com.jme3.scene.Node)
261 (:import com.jme3.math.Vector3f))
(defn test-two-eyes
  "Testing vision:
   Tests the vision system by creating two views of the same rotating
   object from different angles and displaying both of those views in
   JFrames.

   You should see a rotating cube, and two windows,
   each displaying a different view of the cube."
  []
  (let [candy
        (box 1 1 1 :physical? false :color ColorRGBA/Blue)]
    (world
     (doto (Node.)
       (.attachChild candy))
     {}
     (fn [world]
       (let [cam (.clone (.getCamera world))]
         ;; first eye: a copy of the main camera
         (add-camera! world cam
                      (comp (view-image) BufferedImage!))
         ;; second eye: placed at (-10, 0, 0) and aimed at the origin
         (add-camera! world
                      (doto (.clone cam)
                        (.setLocation (Vector3f. -10 0 0))
                        (.lookAt Vector3f/ZERO Vector3f/UNIT_Y))
                      (comp (view-image) BufferedImage!))
         ;; This is here to restore the main view
         ;; after the other views have completed processing
         (add-camera! world (.getCamera world) no-op)))
     (fn [world tpf]
       (.rotate candy (* tpf 0.2) 0 0)))))
297 #+end_src
299 #+results: test-vision
300 : #'cortex.test.vision/test-two-eyes
302 The example code will create two videos of the same rotating object
303 from different angles. It can be used either for stereoscopic vision
304 simulation or for simulating multiple creatures, each with their own
305 sense of vision.
307 - As a neat bonus, this idea behind simulated vision also enables one
308 to [[../../cortex/html/capture-video.html][capture live video feeds from jMonkeyEngine]].
311 * COMMENT code generation
312 #+begin_src clojure :tangle ../src/cortex/vision.clj
313 <<eyes>>
314 #+end_src
316 #+begin_src clojure :tangle ../src/cortex/test/vision.clj
317 <<test-vision>>
318 #+end_src