Skip to content
This repository was archived by the owner on Mar 21, 2024. It is now read-only.

Commit fec2e20

Browse files
committed
Updated HTML docgen and Kepler reduction tuning
Former-commit-id: 448cc6d
1 parent 9b1febf commit fec2e20

File tree

276 files changed

+790
-450
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

276 files changed

+790
-450
lines changed

cub/device/device_reduce.cuh

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -178,11 +178,11 @@ struct DeviceReduceDispatch
178178
/// SM35
179179
struct Policy350
180180
{
181-
// ReduceRegionPolicy1B (GTX Titan: 206.0 GB/s @ 192M 1B items)
181+
// ReduceRegionPolicy1B (GTX Titan: 228.7 GB/s @ 192M 1B items)
182182
typedef BlockReduceRegionPolicy<
183183
128, ///< Threads per thread block
184-
12, ///< Items per thread per tile of input
185-
1, ///< Number of items per vectorized load
184+
24, ///< Items per thread per tile of input
185+
4, ///< Number of items per vectorized load
186186
BLOCK_REDUCE_RAKING, ///< Cooperative block-wide reduction algorithm to use
187187
LOAD_LDG, ///< Cache load modifier
188188
GRID_MAPPING_DYNAMIC> ///< How to map tiles of input onto thread blocks
@@ -193,14 +193,14 @@ struct DeviceReduceDispatch
193193
ITEMS_PER_THREAD = CUB_MIN(NOMINAL_4B_ITEMS_PER_THREAD, CUB_MAX(1, (NOMINAL_4B_ITEMS_PER_THREAD * 4 / sizeof(T)))),
194194
};
195195

196-
// ReduceRegionPolicy4B (GTX Titan: 254.2 GB/s @ 48M 4B items)
196+
// ReduceRegionPolicy4B (GTX Titan: 255.1 GB/s @ 48M 4B items)
197197
typedef BlockReduceRegionPolicy<
198-
512, ///< Threads per thread block
198+
256, ///< Threads per thread block
199199
ITEMS_PER_THREAD, ///< Items per thread per tile of input
200-
1, ///< Number of items per vectorized load
200+
2, ///< Number of items per vectorized load
201201
BLOCK_REDUCE_RAKING, ///< Cooperative block-wide reduction algorithm to use
202-
LOAD_DEFAULT, ///< Cache load modifier
203-
GRID_MAPPING_EVEN_SHARE> ///< How to map tiles of input onto thread blocks
202+
LOAD_LDG, ///< Cache load modifier
203+
GRID_MAPPING_DYNAMIC> ///< How to map tiles of input onto thread blocks
204204
ReduceRegionPolicy4B;
205205

206206
// ReduceRegionPolicy

docs/html/CHANGE_LOG.TXT

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
//-----------------------------------------------------------------------------
22

3-
1.1.0 12/10/2013
3+
1.1.1 12/11/2013
44
- New features:
55
- Added TexObjInputIterator, TexRefInputIterator, CacheModifiedInputIterator, and CacheModifiedOutputIterator types for loading & storing arbitrary types through the cache hierarchy. Compatible with Thrust API.
66
- Added descending sorting to DeviceRadixSort and BlockRadixSort

docs/html/annotated.html

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -149,7 +149,7 @@
149149
</div>
150150
</td></tr>
151151
<tr id="row_0_33_0_"><td class="entry"><img src="ftv2blank.png" alt="&#160;" width="16" height="22" /><img src="ftv2vertline.png" alt="|" width="16" height="22" /><img src="ftv2lastnode.png" alt="\" width="16" height="22" /><img src="ftv2cl.png" alt="C" width="24" height="22" /><a class="el" href="structcub_1_1_block_histogram_1_1_temp_storage.html" target="_self">TempStorage</a></td><td class="desc">The operations exposed by <a class="el" href="classcub_1_1_block_histogram.html" title="The BlockHistogram class provides collective methods for constructing block-wide histograms from data...">BlockHistogram</a> require a temporary memory allocation of this nested type for thread communication. This opaque storage can be allocated directly using the <code>__shared__</code> keyword. Alternatively, it can be aliased to externally allocated memory (shared or global) or <code>union</code>'d with other storage allocation types to facilitate memory reuse </td></tr>
152-
<tr id="row_0_34_" class="even"><td class="entry"><img src="ftv2blank.png" alt="&#160;" width="16" height="22" /><img id="arr_0_34_" src="ftv2mnode.png" alt="o" width="16" height="22" onclick="toggleFolder('0_34_')"/><img src="ftv2cl.png" alt="C" width="24" height="22" /><a class="el" href="classcub_1_1_block_load.html" target="_self">BlockLoad</a></td><td class="desc">The <a class="el" href="classcub_1_1_block_load.html" title="The BlockLoad class provides collective data movement methods for loading a linear segment of items f...">BlockLoad</a> class provides <a href="index.html#sec0"><em>collective</em></a> data movement methods for loading a linear segment of items from memory into a <a href="index.html#sec5sec4"><em>blocked arrangement</em></a> across a CUDA thread block. </p>
152+
<tr id="row_0_34_" class="even"><td class="entry"><img src="ftv2blank.png" alt="&#160;" width="16" height="22" /><img id="arr_0_34_" src="ftv2mnode.png" alt="o" width="16" height="22" onclick="toggleFolder('0_34_')"/><img src="ftv2cl.png" alt="C" width="24" height="22" /><a class="el" href="classcub_1_1_block_load.html" target="_self">BlockLoad</a></td><td class="desc">The <a class="el" href="classcub_1_1_block_load.html" title="The BlockLoad class provides collective data movement methods for loading a linear segment of items f...">BlockLoad</a> class provides <a href="index.html#sec0"><em>collective</em></a> data movement methods for loading a linear segment of items from memory into a <a href="index.html#sec4sec3"><em>blocked arrangement</em></a> across a CUDA thread block. </p>
153153
<div class="image">
154154
<img src="block_load_logo.png" alt="block_load_logo.png"/>
155155
</div>
@@ -173,7 +173,7 @@
173173
</div>
174174
</td></tr>
175175
<tr id="row_0_37_0_"><td class="entry"><img src="ftv2blank.png" alt="&#160;" width="16" height="22" /><img src="ftv2vertline.png" alt="|" width="16" height="22" /><img src="ftv2lastnode.png" alt="\" width="16" height="22" /><img src="ftv2cl.png" alt="C" width="24" height="22" /><a class="el" href="structcub_1_1_block_scan_1_1_temp_storage.html" target="_self">TempStorage</a></td><td class="desc">The operations exposed by <a class="el" href="classcub_1_1_block_scan.html" title="The BlockScan class provides collective methods for computing a parallel prefix sum/scan of items par...">BlockScan</a> require a temporary memory allocation of this nested type for thread communication. This opaque storage can be allocated directly using the <code>__shared__</code> keyword. Alternatively, it can be aliased to externally allocated memory (shared or global) or <code>union</code>'d with other storage allocation types to facilitate memory reuse </td></tr>
176-
<tr id="row_0_38_" class="even"><td class="entry"><img src="ftv2blank.png" alt="&#160;" width="16" height="22" /><img id="arr_0_38_" src="ftv2mnode.png" alt="o" width="16" height="22" onclick="toggleFolder('0_38_')"/><img src="ftv2cl.png" alt="C" width="24" height="22" /><a class="el" href="classcub_1_1_block_store.html" target="_self">BlockStore</a></td><td class="desc">The <a class="el" href="classcub_1_1_block_store.html" title="The BlockStore class provides collective data movement methods for writing a blocked arrangement of i...">BlockStore</a> class provides <a href="index.html#sec0"><em>collective</em></a> data movement methods for writing a <a href="index.html#sec5sec4"><em>blocked arrangement</em></a> of items partitioned across a CUDA thread block to a linear segment of memory. </p>
176+
<tr id="row_0_38_" class="even"><td class="entry"><img src="ftv2blank.png" alt="&#160;" width="16" height="22" /><img id="arr_0_38_" src="ftv2mnode.png" alt="o" width="16" height="22" onclick="toggleFolder('0_38_')"/><img src="ftv2cl.png" alt="C" width="24" height="22" /><a class="el" href="classcub_1_1_block_store.html" target="_self">BlockStore</a></td><td class="desc">The <a class="el" href="classcub_1_1_block_store.html" title="The BlockStore class provides collective data movement methods for writing a blocked arrangement of i...">BlockStore</a> class provides <a href="index.html#sec0"><em>collective</em></a> data movement methods for writing a <a href="index.html#sec4sec3"><em>blocked arrangement</em></a> of items partitioned across a CUDA thread block to a linear segment of memory. </p>
177177
<div class="image">
178178
<img src="block_store_logo.png" alt="block_store_logo.png"/>
179179
</div>
@@ -227,7 +227,7 @@
227227
<!-- HTML footer for doxygen 1.8.3.1-->
228228
<!-- start footer part -->
229229
<hr class="footer"/><address class="footer"><small>
230-
Generated on Tue Dec 10 2013 04:41:10 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
230+
Generated on Wed Dec 11 2013 07:19:22 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
231231
<img class="footer" src="doxygen.png" alt="doxygen"/>
232232
</a> 1.8.4
233233
<br>

docs/html/arg__index__input__iterator_8cuh.html

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -135,7 +135,7 @@
135135
<!-- HTML footer for doxygen 1.8.3.1-->
136136
<!-- start footer part -->
137137
<hr class="footer"/><address class="footer"><small>
138-
Generated on Tue Dec 10 2013 04:41:07 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
138+
Generated on Wed Dec 11 2013 07:19:20 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
139139
<img class="footer" src="doxygen.png" alt="doxygen"/>
140140
</a> 1.8.4
141141
<br>

docs/html/arg__index__input__iterator_8cuh_source.html

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -281,7 +281,7 @@
281281
<!-- HTML footer for doxygen 1.8.3.1-->
282282
<!-- start footer part -->
283283
<hr class="footer"/><address class="footer"><small>
284-
Generated on Tue Dec 10 2013 04:41:06 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
284+
Generated on Wed Dec 11 2013 07:19:19 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
285285
<img class="footer" src="doxygen.png" alt="doxygen"/>
286286
</a> 1.8.4
287287
<br>

docs/html/block__discontinuity_8cuh.html

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -137,7 +137,7 @@
137137
<!-- HTML footer for doxygen 1.8.3.1-->
138138
<!-- start footer part -->
139139
<hr class="footer"/><address class="footer"><small>
140-
Generated on Tue Dec 10 2013 04:41:07 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
140+
Generated on Wed Dec 11 2013 07:19:20 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
141141
<img class="footer" src="doxygen.png" alt="doxygen"/>
142142
</a> 1.8.4
143143
<br>

docs/html/block__discontinuity_8cuh_source.html

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -398,7 +398,7 @@
398398
<!-- HTML footer for doxygen 1.8.3.1-->
399399
<!-- start footer part -->
400400
<hr class="footer"/><address class="footer"><small>
401-
Generated on Tue Dec 10 2013 04:41:06 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
401+
Generated on Wed Dec 11 2013 07:19:19 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
402402
<img class="footer" src="doxygen.png" alt="doxygen"/>
403403
</a> 1.8.4
404404
<br>

docs/html/block__exchange_8cuh.html

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -139,7 +139,7 @@
139139
<!-- HTML footer for doxygen 1.8.3.1-->
140140
<!-- start footer part -->
141141
<hr class="footer"/><address class="footer"><small>
142-
Generated on Tue Dec 10 2013 04:41:07 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
142+
Generated on Wed Dec 11 2013 07:19:20 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
143143
<img class="footer" src="doxygen.png" alt="doxygen"/>
144144
</a> 1.8.4
145145
<br>
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
929acf0309668d0996d5fca70aaa85a4a4346c5c
1+
fe0e2875731d5335ee1a074b01fcfd03637fe2f8

docs/html/block__histogram_8cuh.html

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -148,7 +148,7 @@
148148
<!-- HTML footer for doxygen 1.8.3.1-->
149149
<!-- start footer part -->
150150
<hr class="footer"/><address class="footer"><small>
151-
Generated on Tue Dec 10 2013 04:41:07 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
151+
Generated on Wed Dec 11 2013 07:19:20 for CUB by &#160;<a href="http://www.doxygen.org/index.html">
152152
<img class="footer" src="doxygen.png" alt="doxygen"/>
153153
</a> 1.8.4
154154
<br>

0 commit comments

Comments
 (0)